雾聪
2023-08-10 ffb05b9ae7eccc47416e9e7fae9dea54d400a245
egs_modelscope/vad/speech_fsmn_vad_zh-cn-16k-common/demo.py
@@ -3,13 +3,13 @@
if __name__ == '__main__':
    # Demo entry point: build the voice-activity-detection pipeline once,
    # run it on a single sample recording, and print what it returns.
    audio_in = 'https://isv-data.oss-cn-hangzhou.aliyuncs.com/ics/MaaS/ASR/test_audio/vad_example.wav'

    # Forwarded to the pipeline as ``output_dir``.
    # NOTE(review): presumably the directory results are written to --
    # confirm against the pipeline implementation.
    output_dir = "./results"

    inference_pipeline = pipeline(
        task=Tasks.voice_activity_detection,
        model="damo/speech_fsmn_vad_zh-cn-16k-common-pytorch",
        # No revision is pinned here.
        # NOTE(review): presumably this resolves to the hub's default
        # revision -- confirm before relying on reproducible results.
        model_revision=None,
        output_dir=output_dir,
        batch_size=1,
    )

    # Single inference call; the previous text also invoked a misspelled
    # ``inference_pipline`` alias, which ran the same work a second time.
    segments_result = inference_pipeline(audio_in=audio_in)
    print(segments_result)