egs_modelscope/vad/speech_fsmn_vad_zh-cn-8k-common/infer.py
@@ -7,8 +7,8 @@
 inference_pipline = pipeline(
     task=Tasks.voice_activity_detection,
     model="damo/speech_fsmn_vad_zh-cn-8k-common",
-    model_revision=None,
-    output_dir='./output_dir',
+    model_revision='v1.2.0',
+    output_dir=output_dir,
     batch_size=1,
 )
 segments_result = inference_pipline(audio_in=audio_in)