游雁
2023-07-21 c542eacb0aadcbc49c63db40429fca4e08f807a4
egs_modelscope/vad/speech_fsmn_vad_zh-cn-8k-common/demo_online.py
@@ -7,11 +7,11 @@
import soundfile
if __name__ == '__main__':
    output_dir = None
    inference_pipline = pipeline(
    output_dir = "./results"
    inference_pipeline = pipeline(
        task=Tasks.voice_activity_detection,
        model="damo/speech_fsmn_vad_zh-cn-8k-common",
        model_revision='v1.2.0',
        model_revision=None,
        output_dir=output_dir,
        batch_size=1,
        mode='online',
@@ -30,7 +30,7 @@
        else:
            is_final = False
        param_dict['is_final'] = is_final
        segments_result = inference_pipline(audio_in=speech[sample_offset: sample_offset + step],
        segments_result = inference_pipeline(audio_in=speech[sample_offset: sample_offset + step],
                                            param_dict=param_dict)
        print(segments_result)