examples/industrial_data_pretraining/sense_voice/demo.py
@@ -7,8 +7,8 @@ model = AutoModel( model="/Users/zhifu/Downloads/modelscope_models/SenseVoiceModelscope", vad_model="iic/speech_fsmn_vad_zh-cn-16k-common-pytorch", vad_kwargs={"max_single_segment_time": 30000}, # vad_model="iic/speech_fsmn_vad_zh-cn-16k-common-pytorch", # vad_kwargs={"max_single_segment_time": 30000}, ) @@ -21,6 +21,7 @@ "language": "auto", "fp16": True, "gain_event": True, "beam_size": 5, } res = model.generate(input=input_wav, batch_size_s=0, DecodingOptions=DecodingOptions)