From f479f94832ce6ca0d381ed3d8e53675dea24a6ec Mon Sep 17 00:00:00 2001
From: 北念 <lzr265946@alibaba-inc.com>
Date: Thu, 02 Nov 2023 16:35:10 +0800
Subject: [PATCH] fix paraformer-16k-en finetune pipeline
---
egs_modelscope/vad/TEMPLATE/README.md | 4 ++--
1 file changed, 2 insertions(+), 2 deletions(-)
diff --git a/egs_modelscope/vad/TEMPLATE/README.md b/egs_modelscope/vad/TEMPLATE/README.md
index 3539b3d..2651dce 100644
--- a/egs_modelscope/vad/TEMPLATE/README.md
+++ b/egs_modelscope/vad/TEMPLATE/README.md
@@ -24,7 +24,7 @@
#### [FSMN-VAD-online model](https://modelscope.cn/models/damo/speech_fsmn_vad_zh-cn-16k-common-pytorch/summary)
```python
inference_pipeline = pipeline(
- task=Tasks.auto_speech_recognition,
+ task=Tasks.voice_activity_detection,
model='damo/speech_fsmn_vad_zh-cn-16k-common-pytorch',
)
import soundfile
@@ -36,7 +36,7 @@
speech_chunk = speech[0:chunk_stride]
rec_result = inference_pipeline(audio_in=speech_chunk, param_dict=param_dict)
print(rec_result)
-# next chunk, 480ms
+# next chunk, 100ms
speech_chunk = speech[chunk_stride:chunk_stride+chunk_stride]
rec_result = inference_pipeline(audio_in=speech_chunk, param_dict=param_dict)
print(rec_result)
--
Gitblit v1.9.1