From 4ace5a95b052d338947fc88809a440ccd55cf6b4 Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: 星期四, 16 十一月 2023 16:39:52 +0800
Subject: [PATCH] funasr pages
---
egs_modelscope/vad/TEMPLATE/README.md | 8 +++++---
1 files changed, 5 insertions(+), 3 deletions(-)
diff --git a/egs_modelscope/vad/TEMPLATE/README.md b/egs_modelscope/vad/TEMPLATE/README.md
index 945f9fa..2651dce 100644
--- a/egs_modelscope/vad/TEMPLATE/README.md
+++ b/egs_modelscope/vad/TEMPLATE/README.md
@@ -1,3 +1,5 @@
+([简体中文](./README_zh.md)|English)
+
# Voice Activity Detection
> **Note**:
@@ -22,7 +24,7 @@
#### [FSMN-VAD-online model](https://modelscope.cn/models/damo/speech_fsmn_vad_zh-cn-16k-common-pytorch/summary)
```python
inference_pipeline = pipeline(
- task=Tasks.auto_speech_recognition,
+ task=Tasks.voice_activity_detection,
model='damo/speech_fsmn_vad_zh-cn-16k-common-pytorch',
)
import soundfile
@@ -34,7 +36,7 @@
speech_chunk = speech[0:chunk_stride]
rec_result = inference_pipeline(audio_in=speech_chunk, param_dict=param_dict)
print(rec_result)
-# next chunk, 480ms
+# next chunk, 100ms
speech_chunk = speech[chunk_stride:chunk_stride+chunk_stride]
rec_result = inference_pipeline(audio_in=speech_chunk, param_dict=param_dict)
print(rec_result)
@@ -97,7 +99,7 @@
--data_dir "./data/test" \
--output_dir "./results" \
--gpu_inference false \
- --njob 1
+ --njob 64
```
## Finetune with pipeline
--
Gitblit v1.9.1