From f479f94832ce6ca0d381ed3d8e53675dea24a6ec Mon Sep 17 00:00:00 2001
From: 北念 <lzr265946@alibaba-inc.com>
Date: Thu, 02 Nov 2023 16:35:10 +0800
Subject: [PATCH] fix paraformer-16k-en finetune pipeline
---
funasr/bin/asr_inference_launch.py | 11 +++++++++--
1 file changed, 9 insertions(+), 2 deletions(-)
diff --git a/funasr/bin/asr_inference_launch.py b/funasr/bin/asr_inference_launch.py
index e3de05b..04ddd92 100644
--- a/funasr/bin/asr_inference_launch.py
+++ b/funasr/bin/asr_inference_launch.py
@@ -815,8 +815,7 @@
format="%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s",
)
- if sv_model_file is None:
- sv_model_file = "{}/damo/speech_paraformer-large-vad-punc-spk_asr_nat-zh-cn/campplus_cn_common.bin".format(get_cache_dir(None))
+ sv_model_file = asr_model_file.replace("model.pb", "campplus_cn_common.bin")
if param_dict is not None:
hotword_list_or_file = param_dict.get('hotword')
@@ -2056,6 +2055,12 @@
ncpu = kwargs.get("ncpu", 1)
torch.set_num_threads(ncpu)
+ if param_dict:
+ language = param_dict.get("language", None)
+ task = param_dict.get("task", "transcribe")
+ else:
+ language = None
+ task = "transcribe"
if batch_size > 1:
raise NotImplementedError("batch decoding is not implemented")
if word_lm_train_config is not None:
@@ -2099,6 +2104,8 @@
penalty=penalty,
nbest=nbest,
streaming=streaming,
+ language=language,
+ task=task,
)
logging.info("speech2text_kwargs: {}".format(speech2text_kwargs))
speech2text = Speech2TextWhisper(**speech2text_kwargs)
--
Gitblit v1.9.1