From f479f94832ce6ca0d381ed3d8e53675dea24a6ec Mon Sep 17 00:00:00 2001
From: 北念 <lzr265946@alibaba-inc.com>
Date: Thu, 02 Nov 2023 16:35:10 +0800
Subject: [PATCH] fix paraformer-16k-en finetune pipeline

---
 funasr/bin/asr_inference_launch.py |   11 +++++++++--
 1 file changed, 9 insertions(+), 2 deletions(-)

diff --git a/funasr/bin/asr_inference_launch.py b/funasr/bin/asr_inference_launch.py
index e3de05b..04ddd92 100644
--- a/funasr/bin/asr_inference_launch.py
+++ b/funasr/bin/asr_inference_launch.py
@@ -815,8 +815,7 @@
         format="%(asctime)s (%(module)s:%(lineno)d) %(levelname)s: %(message)s",
     )
 
-    if sv_model_file is None:
-        sv_model_file = "{}/damo/speech_paraformer-large-vad-punc-spk_asr_nat-zh-cn/campplus_cn_common.bin".format(get_cache_dir(None))
+    sv_model_file = asr_model_file.replace("model.pb", "campplus_cn_common.bin")
 
     if param_dict is not None:
         hotword_list_or_file = param_dict.get('hotword')
@@ -2056,6 +2055,12 @@
 
     ncpu = kwargs.get("ncpu", 1)
     torch.set_num_threads(ncpu)
+    if param_dict:
+        language = param_dict.get("language", None)
+        task = param_dict.get("task", "transcribe")
+    else:
+        language = None
+        task = "transcribe"
     if batch_size > 1:
         raise NotImplementedError("batch decoding is not implemented")
     if word_lm_train_config is not None:
@@ -2099,6 +2104,8 @@
         penalty=penalty,
         nbest=nbest,
         streaming=streaming,
+        language=language,
+        task=task,
     )
     logging.info("speech2text_kwargs: {}".format(speech2text_kwargs))
     speech2text = Speech2TextWhisper(**speech2text_kwargs)

--
Gitblit v1.9.1