From 23e7ddebccd3b05cf7ef89809bcfe565ad6dfa1f Mon Sep 17 00:00:00 2001
From: majic31 <majic31@163.com>
Date: 星期二, 24 十二月 2024 10:00:14 +0800
Subject: [PATCH] Fix the variable name (#2328)
---
examples/industrial_data_pretraining/fsmn_kws_mt/finetune.sh | 12 +++++-------
1 files changed, 5 insertions(+), 7 deletions(-)
diff --git a/examples/industrial_data_pretraining/fsmn_kws_mt/finetune.sh b/examples/industrial_data_pretraining/fsmn_kws_mt/finetune.sh
index 1e87021..56162d7 100755
--- a/examples/industrial_data_pretraining/fsmn_kws_mt/finetune.sh
+++ b/examples/industrial_data_pretraining/fsmn_kws_mt/finetune.sh
@@ -27,19 +27,19 @@
# model_name from model_hub, or model_dir in local path
## option 1, download model automatically, unsupported currently
-model_name_or_model_dir="iic/speech_charctc_kws_phone-xiaoyun"
+model_name_or_model_dir="iic/speech_charctc_kws_phone-xiaoyun_mt"
## option 2, download model by git
local_path_root=${workspace}/modelscope_models
model_name_or_model_dir=${local_path_root}/${model_name_or_model_dir}
if [ ! -d $model_name_or_model_dir ]; then
mkdir -p ${model_name_or_model_dir}
- git clone https://www.modelscope.cn/iic/speech_charctc_kws_phone-xiaoyun.git ${model_name_or_model_dir}
+ git clone https://www.modelscope.cn/iic/speech_charctc_kws_phone-xiaoyun_mt.git ${model_name_or_model_dir}
fi
config=fsmn_4e_l10r2_250_128_fdim80_t2599_t4.yaml
token_list=${model_name_or_model_dir}/funasr/tokens_2599.txt
-token_list2=${model_name_or_model_dir}/funasr/tokens_xiaoyun_char.txt
+token_list2=${model_name_or_model_dir}/funasr/tokens_xiaoyun.txt
lexicon_list=${model_name_or_model_dir}/funasr/lexicon.txt
cmvn_file=${model_name_or_model_dir}/funasr/am.mvn.dim80_l2r2
init_param="${model_name_or_model_dir}/funasr/basetrain_fsmn_4e_l10r2_250_128_fdim80_t2599.pt"
@@ -141,10 +141,8 @@
--config-path="${output_dir}" \
--config-name="config.yaml" \
++init_param="${output_dir}/${inference_checkpoint}" \
- ++tokenizer_conf.token_list="${token_list}" \
- ++tokenizer_conf.seg_dict="${lexicon_list}" \
- ++tokenizer2_conf.token_list="${token_list2}" \
- ++tokenizer2_conf.seg_dict="${lexicon_list}" \
+ ++token_lists='['''${token_list}''', '''${token_list2}''']' \
+ ++seg_dicts='['''${lexicon_list}''', '''${lexicon_list}''']' \
++frontend_conf.cmvn_file="${cmvn_file}" \
++keywords="\"$keywords_string"\" \
++input="${_logdir}/keys.${JOB}.scp" \
--
Gitblit v1.9.1