From f479f94832ce6ca0d381ed3d8e53675dea24a6ec Mon Sep 17 00:00:00 2001
From: 北念 <lzr265946@alibaba-inc.com>
Date: Thu, 02 Nov 2023 16:35:10 +0800
Subject: [PATCH] fix paraformer-16k-en finetune pipeline
---
funasr/bin/build_trainer.py | 6 ++++++
1 file changed, 6 insertions(+), 0 deletions(-)
diff --git a/funasr/bin/build_trainer.py b/funasr/bin/build_trainer.py
index dc295d8..61af766 100644
--- a/funasr/bin/build_trainer.py
+++ b/funasr/bin/build_trainer.py
@@ -548,6 +548,7 @@
init_param = modelscope_dict['init_model']
cmvn_file = modelscope_dict['cmvn_file']
seg_dict_file = modelscope_dict['seg_dict']
+ bpemodel = modelscope_dict['bpemodel']
# overwrite parameters
with open(config) as f:
@@ -581,6 +582,10 @@
args.seg_dict_file = seg_dict_file
else:
args.seg_dict_file = None
+ if os.path.exists(bpemodel):
+ args.bpemodel = bpemodel
+ else:
+ args.bpemodel = None
args.data_dir = data_dir
args.train_set = train_set
args.dev_set = dev_set
@@ -614,6 +619,7 @@
if batch_bins is not None:
if args.dataset_type == "small":
args.batch_bins = batch_bins
+ args.dataset_conf["batch_conf"]["batch_size"] = batch_bins
elif args.dataset_type == "large":
args.dataset_conf["batch_conf"]["batch_size"] = batch_bins
else:
--
Gitblit v1.9.1