From 1596f6f414f6f41da66506debb1dff19fffeb3ec Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: Mon, 24 Jun 2024 11:55:17 +0800
Subject: [PATCH] Fix hotwords bug in seaco_paraformer template
---
funasr/models/seaco_paraformer/template.yaml | 9 +++++++--
1 file changed, 7 insertions(+), 2 deletions(-)
diff --git a/funasr/models/seaco_paraformer/template.yaml b/funasr/models/seaco_paraformer/template.yaml
index 52654ac..fcaf524 100644
--- a/funasr/models/seaco_paraformer/template.yaml
+++ b/funasr/models/seaco_paraformer/template.yaml
@@ -68,13 +68,18 @@
use_output_layer: false
wo_input_layer: true
-predictor: CifPredictorV2
+predictor: CifPredictorV3
predictor_conf:
idim: 512
threshold: 1.0
l_order: 1
r_order: 1
tail_threshold: 0.45
+ smooth_factor2: 0.25
+ noise_threshold2: 0.01
+ upsample_times: 3
+ use_cif1_cnn: false
+ upsample_type: cnn_blstm
# frontend related
frontend: WavFrontend
@@ -129,7 +134,7 @@
dataset: AudioDataset
dataset_conf:
index_ds: IndexDSJsonl
- batch_sampler: DynamicBatchLocalShuffleSampler
+ batch_sampler: BatchSampler
batch_type: example # example or length
batch_size: 1 # if batch_type is example, batch_size is the numbers of samples; if length, batch_size is source_token_len+target_token_len;
max_token_length: 2048 # filter samples if source_token_len+target_token_len > max_token_length,
--
Gitblit v1.9.1