From cc2c1d1d53dea5d2c45f858d1baa5bd279f47987 Mon Sep 17 00:00:00 2001
From: nichongjia-2007 <nichongjia@gmail.com>
Date: Wed, 31 May 2023 14:39:25 +0800
Subject: [PATCH] Merge branch 'main' of https://github.com/alibaba-damo-academy/FunASR

---
 egs/aishell2/paraformerbert/conf/train_asr_paraformerbert_conformer_20e_6d_1280_320.yaml |   29 ++++++++++++++++++++---------
 1 file changed, 20 insertions(+), 9 deletions(-)

diff --git a/egs/aishell2/paraformerbert/conf/train_asr_paraformerbert_conformer_20e_6d_1280_320.yaml b/egs/aishell2/paraformerbert/conf/train_asr_paraformerbert_conformer_20e_6d_1280_320.yaml
index 19f123e..8968d2d 100644
--- a/egs/aishell2/paraformerbert/conf/train_asr_paraformerbert_conformer_20e_6d_1280_320.yaml
+++ b/egs/aishell2/paraformerbert/conf/train_asr_paraformerbert_conformer_20e_6d_1280_320.yaml
@@ -29,6 +29,17 @@
     self_attention_dropout_rate: 0.0
     src_attention_dropout_rate: 0.0
 
+# frontend related
+frontend: wav_frontend
+frontend_conf:
+    fs: 16000
+    window: hamming
+    n_mels: 80
+    frame_length: 25
+    frame_shift: 10
+    lfr_m: 1
+    lfr_n: 1
+
 # hybrid CTC/attention
 model: paraformer_bert
 model_conf:
@@ -36,7 +47,7 @@
     lsm_weight: 0.1     # label smoothing option
     length_normalized_loss: false
     predictor_weight: 1.0
-    glat_context_p: 0.4
+    sampling_ratio: 0.4
     embeds_id: 3
     embed_dims: 768
     embeds_loss_weight: 2.0
@@ -45,7 +56,7 @@
 accum_grad: 2
 grad_clip: 5
 patience: none
-max_epoch: 50
+max_epoch: 150
 val_scheduler_criterion:
     - valid
     - acc
@@ -78,24 +89,24 @@
     - 40
     num_time_mask: 2
 
-predictor: cif_predictor_sanm
+predictor: cif_predictor
 predictor_conf:
   idim: 320
   threshold: 1.0
   l_order: 1
   r_order: 1
 
-log_interval: 50
-normalize: None
-
 dataset_conf:
     data_names: speech,text,embed
-    data_types: kaldi_ark,text,kaldi_ark
+    data_types: sound,text,kaldi_ark
     shuffle: True
     shuffle_conf:
-        shuffle_size: 10240
+        shuffle_size: 2048
         sort_size: 500
     batch_conf:
         batch_type: token
         batch_size: 25000
-    num_workers: 8
\ No newline at end of file
+    num_workers: 8
+
+log_interval: 50
+normalize: None
\ No newline at end of file

--
Gitblit v1.9.1