From 33d3d2084403fd34b79c835d2f2fe04f6cd8f738 Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: Wed, 13 Sep 2023 09:33:54 +0800
Subject: [PATCH] Merge branch 'main' of github.com:alibaba-damo-academy/FunASR add

---
 egs/wenetspeech/conformer/run.sh |   10 +++++-----
 1 file changed, 5 insertions(+), 5 deletions(-)

diff --git a/egs/wenetspeech/conformer/run.sh b/egs/wenetspeech/conformer/run.sh
index 326440f..db18361 100644
--- a/egs/wenetspeech/conformer/run.sh
+++ b/egs/wenetspeech/conformer/run.sh
@@ -20,7 +20,7 @@
 type=sound
 scp=wav.scp
 speed_perturb="0.9 1.0 1.1"
-stage=0
+stage=3
 stop_stage=5
 
 # feature configuration
@@ -72,7 +72,7 @@
 if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ]; then
     echo "stage 0: Data preparation"
     # Data preparation
-#    local/data.sh --set ${set} --nj $nj --data_dir $feats_dir --WENETSPEECH $raw_data --train_cmd $train_cmd
+    local/data.sh --set ${set} --nj $nj --data_dir $feats_dir --WENETSPEECH $raw_data --train_cmd $train_cmd
     mkdir $feats_dir/data
     mv $feats_dir/$train_set $feats_dir/data/$train_set
     for x in $test_sets; do
@@ -129,6 +129,7 @@
                 --use_preprocessor true \
                 --token_type $token_type \
                 --token_list $token_list \
+                --dataset_type large \
                 --data_dir ${feats_dir}/data \
                 --train_set ${train_set} \
                 --valid_set ${valid_set} \
@@ -157,8 +158,7 @@
         inference_tag="$(basename "${inference_config}" .yaml)"
         _dir="${asr_exp}/${inference_tag}/${inference_asr_model}/${dset}"
         _logdir="${_dir}/logdir"
-        if [ -d ${_dir} ]; then
-            echo "${_dir} is already exists. if you want to decode again, please delete this dir first."
+          you want to decode again, please delete this dir first."
             exit 0
         fi
         mkdir -p "${_logdir}"
@@ -215,7 +215,7 @@
         --am_model_name $inference_asr_model \
         --mode asr \
         --model_name conformer \
-        --dataset aishell \
+        --dataset wenetspeech \
         --output_dir $exp_dir/exp/$model_dir \
         --vocab_size $vocab_size \
         --tag $tag

--
Gitblit v1.9.1