From 3c3754dcc7568e76fa7d4b2c4e14849f68cc6ee7 Mon Sep 17 00:00:00 2001
From: 嘉渊 <wangjiaming.wjm@alibaba-inc.com>
Date: Sun, 28 May 2023 23:46:01 +0800
Subject: [PATCH] wenetspeech/conformer: default to stage 3, re-enable local/data.sh, use large dataset type

---
 egs/wenetspeech/conformer/run.sh |    5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/egs/wenetspeech/conformer/run.sh b/egs/wenetspeech/conformer/run.sh
index 326440f..3d1d9ec 100644
--- a/egs/wenetspeech/conformer/run.sh
+++ b/egs/wenetspeech/conformer/run.sh
@@ -20,7 +20,7 @@
 type=sound
 scp=wav.scp
 speed_perturb="0.9 1.0 1.1"
-stage=0
+stage=3
 stop_stage=5
 
 # feature configuration
@@ -72,7 +72,7 @@
 if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ]; then
     echo "stage 0: Data preparation"
     # Data preparation
-#    local/data.sh --set ${set} --nj $nj --data_dir $feats_dir --WENETSPEECH $raw_data --train_cmd $train_cmd
+    local/data.sh --set ${set} --nj $nj --data_dir $feats_dir --WENETSPEECH $raw_data --train_cmd $train_cmd
     mkdir $feats_dir/data
     mv $feats_dir/$train_set $feats_dir/data/$train_set
     for x in $test_sets; do
@@ -129,6 +129,7 @@
                 --use_preprocessor true \
                 --token_type $token_type \
                 --token_list $token_list \
+                --dataset_type large \
                 --data_dir ${feats_dir}/data \
                 --train_set ${train_set} \
                 --valid_set ${valid_set} \

--
Gitblit v1.9.1