From e0a8c4b00631ed636418f4280964e473f05d5002 Mon Sep 17 00:00:00 2001
From: hnluo <haoneng.lhn@alibaba-inc.com>
Date: Thu, 25 May 2023 11:08:46 +0800
Subject: [PATCH] Merge pull request #552 from alibaba-damo-academy/dev_wjm2

---
 egs/aishell/transformer/utils/compute_cmvn.sh |   32 +++++++++++++++++++++++++++-----
 1 file changed, 27 insertions(+), 5 deletions(-)

diff --git a/egs/aishell/transformer/utils/compute_cmvn.sh b/egs/aishell/transformer/utils/compute_cmvn.sh
index 7663df9..ad8813d 100755
--- a/egs/aishell/transformer/utils/compute_cmvn.sh
+++ b/egs/aishell/transformer/utils/compute_cmvn.sh
@@ -2,15 +2,33 @@
 
 . ./path.sh || exit 1;
 # Begin configuration section.
+# Data directory containing wav.scp. Seeded from $1 so the variable exists
+# before option parsing; re-read from the remaining arguments further down.
+fbankdir=$1
 nj=32
 cmd=./utils/run.pl
 feats_dim=80
+# Value forwarded to utils/compute_cmvn.py as --config (omitted when empty).
+# NOTE(review): stock Kaldi parse_options.sh sources the file named by --config
+# as shell; confirm utils/parse_options.sh here does not, or rename the option.
+config=
+# Fraction of wav.scp, counted from the top, that is used for the statistics.
+scale=1.0
 
 echo "$0 $@"
 
 . utils/parse_options.sh || exit 1;
 
-fbankdir=$1
+# Before option parsing, $1 may still be an option name (e.g. --nj). Prefer the
+# positional argument that is left once parse_options.sh has shifted options away.
+if [ $# -ge 1 ]; then
+    fbankdir=$1
+fi
+
+# Keep only the first lines*scale entries (rounded by awk's %.0f) of wav.scp.
+num_lines=$(wc -l < "${fbankdir}/wav.scp") || exit 1
+num_keep=$(awk -v lines="$num_lines" -v scale="$scale" 'BEGIN { printf "%.0f\n", lines*scale }')
+head -n "$num_keep" "${fbankdir}/wav.scp" > "${fbankdir}/wav.scp.scale" || exit 1
 
 split_dir=${fbankdir}/cmvn/split_${nj};
 mkdir -p $split_dir
@@ -18,17 +36,21 @@
 for n in $(seq $nj); do
     split_scps="$split_scps $split_dir/wav.$n.scp"
 done
-utils/split_scp.pl ${fbankdir}/wav.scp $split_scps || exit 1;
+# $split_scps stays unquoted on purpose: it must expand to one path per job.
+utils/split_scp.pl "${fbankdir}/wav.scp.scale" $split_scps || exit 1;
 
 logdir=${fbankdir}/cmvn/log
+# --config is passed only when set: an empty, unquoted $config would leave a
+# bare --config directly followed by --idx.
 $cmd JOB=1:$nj $logdir/cmvn.JOB.log \
     python utils/compute_cmvn.py \
       --dim ${feats_dim} \
       --wav_path $split_dir \
-      --idx JOB
+      ${config:+--config "$config"} \
+      --idx JOB || exit 1;
 
-python utils/combine_cmvn_file.py --dim ${feats_dim} --cmvn_dir $split_dir --nj $nj --output_dir ${fbankdir}/cmvn
+python utils/combine_cmvn_file.py --dim ${feats_dim} --cmvn_dir $split_dir --nj $nj --output_dir ${fbankdir}/cmvn || exit 1;
 
-python utils/cmvn_converter.py --cmvn_json ${fbankdir}/cmvn/cmvn.json --am_mvn ${fbankdir}/cmvn/cmvn.mvn
+python utils/cmvn_converter.py --cmvn_json "${fbankdir}/cmvn/cmvn.json" --am_mvn "${fbankdir}/cmvn/am.mvn" || exit 1;
 
 echo "$0: Succeeded compute global cmvn"

--
Gitblit v1.9.1