From 33d3d2084403fd34b79c835d2f2fe04f6cd8f738 Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: 星期三, 13 九月 2023 09:33:54 +0800
Subject: [PATCH] Merge branch 'main' of github.com:alibaba-damo-academy/FunASR add
---
egs/aishell/transformer/utils/compute_cmvn.sh | 35 ++++++++++++++++++++++-------------
1 files changed, 22 insertions(+), 13 deletions(-)
diff --git a/egs/aishell/transformer/utils/compute_cmvn.sh b/egs/aishell/transformer/utils/compute_cmvn.sh
index 79354af..4e7f80e 100755
--- a/egs/aishell/transformer/utils/compute_cmvn.sh
+++ b/egs/aishell/transformer/utils/compute_cmvn.sh
@@ -2,29 +2,38 @@
. ./path.sh || exit 1;
# Begin configuration section.
+fbankdir=
nj=32
cmd=./utils/run.pl
feats_dim=80
+config_file=
+scale=1.0
echo "$0 $@"
. utils/parse_options.sh || exit 1;
-fbankdir=$1
-logdir=$2
+# Keep the first round(N*scale) lines of wav.scp (N = its line count) as wav.scp.scale.
+head -n "$(awk -v lines="$(wc -l < "${fbankdir}/wav.scp")" -v scale="$scale" 'BEGIN { printf "%.0f\n", lines*scale }')" "${fbankdir}/wav.scp" > "${fbankdir}/wav.scp.scale"
-output_dir=${fbankdir}/cmvn/split_${nj};
-mkdir -p $output_dir
+split_dir=${fbankdir}/cmvn/split_${nj};
+mkdir -p $split_dir
split_scps=""
for n in $(seq $nj); do
- split_scps="$split_scps $output_dir/wav.$n.scp"
+ split_scps="$split_scps $split_dir/wav.$n.scp"
done
-utils/split_scp.pl ${fbankdir}/wav.scp $split_scps || exit 1;
+utils/split_scp.pl ${fbankdir}/wav.scp.scale $split_scps || exit 1;
-#$cmd JOB=1:$nj $logdir/cmvn.JOB.log \
-# python utils/compute_cmvn.py -d ${feats_dim} -a $fbankdir/ark -i JOB -o ${output_dir} \
-# || exit 1;
-#
-#python utils/combine_cmvn_file.py -d ${feats_dim} -c ${output_dir} -n $nj -o $fbankdir
-#
-#echo "$0: Succeeded compute global cmvn"
+# Launch compute_cmvn.py through $cmd with JOB=1:$nj (presumably one job per split); abort on failure.
+logdir=${fbankdir}/cmvn/log
+$cmd JOB=1:$nj $logdir/cmvn.JOB.log \
+    python utils/compute_cmvn.py \
+        --dim ${feats_dim} \
+        --wav_path $split_dir \
+        --config_file $config_file \
+        --idx JOB || exit 1;
+# Combine the $nj per-split results found in $split_dir, writing to ${fbankdir}/cmvn.
+python utils/combine_cmvn_file.py --dim ${feats_dim} --cmvn_dir $split_dir --nj $nj --output_dir ${fbankdir}/cmvn || exit 1;
+# Convert ${fbankdir}/cmvn/cmvn.json into ${fbankdir}/cmvn/am.mvn; only report success if every step passed.
+python utils/cmvn_converter.py --cmvn_json ${fbankdir}/cmvn/cmvn.json --am_mvn ${fbankdir}/cmvn/am.mvn || exit 1;
+echo "$0: Succeeded compute global cmvn"
--
Gitblit v1.9.1