| | |
| | | nj=64 |
| | | |
| | | # data: raw_data is assigned twice below, so the second value (/nfs/zhifu.gzf/wenetspeech_proc) is the one in effect |
| | | raw_data=../raw_data |
| | | data_url=www.openslr.org/resources/33 |
| | | raw_data=/nfs/zhifu.gzf/wenetspeech_proc |
| | | |
| | | # experiment tag |
| | | tag="exp1" |
| | |
| | | set -u |
| | | set -o pipefail |
| | | |
| | | train_set=train |
| | | train_set=train_l |
| | | valid_set=dev |
| | | test_sets="dev test_net test_meeting" |
| | | |
| | |
| | | fi |
| | | |
| | | # Stage 0: run the data-preparation script, then gather the training set |
| | | # and every test set under $feats_dir/data. |
| | | if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ]; then |
| | | echo "stage 0: Data preparation" |
| | | # Data preparation |
| | | local/wenetspeech_data_prep.sh \ |
| | | --train-subset $set \ |
| | | $wenetspeech_data_dir \ |
| | | data || exit 1; |
| | | # Alternative invocation, left commented out: |
| | | # echo "stage 0: Data preparation" |
| | | # # Data preparation |
| | | # local/wenetspeech_data_prep.sh $raw_data $feats_dir |
| | | # -p: do not fail when the directory already exists (e.g. on a re-run). |
| | | mkdir -p "$feats_dir/data" |
| | | mv "$feats_dir/$train_set" "$feats_dir/data/$train_set" |
| | | # $test_sets is intentionally unquoted: it is a space-separated list. |
| | | for x in $test_sets; do |
| | | # Exactly one "mv": a duplicated word would be taken as a source file |
| | | # named "mv" and make the command fail. |
| | | mv "$feats_dir/$x" "$feats_dir/data/" |
| | | done |
| | | fi |