| | |
# Default option values. They are assigned before utils/parse_options.sh is
# sourced, so presumably they can be overridden from the command line
# (--stop_stage, --set, --data_dir, --WENETSPEECH) -- confirm against that file.
stop_stage=100   # upper bound tested with -ge in the stage guards below
set=L            # forwarded as "--set" to local/data.sh in stage 0
data_dir="data"
WENETSPEECH=     # deliberately empty; its existence is checked further down
| | | |
# Record the exact invocation: script path followed by all arguments joined
# into one string. `log` is not defined in this part of the file; it has to be
# defined before this point.
log "$0 $*"

# Option parsing. Abort if the helper cannot be sourced, so the script never
# continues silently with unparsed defaults (same guard as the files below).
# NOTE(review): assumes parse_options.sh returns 0 on success -- confirm.
. utils/parse_options.sh || exit 1

# Environment, job-command and dataset-location settings. Each file is
# mandatory: a failure to source any of them stops the script.
# NOTE(review): db.sh is sourced after option parsing; if it assigns
# WENETSPEECH, it will replace a value passed on the command line -- confirm.
. ./path.sh || exit 1
. ./cmd.sh || exit 1
. ./db.sh || exit 1
| | | |
# Stop before doing any work when WENETSPEECH does not name an existing path.
# An empty value also ends up here, because `-e ""` is never true.
if [ ! -e "${WENETSPEECH}" ]; then
  log "Fill the value of 'WENETSPEECH' of db.sh"
  log "or download the data set following the instruction in https://wenet-e2e.github.io/WenetSpeech/"
  exit 1
fi
| | | |
| | | if [ ! -d "${WENETSPEECH}/audio" ] && [ ! -f "${WENETSPEECH}/WenetSpeech.json" ]; then |
| | | echo "Valid WENETSPEECH data not found in ${WENETSPEECH}." |
| | |
| | | if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ]; then |
| | | echo "stage 0: Data preparation" |
| | | # Data preparation |
| | | local/data.sh "--set ${set}" |
| | | local/data.sh --set ${set} --nj 64 --data_dir $feats_dir --WENETSPEECH $raw_data |
| | | # mkdir $feats_dir/data |
| | | # mv $feats_dir/$train_set $feats_dir/data/$train_set |
| | | # for x in $test_sets; do |