| | |
| | | type=sound |
| | | scp=wav.scp |
| | | speed_perturb="0.9 1.0 1.1" |
| | | stage=0 |
| | | stage=3 |
| | | stop_stage=5 |
| | | |
| | | # feature configuration |
| | |
| | | if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ]; then |
| | | echo "stage 0: Data preparation" |
| | | # Data preparation |
| | | # local/data.sh --set ${set} --nj $nj --data_dir $feats_dir --WENETSPEECH $raw_data --train_cmd $train_cmd |
| | | local/data.sh --set ${set} --nj $nj --data_dir $feats_dir --WENETSPEECH $raw_data --train_cmd $train_cmd |
| | | mkdir $feats_dir/data |
| | | mv $feats_dir/$train_set $feats_dir/data/$train_set |
| | | for x in $test_sets; do |
| | |
| | | --use_preprocessor true \ |
| | | --token_type $token_type \ |
| | | --token_list $token_list \ |
| | | --dataset_type large \ |
| | | --data_dir ${feats_dir}/data \ |
| | | --train_set ${train_set} \ |
| | | --valid_set ${valid_set} \ |
| | |
| | | inference_tag="$(basename "${inference_config}" .yaml)" |
| | | _dir="${asr_exp}/${inference_tag}/${inference_asr_model}/${dset}" |
| | | _logdir="${_dir}/logdir" |
| | | if [ -d ${_dir} ]; then |
| | | echo "${_dir} is already exists. if you want to decode again, please delete this dir first." |
| | | you want to decode again, please delete this dir first." |
| | | exit 0 |
| | | fi |
| | | mkdir -p "${_logdir}" |
| | |
| | | --am_model_name $inference_asr_model \ |
| | | --mode asr \ |
| | | --model_name conformer \ |
| | | --dataset aishell \ |
| | | --dataset wenetspeech \ |
| | | --output_dir $exp_dir/exp/$model_dir \ |
| | | --vocab_size $vocab_size \ |
| | | --tag $tag |