| | |
| | | scp=wav.scp |
| | | speed_perturb="0.9 1.0 1.1" |
| | | dataset_type=large |
| | | stage=3 |
| | | stop_stage=4 |
| | | stage=0 |
| | | stop_stage=5 |
| | | |
| | | skip_extract_embed=false |
| | | bert_model_name="bert-base-chinese" |
| | |
| | | nj=64 |
| | | |
| | | # data |
| | | tr_dir=/nfs/wangjiaming.wjm/asr_data/aishell2/AISHELL-2/iOS/data |
| | | dev_tst_dir=/nfs/wangjiaming.wjm/asr_data/aishell2/AISHELL-DEV-TEST-SET |
| | | tr_dir= |
| | | dev_tst_dir= |
| | | |
| | | # exp tag |
| | | tag="exp1" |
| | |
| | | echo "<unk>" >> ${token_list} |
| | | fi |
| | | |
| | | # Training Stage |
| | | # LM Training Stage |
| | | world_size=$gpu_num # run on one machine |
| | | if [ ${stage} -le 3 ] && [ ${stop_stage} -ge 3 ]; then |
| | | echo "stage 3: Training" |
| | | echo "stage 3: LM Training" |
| | | fi |
| | | |
| | | # ASR Training Stage |
| | | world_size=$gpu_num # run on one machine |
| | | if [ ${stage} -le 4 ] && [ ${stop_stage} -ge 4 ]; then |
| | | echo "stage 4: ASR Training" |
| | | if ! "${skip_extract_embed}"; then |
| | | echo "extract embeddings..." |
| | | local/extract_embeds.sh \ |
| | |
| | | fi |
| | | |
| | | # Testing Stage |
| | | if [ ${stage} -le 4 ] && [ ${stop_stage} -ge 4 ]; then |
| | | echo "stage 4: Inference" |
| | | if [ ${stage} -le 5 ] && [ ${stop_stage} -ge 5 ]; then |
| | | echo "stage 5: Inference" |
| | | for dset in ${test_sets}; do |
| | | asr_exp=${exp_dir}/exp/${model_dir} |
| | | inference_tag="$(basename "${inference_config}" .yaml)" |