python/FunASR-XL.git

			@@ -20,7 +20,7 @@
			# Input description. The values are taken verbatim by later steps;
			# presumably "type" is the input data type and "scp" the list file name
			# — confirm against the consumers of these variables.
			type=sound
			scp=wav.scp
			# Space-separated list of factors (presumably speed-perturbation ratios
			# applied during data preparation — TODO confirm).
			speed_perturb="0.9 1.0 1.1"
			# Stage window. Stage blocks in this script are guarded by tests of the
			# form `[ ${stage} -le N ] && [ ${stop_stage} -ge N ]`, so stage N runs
			# only when stage <= N <= stop_stage. With these values stages 3..5 run.
			stage=3
			stop_stage=5

			# feature configuration
			@@ -72,7 +72,7 @@
			if [ ${stage} -le 0 ] && [ ${stop_stage} -ge 0 ]; then
			echo "stage 0: Data preparation"
			# Data preparation
			# local/data.sh --set ${set} --nj $nj --data_dir $feats_dir --WENETSPEECH $raw_data --train_cmd $train_cmd
			local/data.sh --set ${set} --nj $nj --data_dir $feats_dir --WENETSPEECH $raw_data --train_cmd $train_cmd
			mkdir $feats_dir/data
			mv $feats_dir/$train_set $feats_dir/data/$train_set
			for x in $test_sets; do
			@@ -129,6 +129,7 @@
			--use_preprocessor true \
			--token_type $token_type \
			--token_list $token_list \
			--dataset_type large \
			--data_dir ${feats_dir}/data \
			--train_set ${train_set} \
			--valid_set ${valid_set} \
			@@ -157,8 +158,7 @@
			# Derive the decode output locations.
			# inference_tag is the file name of ${inference_config} with its
			# directory part and trailing ".yaml" removed.
			inference_tag="$(basename "${inference_config}" .yaml)"
			# Result directory: <asr_exp>/<inference_tag>/<inference_asr_model>/<dset>.
			_dir="${asr_exp}/${inference_tag}/${inference_asr_model}/${dset}"
			# "logdir" subdirectory of the result directory; presumably holds the
			# decode job logs — confirm against the decode step.
			_logdir="${_dir}/logdir"
			# Refuse to decode into a result directory that already exists: print a
			# notice on stdout and stop the whole script with status 0 instead of
			# decoding again.
			# ${_dir} is quoted so that an empty or whitespace-containing value
			# cannot collapse the test into the always-true one-argument `[ -d ]`.
			if [ -d "${_dir}" ]; then
				echo "${_dir} is already exists. if you want to decode again, please delete this dir first."
				exit 0
			fi
			# Create ${_logdir} together with any missing parent directories;
			# -p makes this succeed without error when the directory already exists.
			mkdir -p "${_logdir}"
			@@ -215,7 +215,7 @@
			--am_model_name $inference_asr_model \
			--mode asr \
			--model_name conformer \
			--dataset aishell \
			--dataset wenetspeech \
			--output_dir $exp_dir/exp/$model_dir \
			--vocab_size $vocab_size \
			--tag $tag