liugz18
2024-07-18 d80ac2fd2df4e7fb8a28acfa512bb11472b5cc99
examples/aishell/paraformer/run.sh
@@ -5,7 +5,7 @@
# general configuration
feats_dir="../DATA" # feature output directory
# NOTE(review): exp_dir is assigned twice back to back; as written the `pwd`
# value overrides ".". These look like the before/after lines of a diff hunk
# whose +/- markers were lost -- confirm which assignment is intended.
exp_dir="."
exp_dir=`pwd`
# lang and token_type are path components of the token list location
# (${feats_dir}/data/${lang}_token_list/$token_type/tokens.txt).
lang=zh
token_type=char
# presumably the first pipeline stage to execute -- TODO confirm against the
# stage checks, which are outside this excerpt.
stage=0
@@ -15,7 +15,7 @@
# Passed as ++dataset_conf.num_workers in one of the visible command fragments;
# any other uses are outside this excerpt.
nj=32
# Forwarded to the inference command as ++device.
inference_device="cuda" # alternative: "cpu"
# NOTE(review): inference_checkpoint is assigned twice; as written the
# "model.pt.avg10" value wins. Likely the old/new lines of a diff hunk with the
# +/- markers stripped -- confirm. The value is embedded in the inference
# output directory name (inference-${inference_checkpoint}).
inference_checkpoint="model.pt"
inference_checkpoint="model.pt.avg10"
# File name of the scp list used for inference -- usage is not visible in this
# excerpt; TODO confirm.
inference_scp="wav.scp"
# Forwarded to the inference command as ++batch_size.
inference_batch_size=32
@@ -26,6 +26,8 @@
# exp tag
tag="exp1"
# Directory the script is launched from; the Hydra-style --config-path
# arguments below are built as "${workspace}/conf".
workspace=`pwd`
# Port handed to torchrun via --master_port.
master_port=12345
# Source the option parser; abort the script if it cannot be sourced or fails.
# presumably this lets --name value command-line flags override the variables
# defined above -- TODO confirm against utils/parse_options.sh.
. utils/parse_options.sh || exit 1;
@@ -76,8 +78,7 @@
    --config-path "${workspace}/conf" \
    --config-name "${config}" \
    ++train_data_set_list="${feats_dir}/data/${train_set}/audio_datasets.jsonl" \
    ++cmvn_file="${feats_dir}/data/${train_set}/cmvn.json" \
    ++dataset_conf.num_workers=$nj
    ++cmvn_file="${feats_dir}/data/${train_set}/cmvn.json"
fi
# Path to the token list file, keyed by language and token type under the
# feature directory.
token_list=${feats_dir}/data/${lang}_token_list/$token_type/tokens.txt
@@ -114,6 +115,7 @@
  torchrun \
  --nnodes 1 \
  --nproc_per_node ${gpu_num} \
  --master_port ${master_port} \
  ../../../funasr/bin/train.py \
  --config-path "${workspace}/conf" \
  --config-name "${config}" \
@@ -144,6 +146,7 @@
    inference_dir="${exp_dir}/exp/${model_dir}/inference-${inference_checkpoint}/${dset}"
    _logdir="${inference_dir}/logdir"
    echo "inference_dir: ${inference_dir}"
    mkdir -p "${_logdir}"
    data_dir="${feats_dir}/data/${dset}"
@@ -171,6 +174,8 @@
          ++input="${_logdir}/keys.${JOB}.scp" \
          ++output_dir="${inference_dir}/${JOB}" \
          ++device="${inference_device}" \
          ++ncpu=1 \
          ++disable_log=true \
          ++batch_size="${inference_batch_size}" &> ${_logdir}/log.${JOB}.txt
        }&