zhifu gao
2024-04-23 2ac38adbe5f4e1374a079e032ed4b504351a207c
examples/aishell/paraformer/run.sh
@@ -5,7 +5,7 @@
# general configuration
# Root directory for features/data; other paths in this script are built
# under ${feats_dir}/data.
feats_dir="../DATA" #feature output directory
# exp_dir is assigned twice in a row: the second assignment (the absolute
# current working directory reported by pwd) overrides the "." set just
# before it.
exp_dir="."
exp_dir=`pwd`
# lang and token_type are used as path components of the token list location.
lang=zh
token_type=char
# NOTE(review): presumably the first pipeline stage to run — confirm against
# the stage checks elsewhere in the script.
stage=0
@@ -15,7 +15,7 @@
# NOTE(review): presumably the number of parallel jobs/workers — confirm
# against where ${nj} is consumed.
nj=32
# Device forwarded to the inference command as ++device; "cpu" is the
# alternative noted inline.
inference_device="cuda" #"cpu"
# inference_checkpoint is assigned twice in a row: the second value
# ("model.pt.avg10") overrides "model.pt". The value also becomes part of the
# inference output directory name (inference-${inference_checkpoint}).
inference_checkpoint="model.pt"
inference_checkpoint="model.pt.avg10"
# NOTE(review): presumably the name of the scp file listing inference
# inputs — confirm against its use.
inference_scp="wav.scp"
# Forwarded to the inference command as ++batch_size.
inference_batch_size=32
@@ -76,8 +76,7 @@
    --config-path "${workspace}/conf" \
    --config-name "${config}" \
    ++train_data_set_list="${feats_dir}/data/${train_set}/audio_datasets.jsonl" \
    ++cmvn_file="${feats_dir}/data/${train_set}/cmvn.json" \
    ++dataset_conf.num_workers=$nj
    ++cmvn_file="${feats_dir}/data/${train_set}/cmvn.json"
fi
# Token list file, located by language and token type under the feature
# data directory.
token_list=${feats_dir}/data/${lang}_token_list/$token_type/tokens.txt
@@ -144,6 +143,7 @@
    inference_dir="${exp_dir}/exp/${model_dir}/inference-${inference_checkpoint}/${dset}"
    _logdir="${inference_dir}/logdir"
    echo "inference_dir: ${inference_dir}"
    mkdir -p "${_logdir}"
    data_dir="${feats_dir}/data/${dset}"
@@ -171,6 +171,8 @@
          ++input="${_logdir}/keys.${JOB}.scp" \
          ++output_dir="${inference_dir}/${JOB}" \
          ++device="${inference_device}" \
          ++ncpu=1 \
          ++disable_log=true \
          ++batch_size="${inference_batch_size}" &> ${_logdir}/log.${JOB}.txt
        }&