From cdca62d933c4e0766a05044c6cba7cfa0596e615 Mon Sep 17 00:00:00 2001
From: zhifu gao <zhifu.gzf@alibaba-inc.com>
Date: Wed, 21 Feb 2024 19:22:59 +0800
Subject: [PATCH] Dev gzf (#1377)
---
examples/industrial_data_pretraining/paraformer/finetune.sh | 7 ++++---
1 file changed, 4 insertions(+), 3 deletions(-)
diff --git a/examples/industrial_data_pretraining/paraformer/finetune.sh b/examples/industrial_data_pretraining/paraformer/finetune.sh
index 5fc7481..266346c 100644
--- a/examples/industrial_data_pretraining/paraformer/finetune.sh
+++ b/examples/industrial_data_pretraining/paraformer/finetune.sh
@@ -6,10 +6,12 @@
#git clone https://www.modelscope.cn/damo/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-pytorch.git ${local_path}
## generate jsonl from wav.scp and text.txt
-#python funasr/datasets/audio_datasets/scp2jsonl.py \
+#python -m funasr.datasets.audio_datasets.scp2jsonl \
#++scp_file_list='["/Users/zhifu/funasr1.0/test_local/wav.scp", "/Users/zhifu/funasr1.0/test_local/text.txt"]' \
#++data_type_list='["source", "target"]' \
#++jsonl_file_out=/Users/zhifu/funasr1.0/test_local/audio_datasets.jsonl
+
+
# torchrun \
# --nnodes 1 \
# --nproc_per_node 1 \
@@ -22,5 +24,4 @@
++dataset_conf.batch_type="example" \
++train_conf.max_epoch=2 \
++dataset_conf.num_workers=4 \
-+output_dir="outputs/debug/ckpt/funasr2/exp2" \
-+debug="true"
\ No newline at end of file
++output_dir="outputs/debug/ckpt/funasr2/exp2"
\ No newline at end of file
--
Gitblit v1.9.1