From 2a66366be4c2715870e4859fd5a5db6e8a9dc00a Mon Sep 17 00:00:00 2001
From: chenmengzheAAA <123789350+chenmengzheAAA@users.noreply.github.com>
Date: Thu, 14 Sep 2023 19:00:17 +0800
Subject: [PATCH] Merge pull request #956 from alibaba-damo-academy/chenmengzheAAA-patch-4
---
egs/aishell2/paraformerbert/local/extract_embeds.sh | 7 ++++---
1 file changed, 4 insertions(+), 3 deletions(-)
diff --git a/egs/aishell2/paraformerbert/local/extract_embeds.sh b/egs/aishell2/paraformerbert/local/extract_embeds.sh
index 049d38c..d7dd4f2 100755
--- a/egs/aishell2/paraformerbert/local/extract_embeds.sh
+++ b/egs/aishell2/paraformerbert/local/extract_embeds.sh
@@ -5,13 +5,12 @@
bert_model_name="bert-base-chinese"
raw_dataset_path="../DATA"
+nj=64
model_path=${bert_model_name}
. utils/parse_options.sh || exit 1;
-nj=32
-
-for data_set in train dev test;do
+for data_set in train dev_ios;do
scp=$raw_dataset_path/data/${data_set}/text
local_scp_dir_raw=${raw_dataset_path}/data/embeds/${data_set}
local_scp_dir=$local_scp_dir_raw/split$nj
@@ -55,6 +54,8 @@
cat ${local_records_dir}/embeds.${JOB}.shape || exit 1;
done > ${local_scp_dir_raw}/embeds.shape
fi
+
+ cp ${local_scp_dir_raw}/embeds.scp ${raw_dataset_path}/data/${data_set}/embeds.scp
done
echo "embeds is in: ${local_scp_dir_raw}"
--
Gitblit v1.9.1