From 9a43b5607d5bb7958c27d06d0252fee1dc858f3e Mon Sep 17 00:00:00 2001
From: 嘉渊 <wangjiaming.wjm@alibaba-inc.com>
Date: Sun, 23 Jul 2023 16:47:53 +0800
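Subject: [PATCH] update callhome eend_ola recipe: clear site-specific data paths, adjust feature dirs, split.py index and default stage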
---
egs/callhome/eend_ola/run.sh | 8 ++++----
egs/callhome/eend_ola/local/run_prepare_shared_eda.sh | 14 +++++++-------
egs/callhome/eend_ola/local/split.py | 2 +-
3 files changed, 12 insertions(+), 12 deletions(-)
diff --git a/egs/callhome/eend_ola/local/run_prepare_shared_eda.sh b/egs/callhome/eend_ola/local/run_prepare_shared_eda.sh
index aec1ff2..f1019d6 100755
--- a/egs/callhome/eend_ola/local/run_prepare_shared_eda.sh
+++ b/egs/callhome/eend_ola/local/run_prepare_shared_eda.sh
@@ -22,16 +22,16 @@
# LDC2011S10, LDC2012S01, LDC2011S05, LDC2011S08
# - musan_root
# MUSAN corpus (https://www.openslr.org/17/)
-callhome_dir=/nfs/wangjiaming.wjm/speech-data/NIST/LDC2001S97
-swb2_phase1_train=/nfs/wangjiaming.wjm/speech-data/LDC/LDC98S75
-data_root=/nfs/wangjiaming.wjm/speech-data/LDC
-musan_root=/nfs/wangjiaming.wjm/speech-data/JHU/musan
+callhome_dir=
+swb2_phase1_train=
+data_root=
+musan_root=
# Modify simulated data storage area.
# This script distributes simulated data under these directories
simu_actual_dirs=(
-/nfs/wangjiaming.wjm/EEND_DATA_sad30_snr10n15n20_funasr_test/s05/$USER/diarization-data
-/nfs/wangjiaming.wjm/EEND_DATA_sad30_snr10n15n20_funasr_test/s08/$USER/diarization-data
-/nfs/wangjiaming.wjm/EEND_DATA_sad30_snr10n15n20_funasr_test/s09/$USER/diarization-data
+./s05/$USER/diarization-data
+./s08/$USER/diarization-data
+./s09/$USER/diarization-data
)
# data preparation options
diff --git a/egs/callhome/eend_ola/local/split.py b/egs/callhome/eend_ola/local/split.py
index aa50b1e..7ad1bad 100644
--- a/egs/callhome/eend_ola/local/split.py
+++ b/egs/callhome/eend_ola/local/split.py
@@ -60,7 +60,7 @@
for file in scp_files:
scp_file = os.path.join(work_path, file)
- idx = scp_file.split('.')[-2]
+ idx = scp_file.split('.')[-1]
reco2dur_file = os.path.join(work_path, 'reco2dur.{}'.format(str(idx)))
spk2utt_file = os.path.join(work_path, 'spk2utt.{}'.format(str(idx)))
segment_file = os.path.join(work_path, 'segments.{}'.format(str(idx)))
diff --git a/egs/callhome/eend_ola/run.sh b/egs/callhome/eend_ola/run.sh
index c3a3f32..ff6b75b 100644
--- a/egs/callhome/eend_ola/run.sh
+++ b/egs/callhome/eend_ola/run.sh
@@ -13,9 +13,9 @@
# feature configuration
data_dir="./data"
-simu_feats_dir=$data_dir/simu/ark_data/dump/simu_data/data
-simu_feats_dir_chunk2000=$data_dir/simu/ark_data/dump/simu_data_chunk2000/data
-callhome_feats_dir_chunk2000=$data_dir/simu/ark_data/dump/callhome_chunk2000/data
+simu_feats_dir=$data_dir/ark_data/dump/simu_data/data
+simu_feats_dir_chunk2000=$data_dir/ark_data/dump/simu_data_chunk2000/data
+callhome_feats_dir_chunk2000=$data_dir/ark_data/dump/callhome_chunk2000/data
simu_train_dataset=train
simu_valid_dataset=dev
callhome_train_dataset=callhome1_spkall
@@ -31,7 +31,7 @@
exp_dir="."
input_size=345
-stage=0
+stage=1
stop_stage=5
# exp tag
--
Gitblit v1.9.1