嘉渊
2023-07-23 9a43b5607d5bb7958c27d06d0252fee1dc858f3e
update
3个文件已修改
24 ■■■■ 已修改文件
egs/callhome/eend_ola/local/run_prepare_shared_eda.sh 14 ●●●● 补丁 | 查看 | 原始文档 | blame | 历史
egs/callhome/eend_ola/local/split.py 2 ●●● 补丁 | 查看 | 原始文档 | blame | 历史
egs/callhome/eend_ola/run.sh 8 ●●●● 补丁 | 查看 | 原始文档 | blame | 历史
egs/callhome/eend_ola/local/run_prepare_shared_eda.sh
@@ -22,16 +22,16 @@
#    LDC2011S10, LDC2012S01, LDC2011S05, LDC2011S08
#  - musan_root
#    MUSAN corpus (https://www.openslr.org/17/)
-callhome_dir=/nfs/wangjiaming.wjm/speech-data/NIST/LDC2001S97
-swb2_phase1_train=/nfs/wangjiaming.wjm/speech-data/LDC/LDC98S75
-data_root=/nfs/wangjiaming.wjm/speech-data/LDC
-musan_root=/nfs/wangjiaming.wjm/speech-data/JHU/musan
+callhome_dir=
+swb2_phase1_train=
+data_root=
+musan_root=
# Modify simulated data storage area.
# This script distributes simulated data under these directories
simu_actual_dirs=(
-/nfs/wangjiaming.wjm/EEND_DATA_sad30_snr10n15n20_funasr_test/s05/$USER/diarization-data
-/nfs/wangjiaming.wjm/EEND_DATA_sad30_snr10n15n20_funasr_test/s08/$USER/diarization-data
-/nfs/wangjiaming.wjm/EEND_DATA_sad30_snr10n15n20_funasr_test/s09/$USER/diarization-data
+./s05/$USER/diarization-data
+./s08/$USER/diarization-data
+./s09/$USER/diarization-data
)
# data preparation options
egs/callhome/eend_ola/local/split.py
@@ -60,7 +60,7 @@
    for file in scp_files:
        scp_file = os.path.join(work_path, file)
-        idx = scp_file.split('.')[-2]
+        idx = scp_file.split('.')[-1]
        reco2dur_file = os.path.join(work_path, 'reco2dur.{}'.format(str(idx)))
        spk2utt_file = os.path.join(work_path, 'spk2utt.{}'.format(str(idx)))
        segment_file = os.path.join(work_path, 'segments.{}'.format(str(idx)))
egs/callhome/eend_ola/run.sh
@@ -13,9 +13,9 @@
# feature configuration
data_dir="./data"
-simu_feats_dir=$data_dir/simu/ark_data/dump/simu_data/data
-simu_feats_dir_chunk2000=$data_dir/simu/ark_data/dump/simu_data_chunk2000/data
-callhome_feats_dir_chunk2000=$data_dir/simu/ark_data/dump/callhome_chunk2000/data
+simu_feats_dir=$data_dir/ark_data/dump/simu_data/data
+simu_feats_dir_chunk2000=$data_dir/ark_data/dump/simu_data_chunk2000/data
+callhome_feats_dir_chunk2000=$data_dir/ark_data/dump/callhome_chunk2000/data
simu_train_dataset=train
simu_valid_dataset=dev
callhome_train_dataset=callhome1_spkall
@@ -31,7 +31,7 @@
exp_dir="."
input_size=345
-stage=0
+stage=1
stop_stage=5
# exp tag