From 3aec61c6eaad0c55391ad86b5495e2be4cb359d1 Mon Sep 17 00:00:00 2001
From: 志浩 <neo.dzh@alibaba-inc.com>
Date: 星期三, 15 二月 2023 19:58:08 +0800
Subject: [PATCH] add scripts for simu data
---
egs/mars/sd/scripts/dump_rttm_to_labels.py | 14 ++++++++++++--
1 files changed, 12 insertions(+), 2 deletions(-)
diff --git a/egs/mars/sd/scripts/dump_rttm_to_labels.py b/egs/mars/sd/scripts/dump_rttm_to_labels.py
index b4508ec..ce9e7e8 100644
--- a/egs/mars/sd/scripts/dump_rttm_to_labels.py
+++ b/egs/mars/sd/scripts/dump_rttm_to_labels.py
@@ -31,8 +31,18 @@
for scp_path in wav_scp_list:
meeting_scp.update(load_scp_as_dict(scp_path))
- assert len(meeting_scp) == len(meeting2rttm), \
- "Number of wav and rttm mismatch {} != {}".format(len(meeting_scp), len(meeting2rttm))
+ # Tolerate a wav/rttm count mismatch: warn and keep only keys present in both.
+ if len(meeting_scp) != len(meeting2rttm):
+     logging.warning("Number of wav and rttm mismatch {} != {}".format(
+         len(meeting_scp), len(meeting2rttm)))
+     common_keys = set(meeting_scp.keys()) & set(meeting2rttm.keys())
+     logging.warning("Keep {} records.".format(len(common_keys)))
+     # Pop over key snapshots: resizing a dict while iterating it raises RuntimeError.
+     for scp, tag in ((meeting_scp, "wav"), (meeting2rttm, "rttm")):
+         for key in list(scp):
+             if key not in common_keys:
+                 scp.pop(key)
+                 logging.warning("Pop {} from {} scp".format(key, tag))
if not os.path.exists(args.out_dir):
os.makedirs(args.out_dir)
--
Gitblit v1.9.1