From 3aec61c6eaad0c55391ad86b5495e2be4cb359d1 Mon Sep 17 00:00:00 2001
From: 志浩 <neo.dzh@alibaba-inc.com>
Date: 星期三, 15 二月 2023 19:58:08 +0800
Subject: [PATCH] add scripts for simu data

---
 egs/mars/sd/scripts/dump_rttm_to_labels.py |   14 ++++++++++++--
 1 files changed, 12 insertions(+), 2 deletions(-)

diff --git a/egs/mars/sd/scripts/dump_rttm_to_labels.py b/egs/mars/sd/scripts/dump_rttm_to_labels.py
index b4508ec..ce9e7e8 100644
--- a/egs/mars/sd/scripts/dump_rttm_to_labels.py
+++ b/egs/mars/sd/scripts/dump_rttm_to_labels.py
@@ -31,8 +31,18 @@
         for scp_path in wav_scp_list:
             meeting_scp.update(load_scp_as_dict(scp_path))
 
-        assert len(meeting_scp) == len(meeting2rttm), \
-            "Number of wav and rttm mismatch {} != {}".format(len(meeting_scp), len(meeting2rttm))
+        if len(meeting_scp) != len(meeting2rttm):
+            logging.warning("Number of wav and rttm mismatch {} != {}".format(
+                len(meeting_scp), len(meeting2rttm)))
+            common_keys = set(meeting_scp.keys()) & set(meeting2rttm.keys())
+            logging.warning("Keep {} records.".format(len(common_keys)))
+            for key in meeting_scp:
+                if key not in common_keys:
+                    meeting_scp.pop(key)
+                    logging.warning("Pop {} from wav scp".format(key))
+                if key not in meeting2rttm:
+                    meeting2rttm.pop(key)
+                    logging.warning("Pop {} from rttm scp".format(key))
 
         if not os.path.exists(args.out_dir):
             os.makedirs(args.out_dir)

--
Gitblit v1.9.1