From 216dc0978c88d3d29c228b7e65445810d5b299bb Mon Sep 17 00:00:00 2001
From: speech_asr <wangjiaming.wjm@alibaba-inc.com>
Date: Tue, 14 Feb 2023 14:58:46 +0800
Subject: [PATCH] add wav/text mismatch process

---
 funasr/utils/wav_utils.py |    2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/funasr/utils/wav_utils.py b/funasr/utils/wav_utils.py
index 76ed678..590ccdb 100644
--- a/funasr/utils/wav_utils.py
+++ b/funasr/utils/wav_utils.py
@@ -311,7 +311,7 @@
         sample_name, txt = parts
         text_dict[sample_name] = txt
     filter_count = 0
-    with open(wav_file) as f_wav, open(text_file) as f_text:
+    with open(wav_file, "w") as f_wav, open(text_file, "w") as f_text:
         for sample_name, wav_path in wav_dict.items():
             if sample_name in text_dict.keys():
                 f_wav.write(sample_name + " " + wav_path  + "\n")

--
Gitblit v1.9.1