From 65396eeeff96cdc21f939828e13a2e3d0127f2c6 Mon Sep 17 00:00:00 2001
From: zhifu gao <zhifu.gzf@alibaba-inc.com>
Date: Fri, 26 Jan 2024 11:26:48 +0800
Subject: [PATCH] vad streaming return [beg, -1], [], [-1, end], [beg, end] (#1306)
---
runtime/python/websocket/funasr_wss_client.py | 9 ++++++---
1 file changed, 6 insertions(+), 3 deletions(-)
diff --git a/runtime/python/websocket/funasr_wss_client.py b/runtime/python/websocket/funasr_wss_client.py
index bfe4b0d..a2d8889 100644
--- a/runtime/python/websocket/funasr_wss_client.py
+++ b/runtime/python/websocket/funasr_wss_client.py
@@ -192,7 +192,7 @@
params = wav_file.getparams()
sample_rate = wav_file.getframerate()
frames = wav_file.readframes(wav_file.getnframes())
- audio_bytes = bytes(frames)
+ audio_bytes = bytes(frames)
else:
wav_format = "others"
with open(wav_path, "rb") as f:
@@ -256,6 +256,7 @@
wav_name = meg.get("wav_name", "demo")
text = meg["text"]
timestamp=""
+ offline_msg_done = meg.get("is_final", False)
if "timestamp" in meg:
timestamp = meg["timestamp"]
@@ -265,7 +266,9 @@
else:
text_write_line = "{}\t{}\n".format(wav_name, text)
ibest_writer.write(text_write_line)
-
+
+ if 'mode' not in meg:
+ continue
if meg["mode"] == "online":
text_print += "{}".format(text)
text_print = text_print[-args.words_max_print:]
@@ -292,7 +295,7 @@
text_print = text_print[-args.words_max_print:]
os.system('clear')
print("\rpid" + str(id) + ": " + text_print)
- offline_msg_done=True
+ # offline_msg_done=True
except Exception as e:
print("Exception:", e)
--
Gitblit v1.9.1