From 75be3ceccdf02599c43c7e9888bfdb6ba561fc71 Mon Sep 17 00:00:00 2001
From: 雾聪 <wucong.lyb@alibaba-inc.com>
Date: Tue, 10 Oct 2023 20:41:57 +0800
Subject: [PATCH] fix the issue of concatenating multiple VAD segments for en-bpe

---
 funasr/runtime/onnxruntime/src/funasrruntime.cpp |   10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/funasr/runtime/onnxruntime/src/funasrruntime.cpp b/funasr/runtime/onnxruntime/src/funasrruntime.cpp
index 73738c7..150be70 100644
--- a/funasr/runtime/onnxruntime/src/funasrruntime.cpp
+++ b/funasr/runtime/onnxruntime/src/funasrruntime.cpp
@@ -257,11 +257,15 @@
 		int n_total = audio.GetQueueSize();
 		float start_time = 0.0;
 		std::string cur_stamp = "[";
+		std::string lang = (offline_stream->asr_handle)->GetLang();
 		while (audio.Fetch(buff, len, flag, start_time) > 0) {
 			string msg = (offline_stream->asr_handle)->Forward(buff, len, true, hw_emb);
 			std::vector<std::string> msg_vec = funasr::split(msg, '|');
 			if(msg_vec.size()==0){
 				continue;
+			}
+			if(lang == "en-bpe" and p_result->msg != ""){
+				p_result->msg += " ";
 			}
 			p_result->msg += msg_vec[0];
 			//timestamp
@@ -282,7 +286,6 @@
 			p_result->stamp += cur_stamp + "]";
 		}
 		if(offline_stream->UsePunc()){
-			string lang = (offline_stream->asr_handle)->GetLang();
 			string punc_res = (offline_stream->punc_handle)->AddPunc((p_result->msg).c_str(), lang);
 			p_result->msg = punc_res;
 		}
@@ -338,11 +341,15 @@
 		int n_total = audio.GetQueueSize();
 		float start_time = 0.0;
 		std::string cur_stamp = "[";
+		std::string lang = (offline_stream->asr_handle)->GetLang();
 		while (audio.Fetch(buff, len, flag, start_time) > 0) {
 			string msg = (offline_stream->asr_handle)->Forward(buff, len, true, hw_emb);
 			std::vector<std::string> msg_vec = funasr::split(msg, '|');
 			if(msg_vec.size()==0){
 				continue;
+			}
+			if(lang == "en-bpe" and p_result->msg != ""){
+				p_result->msg += " ";
 			}
 			p_result->msg += msg_vec[0];
 			//timestamp
@@ -364,7 +371,6 @@
 			p_result->stamp += cur_stamp + "]";
 		}
 		if(offline_stream->UsePunc()){
-			string lang = (offline_stream->asr_handle)->GetLang();
 			string punc_res = (offline_stream->punc_handle)->AddPunc((p_result->msg).c_str(), lang);
 			p_result->msg = punc_res;
 		}

--
Gitblit v1.9.1