From fcaf910ceb4e07a13bf2d133f46df684b069b3f0 Mon Sep 17 00:00:00 2001
From: 雾聪 <wucong.lyb@alibaba-inc.com>
Date: 星期三, 03 一月 2024 11:45:22 +0800
Subject: [PATCH] update online docs
---
runtime/onnxruntime/src/util.cpp | 14 +++++++++-----
1 files changed, 9 insertions(+), 5 deletions(-)
diff --git a/runtime/onnxruntime/src/util.cpp b/runtime/onnxruntime/src/util.cpp
index ac793f5..0fbec4f 100644
--- a/runtime/onnxruntime/src/util.cpp
+++ b/runtime/onnxruntime/src/util.cpp
@@ -305,6 +305,10 @@
}
bool TimestampIsPunctuation(U16CHAR_T &u16) {
+ // (& ' -) in the dict
+ if (u16 == 0x26 || u16 == 0x27 || u16 == 0x2D){
+ return false;
+ }
return (u16 >= 0x21 && u16 <= 0x2F) // 标准ASCII标点
|| (u16 >= 0x3A && u16 <= 0x40) // 标准ASCII标点
|| (u16 >= 0x5B && u16 <= 0x60) // 标准ASCII标点
@@ -580,7 +584,8 @@
}
}
// format
- ts_sent += "{'text':'" + text_seg + "',";
+ ts_sent += "{'text_seg':'" + text_seg + "',";
+ ts_sent += "'punc':'" + characters[idx_str] + "',";
ts_sent += "'start':'" + to_string(start) + "',";
ts_sent += "'end':'" + to_string(end) + "',";
ts_sent += "'ts_list':" + VectorToString(ts_seg) + "}";
@@ -590,9 +595,7 @@
} else{
ts_sentences += ts_sent + ",";
}
-
// clear
- idx_str++;
text_seg = "";
ts_sent = "";
start = 0;
@@ -605,9 +608,9 @@
text_seg += " " + characters[idx_str];
}
ts_seg.push_back(timestamps[idx_ts]);
- idx_str++;
idx_ts++;
}
+ idx_str++;
}
// for none punc results
if(ts_seg.size() >0){
@@ -618,7 +621,8 @@
end = ts_seg[ts_seg.size()-1][1];
}
// format
- ts_sent += "{'text':'" + text_seg + "',";
+ ts_sent += "{'text_seg':'" + text_seg + "',";
+ ts_sent += "'punc':'',";
ts_sent += "'start':'" + to_string(start) + "',";
ts_sent += "'end':'" + to_string(end) + "',";
ts_sent += "'ts_list':" + VectorToString(ts_seg) + "}";
--
Gitblit v1.9.1