From 0ee4565c8ec3deffde8362370aee306ae7029ebb Mon Sep 17 00:00:00 2001
From: shixian.shi <shixian.shi@alibaba-inc.com>
Date: Mon, 22 Jan 2024 18:44:07 +0800
Subject: [PATCH] update raw_text

---
 funasr/models/seaco_paraformer/model.py |    2 +-
 funasr/auto/auto_model.py               |    2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/funasr/auto/auto_model.py b/funasr/auto/auto_model.py
index 0641f06..1c7288e 100644
--- a/funasr/auto/auto_model.py
+++ b/funasr/auto/auto_model.py
@@ -406,7 +406,7 @@
                     for res, vadsegment in zip(restored_data, vadsegments):
                         sentence_list.append({"start": vadsegment[0],\
                                                 "end": vadsegment[1],
-                                                "sentence": res['text'],
+                                                "sentence": res['raw_text'],
                                                 "timestamp": res['timestamp']})
                 else: # punc_segment
                     sentence_list = timestamp_sentence(punc_res[0]['punc_array'], \
diff --git a/funasr/models/seaco_paraformer/model.py b/funasr/models/seaco_paraformer/model.py
index 1867bbf..e3cedb4 100644
--- a/funasr/models/seaco_paraformer/model.py
+++ b/funasr/models/seaco_paraformer/model.py
@@ -420,7 +420,7 @@
                     
                     if ibest_writer is not None:
                         ibest_writer["token"][key[i]] = " ".join(token)
-                        # ibest_writer["text"][key[i]] = text
+                        ibest_writer["raw_text"][key[i]] = text
                         ibest_writer["timestamp"][key[i]] = time_stamp_postprocessed
                         ibest_writer["text"][key[i]] = text_postprocessed
                 else:

--
Gitblit v1.9.1