From 88b464edb94531ba98744a5338965af539ab18ec Mon Sep 17 00:00:00 2001
From: slin000111 <127832064+slin000111@users.noreply.github.com>
Date: Sat, 20 Sep 2025 22:40:30 +0800
Subject: [PATCH] Fix prefix concatenation in timestamp post-processing for sensevoice (#2670)
---
funasr/models/sense_voice/model.py | 4 ++--
1 file changed, 2 insertions(+), 2 deletions(-)
diff --git a/funasr/models/sense_voice/model.py b/funasr/models/sense_voice/model.py
index 38943a2..6a29181 100644
--- a/funasr/models/sense_voice/model.py
+++ b/funasr/models/sense_voice/model.py
@@ -979,9 +979,9 @@
timestamp_new.append([start, end])
words_new.append(word)
elif prev_word is not None and prev_word.isalpha() and prev_word.isascii() and word.isalpha() and word.isascii():
- prev_word += word
+ word = prev_word + word
timestamp_new[-1][1] = end
- words_new[-1] = prev_word
+ words_new[-1] = word
else:
# timestamp_new[-1][0] += word
timestamp_new.append([start, end])
--
Gitblit v1.9.1