From a64b7d8d8aeb2bb543ca703045a45f42470e9a63 Mon Sep 17 00:00:00 2001
From: 彭震东 <zhendong.peng@qq.com>
Date: 星期四, 30 五月 2024 15:12:53 +0800
Subject: [PATCH] keep empty speech result (#1772)
---
funasr/models/sense_voice/whisper_lib/decoding.py | 4 +++-
1 files changed, 3 insertions(+), 1 deletions(-)
diff --git a/funasr/models/sense_voice/whisper_lib/decoding.py b/funasr/models/sense_voice/whisper_lib/decoding.py
index 382a180..a468efa 100644
--- a/funasr/models/sense_voice/whisper_lib/decoding.py
+++ b/funasr/models/sense_voice/whisper_lib/decoding.py
@@ -62,8 +62,10 @@
else:
x = x.to(mel.device)
-
+ # FIX(funasr): SenseVoice
logits = model.logits(x[:, :-1], mel)[:, -1]
+ # logits = model.logits(x[:, :], mel)[:, -1]
+
# collect detected languages; suppress all non-language tokens
mask = torch.ones(logits.shape[-1], dtype=torch.bool)
mask[list(tokenizer.all_language_tokens)] = False
--
Gitblit v1.9.1