From fb0da9f849a5d3bd473dcdbaf6197c6a5ff24a57 Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: 星期二, 07 五月 2024 15:53:26 +0800
Subject: [PATCH] decoding key
---
funasr/models/sense_voice/whisper_lib/decoding.py | 4 +++-
1 files changed, 3 insertions(+), 1 deletions(-)
diff --git a/funasr/models/sense_voice/whisper_lib/decoding.py b/funasr/models/sense_voice/whisper_lib/decoding.py
index 382a180..609d6a6 100644
--- a/funasr/models/sense_voice/whisper_lib/decoding.py
+++ b/funasr/models/sense_voice/whisper_lib/decoding.py
@@ -62,8 +62,10 @@
else:
x = x.to(mel.device)
+ # FIX(funasr): SenseVoice: pass the full token sequence to model.logits (previously dropped the last token)
+ # logits = model.logits(x[:, :-1], mel)[:, -1]
+ logits = model.logits(x[:, :], mel)[:, -1]
- logits = model.logits(x[:, :-1], mel)[:, -1]
# collect detected languages; suppress all non-language tokens
mask = torch.ones(logits.shape[-1], dtype=torch.bool)
mask[list(tokenizer.all_language_tokens)] = False
--
Gitblit v1.9.1