From e8fd84f5a4c8a7528e474f37b47d9fecde3534b0 Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: Wed, 22 May 2024 14:14:42 +0800
Subject: [PATCH] wenetspeech
---
funasr/models/sense_voice/decoder.py | 7 +++++--
1 file changed, 5 insertions(+), 2 deletions(-)
diff --git a/funasr/models/sense_voice/decoder.py b/funasr/models/sense_voice/decoder.py
index 3c62072..60af29a 100644
--- a/funasr/models/sense_voice/decoder.py
+++ b/funasr/models/sense_voice/decoder.py
@@ -146,7 +146,9 @@
qk = qk + mask[:n_ctx, :n_ctx]
else:
mask = mask.unsqueeze(1).eq(0) # (batch, 1, *, time2)
- min_value = float(np.finfo(torch.tensor(0, dtype=qk.dtype).numpy().dtype).min)
+ min_value = -float(
+ "inf"
+ ) # min_value = float(np.finfo(torch.tensor(0, dtype=qk.dtype).numpy().dtype).min)
qk = qk.masked_fill(mask, min_value)
qk = qk.float()
@@ -599,5 +601,6 @@
def score(self, ys, state, x):
"""Score."""
ys_mask = subsequent_mask(len(ys), device=x.device).unsqueeze(0)
- logp = self.forward(ys.unsqueeze(0), x.unsqueeze(0), cache=state)
+ logp = self.forward(ys.unsqueeze(0), x.unsqueeze(0), cache=None)
+ logp = torch.log_softmax(logp, dim=-1)
return logp.squeeze(0)[-1, :], state
--
Gitblit v1.9.1