From c458f20c09cf0b39af540ba24d9398c7575fd853 Mon Sep 17 00:00:00 2001
From: zhifu gao <zhifu.gzf@alibaba-inc.com>
Date: 星期一, 30 一月 2023 17:54:06 +0800
Subject: [PATCH] Merge pull request #47 from alibaba-damo-academy/dev
---
funasr/models/e2e_asr_paraformer.py | 6 +++---
1 files changed, 3 insertions(+), 3 deletions(-)
diff --git a/funasr/models/e2e_asr_paraformer.py b/funasr/models/e2e_asr_paraformer.py
index 65c70df..7596896 100644
--- a/funasr/models/e2e_asr_paraformer.py
+++ b/funasr/models/e2e_asr_paraformer.py
@@ -499,11 +499,11 @@
def sampler(self, encoder_out, encoder_out_lens, ys_pad, ys_pad_lens, pre_acoustic_embeds):
tgt_mask = (~make_pad_mask(ys_pad_lens, maxlen=ys_pad_lens.max())[:, :, None]).to(ys_pad.device)
- ys_pad = ys_pad * tgt_mask[:, :, 0]
+ ys_pad_masked = ys_pad * tgt_mask[:, :, 0]
if self.share_embedding:
- ys_pad_embed = self.decoder.output_layer.weight[ys_pad]
+ ys_pad_embed = self.decoder.output_layer.weight[ys_pad_masked]
else:
- ys_pad_embed = self.decoder.embed(ys_pad)
+ ys_pad_embed = self.decoder.embed(ys_pad_masked)
with torch.no_grad():
decoder_outs = self.decoder(
encoder_out, encoder_out_lens, pre_acoustic_embeds, ys_pad_lens
--
Gitblit v1.9.1