From ec42889511b121230e97bbcdf05f4d517f95d7ba Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: Fri, 23 Feb 2024 15:09:35 +0800
Subject: [PATCH] update
---
funasr/models/llm_asr/model.py | 4 ++--
1 file changed, 2 insertions(+), 2 deletions(-)
diff --git a/funasr/models/llm_asr/model.py b/funasr/models/llm_asr/model.py
index e3cf551..937c8e1 100644
--- a/funasr/models/llm_asr/model.py
+++ b/funasr/models/llm_asr/model.py
@@ -217,7 +217,7 @@
) -> Tuple[torch.Tensor, torch.Tensor]:
audio_mask = kwargs.get("audio_mask")
- audio_token_lengths = audio_mask.sum(-1)
+ audio_token_lengths = audio_mask.sum(-1) if audio_mask else None
batch = {"speech": speech, "speech_lengths": speech_lengths}
enc, enc_lens = self.audio_encoder.encode(**batch)
@@ -279,7 +279,7 @@
prompt_pre = "USER: \nINSTRUCTION: {}\nINPUT: ".format(prompt)
- prompt_ids = self.tokenizer.encode(prompt_pre)
+ prompt_ids = tokenizer.encode(prompt_pre)
prompt_length = len(prompt_ids)
prompt_ids = torch.tensor(prompt_ids, dtype=torch.int64).to(kwargs["device"])
--
Gitblit v1.9.1