From 6fe10a8dbfbab2bdcc28a411f9c5da85a4a8d002 Mon Sep 17 00:00:00 2001
From: hohaiuhsx <hohaiuhsx@gmail.com>
Date: Mon, 10 Mar 2025 23:16:22 +0800
Subject: [PATCH] 修复 当选用SenseVoice模型处理长音频(同时开启vad和output_timestamp)时的异常 (#2413)

---
 funasr/datasets/sense_voice_datasets/datasets.py |    4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/funasr/datasets/sense_voice_datasets/datasets.py b/funasr/datasets/sense_voice_datasets/datasets.py
index 20232cc..2e0266e 100644
--- a/funasr/datasets/sense_voice_datasets/datasets.py
+++ b/funasr/datasets/sense_voice_datasets/datasets.py
@@ -325,8 +325,8 @@
             asr_target = item["target"]
             if self.preprocessor_text:
                 asr_target = self.preprocessor_text(asr_target)
-            emo_target = item["emo_target"]
-            event_target = item["event_target"]
+            emo_target = item.get("emo_target", "<|NEUTRAL|>")
+            event_target = item.get("event_target", "<|Speech|>")
             text_language = item.get("text_language", "<|zh|>")
             punc_itn_bottom = item.get("with_or_wo_itn", "<|woitn|>")
 

--
Gitblit v1.9.1