From 23e7ddebccd3b05cf7ef89809bcfe565ad6dfa1f Mon Sep 17 00:00:00 2001
From: majic31 <majic31@163.com>
Date: Tue, 24 Dec 2024 10:00:14 +0800
Subject: [PATCH] Fix the variable name (#2328)

---
 funasr/datasets/audio_datasets/index_ds.py |   12 +++++++++---
 1 file changed, 9 insertions(+), 3 deletions(-)

diff --git a/funasr/datasets/audio_datasets/index_ds.py b/funasr/datasets/audio_datasets/index_ds.py
index da008b4..39ef409 100644
--- a/funasr/datasets/audio_datasets/index_ds.py
+++ b/funasr/datasets/audio_datasets/index_ds.py
@@ -35,7 +35,7 @@
             with open(path, encoding="utf-8") as fin:
                 file_list_all = fin.readlines()
 
-                num_per_slice = (len(file_list_all) - 1) // data_split_num + 1
+                num_per_slice = (len(file_list_all) - 1) // data_split_num + 1  # 16
                 file_list = file_list_all[
                     data_split_i * num_per_slice : (data_split_i + 1) * num_per_slice
                 ]
@@ -104,10 +104,10 @@
                             or target_len > self.max_target_length
                         ):
                             continue
-                            
+
                         if (source_len + target_len) > self.max_token_length:
                             continue
-                            
+
                         contents_i = {
                             "source": source,
                             "prompt": prompt,
@@ -118,6 +118,12 @@
                         text_language = data.get("text_language", None)
                         if text_language is not None:
                             contents_i["text_language"] = text_language
+                        if "emo_target" in data:
+                            contents_i["emo_target"] = data["emo_target"]
+                        if "event_target" in data:
+                            contents_i["event_target"] = data["event_target"]
+                        if "with_or_wo_itn" in data:
+                            contents_i["with_or_wo_itn"] = data["with_or_wo_itn"]
                         # audio_language = data.get("audio_language", None)
                         # if audio_language is not None:
                         #     contents_i["audio_language"] = audio_language

--
Gitblit v1.9.1