From 54a91194901ad72562d5cb5856ee8c302d93fb0e Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: Mon, 27 Nov 2023 14:11:54 +0800
Subject: [PATCH] dataloader

---
 funasr/datasets/dataset_jsonl.py |    7 +++++++
 1 files changed, 7 insertions(+), 0 deletions(-)

diff --git a/funasr/datasets/dataset_jsonl.py b/funasr/datasets/dataset_jsonl.py
index 543b60e..3a548c8 100644
--- a/funasr/datasets/dataset_jsonl.py
+++ b/funasr/datasets/dataset_jsonl.py
@@ -78,6 +78,13 @@
 	
 	def __getitem__(self, index):
 		return self.contents[index]
+	
+	def get_source_len(self, data_dict):
+		return data_dict["source_len"]  # no fallback: "source_len" is looked up unconditionally
+
+	def get_target_len(self, data_dict):
+		# "target_len" is optional: when the key is absent from data_dict, the length is reported as 0.
+		return data_dict["target_len"] if "target_len" in data_dict else 0
 
 
 class AudioDataset(torch.utils.data.Dataset):

--
Gitblit v1.9.1