From 54a91194901ad72562d5cb5856ee8c302d93fb0e Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: 星期一, 27 十一月 2023 14:11:54 +0800
Subject: [PATCH] dataloader

---
Reviewer notes (free-form area; not part of the commit):
  * Adds two accessor methods, get_source_len() and get_target_len(),
    directly after __getitem__ in the class that precedes AudioDataset.
  * get_source_len() indexes data_dict["source_len"] directly, so the key
    must be present in every item passed to it.
  * get_target_len() returns data_dict["target_len"] when that key is
    present and 0 otherwise.
  * NOTE(review): line breaks and indentation were reconstructed from a
    whitespace-collapsed copy of this patch. The placement of the three
    blank context lines in the hunk is assumed (one before __getitem__,
    two before AudioDataset) -- confirm against the target file before
    applying.

 funasr/datasets/dataset_jsonl.py |    7 +++++++
 1 files changed, 7 insertions(+), 0 deletions(-)

diff --git a/funasr/datasets/dataset_jsonl.py b/funasr/datasets/dataset_jsonl.py
index 543b60e..3a548c8 100644
--- a/funasr/datasets/dataset_jsonl.py
+++ b/funasr/datasets/dataset_jsonl.py
@@ -78,6 +78,13 @@
 
     def __getitem__(self, index):
         return self.contents[index]
+
+    def get_source_len(self, data_dict):
+        return data_dict["source_len"]
+
+    def get_target_len(self, data_dict):
+
+        return data_dict["target_len"] if "target_len" in data_dict else 0
 
 
 class AudioDataset(torch.utils.data.Dataset):
-- 
Gitblit v1.9.1