From ec5e15d47c9f5392700a0bce59c697a4960b8741 Mon Sep 17 00:00:00 2001
From: 嘉渊 <wangjiaming.wjm@alibaba-inc.com>
Date: Tue, 25 Apr 2023 11:48:12 +0800
Subject: [PATCH] update

---
 funasr/utils/prepare_data.py |    8 ++++++++
 1 file changed, 8 insertions(+), 0 deletions(-)

diff --git a/funasr/utils/prepare_data.py b/funasr/utils/prepare_data.py
index c9a99e5..8ed97d5 100644
--- a/funasr/utils/prepare_data.py
+++ b/funasr/utils/prepare_data.py
@@ -157,7 +157,15 @@
 
 
 def prepare_data(args, distributed_option):
+    if args.dataset_type == "small" and args.train_data_path_and_name_and_type is not None:
+        return
+    if args.dataset_type == "large" and args.train_data_file is not None:
+        return
     distributed = distributed_option.distributed
+    if not hasattr(args, "train_set"):
+        args.train_set = "train"
+    if not hasattr(args, "dev_set"):
+        args.dev_set = "validation"
     if not distributed or distributed_option.dist_rank == 0:
         filter_wav_text(args.data_dir, args.train_set)
         filter_wav_text(args.data_dir, args.dev_set)

--
Gitblit v1.9.1