| | |
| | | logging.info("dataloader config: {}".format(self.dataset_conf)) |
| | | batch_mode = self.dataset_conf.get("batch_mode", "padding") |
| | | self.dataset = Dataset(args.data_list, symbol_table, seg_dict, punc_dict, bpe_tokenizer, |
| | | self.dataset_conf, self.frontend_conf, speed_perturb=args.speed_perturb, |
| | | self.dataset_conf, self.frontend_conf, |
| | | speed_perturb=args.speed_perturb if mode == "train" else None, |
| | | mode=mode, batch_mode=batch_mode) |
| | | |
| | | def build_iter(self, epoch, shuffle=True): |
| | |
| | | data_path_and_name_and_type, |
| | | preprocess=preprocess_fn, |
| | | dest_sample_rate=dest_sample_rate, |
| | | speed_perturb=args.speed_perturb, |
| | | speed_perturb=args.speed_perturb if mode=="train" else None, |
| | | ) |
| | | |
| | | # sampler |