From 887039e9d335f9964ebacb14b0205ee891e6819b Mon Sep 17 00:00:00 2001
From: 嘉渊 <wangjiaming.wjm@alibaba-inc.com>
Date: 星期日, 23 四月 2023 17:42:42 +0800
Subject: [PATCH] update

---
 funasr/bin/train.py |   71 ++++++++++++++++++++++++++++++-----
 1 files changed, 61 insertions(+), 10 deletions(-)

diff --git a/funasr/bin/train.py b/funasr/bin/train.py
index c6f19b6..c32a362 100644
--- a/funasr/bin/train.py
+++ b/funasr/bin/train.py
@@ -6,18 +6,20 @@
 
 import torch
 
+from funasr.build_utils.build_args import build_args
+from funasr.build_utils.build_dataloader import build_dataloader
+from funasr.build_utils.build_distributed import build_distributed
+from funasr.build_utils.build_model import build_model
+from funasr.build_utils.build_optimizer import build_optimizer
+from funasr.build_utils.build_scheduler import build_scheduler
+from funasr.text.phoneme_tokenizer import g2p_choices
 from funasr.torch_utils.model_summary import model_summary
 from funasr.torch_utils.pytorch_version import pytorch_cudnn_version
 from funasr.torch_utils.set_all_random_seed import set_all_random_seed
 from funasr.utils import config_argparse
-from funasr.utils.build_args import build_args
-from funasr.utils.build_dataloader import build_dataloader
-from funasr.utils.build_distributed import build_distributed
-from funasr.utils.build_model import build_model
-from funasr.utils.build_optimizer import build_optimizer
-from funasr.utils.build_scheduler import build_scheduler
 from funasr.utils.prepare_data import prepare_data
 from funasr.utils.types import str2bool
+from funasr.utils.types import str_or_none
 from funasr.utils.yaml_no_alias_safe_dump import yaml_no_alias_safe_dump
 
 
@@ -281,6 +283,55 @@
         help="Apply preprocessing to data or not",
     )
 
+    # options related to most tasks
+    parser.add_argument(
+        "--init",
+        type=lambda x: str_or_none(x.lower()),
+        default=None,
+        help="The initialization method",
+        choices=[
+            "chainer",
+            "xavier_uniform",
+            "xavier_normal",
+            "kaiming_uniform",
+            "kaiming_normal",
+            None,
+        ],
+    )
+    parser.add_argument(
+        "--token_list",
+        type=str_or_none,
+        default=None,
+        help="A text mapping int-id to token",
+    )
+    parser.add_argument(
+        "--token_type",
+        type=str,
+        default="bpe",
+        choices=["bpe", "char", "word"],
+        help="",
+    )
+    parser.add_argument(
+        "--bpemodel",
+        type=str_or_none,
+        default=None,
+        help="The model file fo sentencepiece",
+    )
+    parser.add_argument(
+        "--cleaner",
+        type=str_or_none,
+        choices=[None, "tacotron", "jaconv", "vietnamese"],
+        default=None,
+        help="Apply text cleaning",
+    )
+    parser.add_argument(
+        "--g2p",
+        type=str_or_none,
+        choices=g2p_choices,
+        default=None,
+        help="Specify g2p method if --token_type=phn",
+    )
+
     # pai related
     parser.add_argument(
         "--use_pai",
@@ -369,16 +420,16 @@
     prepare_data(args, distributed_option)
 
     model = build_model(args)
-    optimizer = build_optimizer(args, model=model)
-    scheduler = build_scheduler(args, optimizer)
+    optimizers = build_optimizer(args, model=model)
+    schedulers = build_scheduler(args, optimizers)
 
     logging.info("world size: {}, rank: {}, local_rank: {}".format(distributed_option.dist_world_size,
                                                                    distributed_option.dist_rank,
                                                                    distributed_option.local_rank))
     logging.info(pytorch_cudnn_version())
     logging.info(model_summary(model))
-    logging.info("Optimizer: {}".format(optimizer))
-    logging.info("Scheduler: {}".format(scheduler))
+    logging.info("Optimizer: {}".format(optimizers))
+    logging.info("Scheduler: {}".format(schedulers))
 
     # dump args to config.yaml
     if not distributed_option.distributed or distributed_option.dist_rank == 0:

--
Gitblit v1.9.1