From b8e2cab7ee61cb7762ca628f52bff7f6f32f1793 Mon Sep 17 00:00:00 2001
From: haoneng.lhn <haoneng.lhn@alibaba-inc.com>
Date: Thu, 20 Jul 2023 09:46:33 +0800
Subject: [PATCH] add lora finetune code
---
funasr/bin/build_trainer.py | 16 +++++++++-------
1 files changed, 9 insertions(+), 7 deletions(-)
diff --git a/funasr/bin/build_trainer.py b/funasr/bin/build_trainer.py
index df3434f..0f87186 100644
--- a/funasr/bin/build_trainer.py
+++ b/funasr/bin/build_trainer.py
@@ -1,12 +1,7 @@
-# -*- encoding: utf-8 -*-
-#!/usr/bin/env python3
-# Copyright FunASR (https://github.com/alibaba-damo-academy/FunASR). All Rights Reserved.
-# MIT License (https://opensource.org/licenses/MIT)
-
import os
import yaml
-
+import logging
def update_dct(fin_configs, root):
if root == {}:
@@ -27,6 +22,8 @@
if mode == "asr":
from funasr.tasks.asr import ASRTask as ASRTask
elif mode == "paraformer":
+ from funasr.tasks.asr import ASRTaskParaformer as ASRTask
+ elif mode == "paraformer_streaming":
from funasr.tasks.asr import ASRTaskParaformer as ASRTask
elif mode == "paraformer_vad_punc":
from funasr.tasks.asr import ASRTaskParaformer as ASRTask
@@ -58,7 +55,7 @@
scheduler_conf=None,
specaug=None,
specaug_conf=None,
- param_dict=None,
+ mate_params=None,
**kwargs):
mode = modelscope_dict['mode']
args, ASRTask = parse_args(mode=mode)
@@ -88,6 +85,7 @@
finetune_configs = yaml.safe_load(f)
# set data_types
if dataset_type == "large":
+ # finetune_configs["dataset_conf"]["data_types"] = "sound,text"
if 'data_types' not in finetune_configs['dataset_conf']:
finetune_configs["dataset_conf"]["data_types"] = "sound,text"
finetune_configs = update_dct(configs, finetune_configs)
@@ -146,6 +144,10 @@
args.patience = None
args.local_rank = local_rank
args.distributed = distributed
+ if mate_params is not None:
+ for key, value in mate_params.items():
+ if hasattr(args, key):
+ setattr(args, key, value)
ASRTask.finetune_args = args
return ASRTask
--
Gitblit v1.9.1