From 9b4e9cc8a0311e5243d69b73ed073e7ea441982e Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: Wed, 27 Mar 2024 16:05:29 +0800
Subject: [PATCH] train update

---
 setup.py |   26 ++++++++++++++++++++++----
 1 files changed, 22 insertions(+), 4 deletions(-)

diff --git a/setup.py b/setup.py
index 4e76c80..64c60ec 100644
--- a/setup.py
+++ b/setup.py
@@ -14,16 +14,14 @@
         "librosa",
         "jamo",  # For kss
         "PyYAML>=5.1.2",
-        # "soundfile>=0.12.1",
+        "soundfile>=0.12.1",
         "kaldiio>=2.17.0",
         "torch_complex",
         # "nltk>=3.4.5",
-        # ASR
         "sentencepiece", # train
         "jieba",
-        # "rotary_embedding_torch",
+        "rotary_embedding_torch",
         # "ffmpeg-python",
-        # TTS
         # "pypinyin>=0.44.0",
         # "espnet_tts_frontend",
         # ENH
@@ -41,6 +39,7 @@
         "jaconv",
         "hydra-core>=1.3.2",
         "tensorboardX",
+        "rotary_embedding_torch",
     ],
     # train: The modules invoked when training only.
     "train": [
@@ -53,6 +52,7 @@
         "torch_optimizer",
         "fairscale",
         "transformers",
+        "openai-whisper"
     ],
     "setup": [
         "numpy",
@@ -82,8 +82,20 @@
         "sphinx-markdown-tables>=0.0.12",
         "configargparse>=1.2.1"
     ],
+    "llm":[
+        "transformers>=4.32.0",
+        "accelerate",
+        "tiktoken",
+        "einops",
+        "transformers_stream_generator>=0.0.4",
+        "scipy",
+        "torchvision",
+        "pillow",
+        "matplotlib",
+    ],
 }
 requirements["all"].extend(requirements["train"])
+requirements["all"].extend(requirements["llm"])
 requirements["test"].extend(requirements["train"])
 
 install_requires = requirements["install"]
@@ -128,5 +140,11 @@
     ],
     entry_points={"console_scripts": [
         "funasr = funasr.bin.inference:main_hydra",
+        "funasr-train = funasr.bin.train:main_hydra",
+        "funasr-export = funasr.bin.export:main_hydra",
+        "scp2jsonl = funasr.datasets.audio_datasets.scp2jsonl:main_hydra",
+        "jsonl2scp = funasr.datasets.audio_datasets.jsonl2scp:main_hydra",
+        "funasr-scp2jsonl = funasr.datasets.audio_datasets.scp2jsonl:main_hydra",
+        "funasr-jsonl2scp = funasr.datasets.audio_datasets.jsonl2scp:main_hydra",
     ]},
 )

--
Gitblit v1.9.1