shixian.shi
2023-06-28 438c4663d2094ed7ce1762fa4f16cf89401b8bec
setup.py
@@ -17,10 +17,10 @@
        "humanfriendly",
        "scipy>=1.4.1",
        # "filelock",
        "librosa==0.8.1",
        "librosa",
        "jamo==0.4.1",  # For kss
        "PyYAML>=5.1.2",
        "soundfile>=0.10.2",
        "soundfile>=0.11.0",
        "h5py>=2.10.0",
        "kaldiio>=2.17.0",
        "torch_complex",
@@ -35,12 +35,17 @@
        # ENH
        # "ci_sdr",
        "pytorch_wpe",
        "editdistance==0.5.2",
        "editdistance>=0.5.2",
        "tensorboard==1.15",
        "g2p",
        # PAI
        "oss2",
        "kaldi-native-fbank",
        # "kaldi-native-fbank",
        # timestamp
        "edit-distance",
        # textgrid
        "textgrid",
        "protobuf==3.20.0",
    ],
    # train: The modules invoked when training only.
    "train": [
@@ -76,7 +81,7 @@
        # "gtn==0.0.0",
    ],
    "setup": [
        "numpy<=1.21.3",
        "numpy",
        "pytest-runner",
    ],
    "test": [
@@ -121,7 +126,7 @@
    name="funasr",
    version=version,
    url="https://github.com/alibaba-damo-academy/FunASR.git",
    author="Speech Lab, Alibaba Group, China",
    author="Speech Lab of DAMO Academy, Alibaba Group",
    author_email="funasr@list.alibaba-inc.com",
    description="FunASR: A Fundamental End-to-End Speech Recognition Toolkit",
    long_description=open(os.path.join(dirname, "README.md"), encoding="utf-8").read(),