| New file |
| | |
| | | from modelscope.pipelines import pipeline |
| | | from modelscope.utils.constant import Tasks |
| | | import numpy as np |
| | | import os |
| | | |
| | | |
| | | def test_wav_cpu_infer(): |
| | | output_dir = "./outputs" |
| | | data_path_and_name_and_type = [ |
| | | "data/unit_test/test_wav.scp,speech,sound", |
| | | "data/unit_test/test_profile.scp,profile,kaldi_ark", |
| | | ] |
| | | diar_pipeline = pipeline( |
| | | task=Tasks.speaker_diarization, |
| | | model='damo/speech_diarization_sond-zh-cn-alimeeting-16k-n16k4-pytorch', |
| | | mode="sond", |
| | | output_dir=output_dir, |
| | | num_workers=0, |
| | | log_level="WARNING", |
| | | ) |
| | | results = diar_pipeline(data_path_and_name_and_type) |
| | | print(results) |
| | | |
| | | |
| | | def test_wav_gpu_infer(): |
| | | output_dir = "./outputs" |
| | | data_path_and_name_and_type = [ |
| | | "data/unit_test/test_wav.scp,speech,sound", |
| | | "data/unit_test/test_profile.scp,profile,kaldi_ark", |
| | | ] |
| | | diar_pipeline = pipeline( |
| | | task=Tasks.speaker_diarization, |
| | | model='damo/speech_diarization_sond-zh-cn-alimeeting-16k-n16k4-pytorch', |
| | | mode="sond", |
| | | output_dir=output_dir, |
| | | num_workers=0, |
| | | log_level="WARNING", |
| | | ) |
| | | results = diar_pipeline(data_path_and_name_and_type) |
| | | print(results) |
| | | |
| | | |
| | | def test_without_profile_gpu_infer(): |
| | | raw_inputs = [ |
| | | "data/unit_test/raw_inputs/record.wav", |
| | | "data/unit_test/raw_inputs/spk1.wav", |
| | | "data/unit_test/raw_inputs/spk2.wav", |
| | | "data/unit_test/raw_inputs/spk3.wav", |
| | | "data/unit_test/raw_inputs/spk4.wav" |
| | | ] |
| | | diar_pipeline = pipeline( |
| | | task=Tasks.speaker_diarization, |
| | | model='damo/speech_diarization_sond-zh-cn-alimeeting-16k-n16k4-pytorch', |
| | | mode="sond_demo", |
| | | sv_model="damo/speech_xvector_sv-zh-cn-cnceleb-16k-spk3465-pytorch", |
| | | sv_model_revision="master", |
| | | num_workers=0, |
| | | log_level="WARNING", |
| | | param_dict={}, |
| | | ) |
| | | results = diar_pipeline(raw_inputs) |
| | | print(results) |
| | | |
| | | |
| | | def test_url_without_profile_gpu_infer(): |
| | | raw_inputs = [ |
| | | "https://isv-data.oss-cn-hangzhou.aliyuncs.com/ics/MaaS/ASR/test_data/speaker_diarization/record.wav", |
| | | "https://isv-data.oss-cn-hangzhou.aliyuncs.com/ics/MaaS/ASR/test_data/speaker_diarization/spk1.wav", |
| | | "https://isv-data.oss-cn-hangzhou.aliyuncs.com/ics/MaaS/ASR/test_data/speaker_diarization/spk2.wav", |
| | | "https://isv-data.oss-cn-hangzhou.aliyuncs.com/ics/MaaS/ASR/test_data/speaker_diarization/spk3.wav", |
| | | "https://isv-data.oss-cn-hangzhou.aliyuncs.com/ics/MaaS/ASR/test_data/speaker_diarization/spk4.wav", |
| | | ] |
| | | diar_pipeline = pipeline( |
| | | task=Tasks.speaker_diarization, |
| | | model='damo/speech_diarization_sond-zh-cn-alimeeting-16k-n16k4-pytorch', |
| | | mode="sond_demo", |
| | | sv_model="damo/speech_xvector_sv-zh-cn-cnceleb-16k-spk3465-pytorch", |
| | | sv_model_revision="master", |
| | | num_workers=0, |
| | | log_level="WARNING", |
| | | param_dict={}, |
| | | ) |
| | | results = diar_pipeline(raw_inputs) |
| | | print(results) |
| | | |
| | | |
| | | if __name__ == '__main__': |
| | | os.environ["CUDA_VISIBLE_DEVICES"] = "0" |
| | | test_wav_cpu_infer() |
| | | test_wav_gpu_infer() |
| | | test_without_profile_gpu_infer() |
| | | test_url_without_profile_gpu_infer() |