Shi Xian
2023-12-06 b3fcd42bf6e60372ed0f0d3e53798fcdd713fe08
funasr/bin/ss_inference_launch.py
@@ -13,7 +13,7 @@
import numpy as np
import torch
import soundfile as sf
import librosa
from funasr.build_utils.build_streaming_iterator import build_streaming_iterator
from funasr.torch_utils.set_all_random_seed import set_all_random_seed
from funasr.utils import config_argparse
@@ -104,7 +104,12 @@
            ss_results = speech_separator(**batch)
            
            for spk in range(num_spks):
                sf.write(os.path.join(output_path, keys[0] + '_s' + str(spk+1)+'.wav'), ss_results[spk], sample_rate)
                # sf.write(os.path.join(output_path, keys[0] + '_s' + str(spk+1)+'.wav'), ss_results[spk], sample_rate)
                try:
                    librosa.output.write_wav(os.path.join(output_path, keys[0] + '_s' + str(spk+1)+'.wav'), ss_results[spk], sample_rate)
                except:
                    print("To write wav by librosa, you should install librosa<=0.8.0")
                    raise
        torch.cuda.empty_cache()
        return ss_results