From b57b98364ff60ae0119b2e8d92471316bb4e504f Mon Sep 17 00:00:00 2001
From: zhifu gao <zhifu.gzf@alibaba-inc.com>
Date: Wed, 22 Nov 2023 00:36:35 +0800
Subject: [PATCH] funasr v2 setup (#1106)

---
 funasr/bin/asr_infer.py |   29 ++++++++++++++---------------
 1 file changed, 14 insertions(+), 15 deletions(-)

diff --git a/funasr/bin/asr_infer.py b/funasr/bin/asr_infer.py
index 4648fb3..c1d08df 100644
--- a/funasr/bin/asr_infer.py
+++ b/funasr/bin/asr_infer.py
@@ -44,9 +44,9 @@
     """Speech2Text class
 
     Examples:
-        >>> import soundfile
+        >>> import librosa
         >>> speech2text = Speech2Text("asr_config.yml", "asr.pb")
-        >>> audio, rate = soundfile.read("speech.wav")
+        >>> audio, rate = librosa.load("speech.wav")
         >>> speech2text(audio)
         [(text, token, token_int, hypothesis object), ...]
 
@@ -251,9 +251,9 @@
     """Speech2Text class
 
     Examples:
-            >>> import soundfile
+            >>> import librosa
             >>> speech2text = Speech2TextParaformer("asr_config.yml", "asr.pb")
-            >>> audio, rate = soundfile.read("speech.wav")
+            >>> audio, rate = librosa.load("speech.wav")
             >>> speech2text(audio)
             [(text, token, token_int, hypothesis object), ...]
 
@@ -625,9 +625,9 @@
     """Speech2Text class
 
     Examples:
-            >>> import soundfile
+            >>> import librosa
             >>> speech2text = Speech2TextParaformerOnline("asr_config.yml", "asr.pth")
-            >>> audio, rate = soundfile.read("speech.wav")
+            >>> audio, rate = librosa.load("speech.wav")
             >>> speech2text(audio)
             [(text, token, token_int, hypothesis object), ...]
 
@@ -876,9 +876,9 @@
     """Speech2Text class
 
     Examples:
-        >>> import soundfile
+        >>> import librosa
         >>> speech2text = Speech2TextUniASR("asr_config.yml", "asr.pb")
-        >>> audio, rate = soundfile.read("speech.wav")
+        >>> audio, rate = librosa.load("speech.wav")
         >>> speech2text(audio)
         [(text, token, token_int, hypothesis object), ...]
 
@@ -1106,9 +1106,9 @@
     """Speech2Text class
 
     Examples:
-        >>> import soundfile
+        >>> import librosa
         >>> speech2text = Speech2TextMFCCA("asr_config.yml", "asr.pb")
-        >>> audio, rate = soundfile.read("speech.wav")
+        >>> audio, rate = librosa.load("speech.wav")
         >>> speech2text(audio)
         [(text, token, token_int, hypothesis object), ...]
 
@@ -1605,7 +1605,6 @@
         feats_lengths = to_device(feats_lengths, device=self.device)
 
         enc_out, _, _ = self.asr_model.encoder(feats, feats_lengths)
-
         nbest_hyps = self.beam_search(enc_out[0])
 
         return nbest_hyps
@@ -1638,9 +1637,9 @@
     """Speech2Text class
 
     Examples:
-        >>> import soundfile
+        >>> import librosa
         >>> speech2text = Speech2TextSAASR("asr_config.yml", "asr.pb")
-        >>> audio, rate = soundfile.read("speech.wav")
+        >>> audio, rate = librosa.load("speech.wav")
         >>> speech2text(audio)
         [(text, token, token_int, hypothesis object), ...]
 
@@ -1886,9 +1885,9 @@
     """Speech2Text class
 
     Examples:
-        >>> import soundfile
+        >>> import librosa
         >>> speech2text = Speech2Text("asr_config.yml", "asr.pb")
-        >>> audio, rate = soundfile.read("speech.wav")
+        >>> audio, rate = librosa.load("speech.wav")
         >>> speech2text(audio)
         [(text, token, token_int, hypothesis object), ...]
 

--
Gitblit v1.9.1