From 8827e26b8d487f123f8d7d5cbd8d00b81dcefcff Mon Sep 17 00:00:00 2001
From: 游雁 <zhifu.gzf@alibaba-inc.com>
Date: 星期五, 23 二月 2024 00:58:18 +0800
Subject: [PATCH] fp16

---
 examples/industrial_data_pretraining/seaco_paraformer/demo.py |   10 ++++++++--
 1 files changed, 8 insertions(+), 2 deletions(-)

diff --git a/examples/industrial_data_pretraining/seaco_paraformer/demo.py b/examples/industrial_data_pretraining/seaco_paraformer/demo.py
index e9e226d..a44c649 100644
--- a/examples/industrial_data_pretraining/seaco_paraformer/demo.py
+++ b/examples/industrial_data_pretraining/seaco_paraformer/demo.py
@@ -19,12 +19,18 @@
 # example1
 res = model.generate(input="https://isv-data.oss-cn-hangzhou.aliyuncs.com/ics/MaaS/ASR/test_audio/asr_example_zh.wav",
                      hotword='达摩院 魔搭',
+                     # return_raw_text=True,     # return raw recognized text split by spaces, with the same length as the timestamp list
+                     # preset_spk_num=2,         # preset number of speakers for the speaker clustering model
                      # sentence_timestamp=True,  # return sentence level information when spk_model is not given
                     )
 print(res)
 
+
+'''
+# tensor or numpy as input
 # example2
 import torchaudio
+import os
 wav_file = os.path.join(model.model_path, "example/asr_example.wav")
 input_tensor, sample_rate = torchaudio.load(wav_file)
 input_tensor = input_tensor.mean(0)
@@ -33,8 +39,8 @@
 
 # example3
 import soundfile
-import os
+
 wav_file = os.path.join(model.model_path, "example/asr_example.wav")
 speech, sample_rate = soundfile.read(wav_file)
 res = model.generate(input=[speech], batch_size_s=300, is_final=True)
-
+'''
\ No newline at end of file

--
Gitblit v1.9.1