python/FunASR-XL.git

			@@ -23,6 +23,5 @@
			\| paraformer-zh-spk <br> ( [⭐](https://modelscope.cn/models/damo/speech_paraformer-large-vad-punc-spk_asr_nat-zh-cn/summary) [🤗]() ) \| 分角色语音识别，带时间戳输出，非实时 \| 60000小时，中文 \| 220M \|
			\| paraformer-zh-streaming <br> ( [⭐](https://modelscope.cn/models/damo/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-online/summary) [🤗]() ) \| 语音识别，实时 \| 60000小时，中文 \| 220M \|
			\| paraformer-zh-streaming-small <br> ( [⭐](https://www.modelscope.cn/models/iic/speech_paraformer_asr_nat-zh-cn-16k-common-vocab8404-online/summary) [🤗]() ) \| 语音识别，实时 \| 60000小时，中文 \| 220M \|

			\| paraformer-en <br> ( [⭐](https://www.modelscope.cn/models/damo/speech_paraformer-large-vad-punc_asr_nat-en-16k-common-vocab10020/summary) [🤗]() ) \| 语音识别，非实时 \| 50000小时，英文 \| 220M \|

			@@ -42,6 +42,11 @@
			// Passed to Tokenize below as its third argument.
			// NOTE(review): presumably receives the token ids for strText — confirm against the tokenizer.
			vector<int> InputData;
			string strText; // full_text
			// Fold every element of arr_cache onto the (still empty) strText.
			// NOTE(review): presumably std::accumulate concatenating cached strings — confirm arr_cache's element type.
			strText = accumulate(arr_cache.begin(), arr_cache.end(), strText);

			// If the previous sentence ends with an English letter and this sentence
			// also starts with an English letter, a space should be inserted between them.
			// The test only checks that the 0x80 bit is clear on the last cached byte and
			// on the first input byte, so it is true for ANY byte below 0x80 (digits and
			// punctuation included), not just letters. `and` is the alternative spelling
			// of `&&`. Only the single statement that follows is conditional.
			if ((strText.size() > 0 and !(strText[strText.size()-1] & 0x80)) && (strlen(sz_input) > 0 && !(sz_input[0] & 0x80)))
			strText += " ";

			strText += sz_input; // full_text = precache + text
			// NOTE(review): Tokenize presumably writes its results into strOut and InputData — confirm.
			m_tokenizer.Tokenize(strText.c_str(), strOut, InputData);

			@@ -107,7 +112,7 @@
			{
			if (!(sentence_words_list[i][0] & 0x80) && (i + 1) < sentence_words_list.size() && !(sentence_words_list[i + 1][0] & 0x80))
			{
			sentence_words_list[i] = " " + sentence_words_list[i];
			sentence_words_list[i] = sentence_words_list[i] + " ";
			}
			if (nSkipNum < arr_cache.size()) // if skip_num < len(cache):
			nSkipNum++;

	model_zoo/readme_zh.md	1 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史
	runtime/onnxruntime/src/ct-transformer-online.cpp	7 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史

			@@ -23,6 +23,5 @@
			\| paraformer-zh-spk <br> ( [⭐](https://modelscope.cn/models/damo/speech_paraformer-large-vad-punc-spk_asr_nat-zh-cn/summary) [🤗]() ) \| 分角色语音识别，带时间戳输出，非实时 \| 60000小时，中文 \| 220M \|
			\| paraformer-zh-streaming <br> ( [⭐](https://modelscope.cn/models/damo/speech_paraformer-large_asr_nat-zh-cn-16k-common-vocab8404-online/summary) [🤗]() ) \| 语音识别，实时 \| 60000小时，中文 \| 220M \|
			\| paraformer-zh-streaming-small <br> ( [⭐](https://www.modelscope.cn/models/iic/speech_paraformer_asr_nat-zh-cn-16k-common-vocab8404-online/summary) [🤗]() ) \| 语音识别，实时 \| 60000小时，中文 \| 220M \|

			\| paraformer-en <br> ( [⭐](https://www.modelscope.cn/models/damo/speech_paraformer-large-vad-punc_asr_nat-en-16k-common-vocab10020/summary) [🤗]() ) \| 语音识别，非实时 \| 50000小时，英文 \| 220M \|