python/FunASR-XL.git

parent: dc682db8 | 补丁 | 提交 | ignore whitespace

Merge branch 'main' into dev_gzf_funasr2

zhifu gao

2023-11-23 61567c6d3bc8723243ffabd2d88a227a2d416e89

Merge branch 'main' into dev_gzf_funasr2

11个文件已修改

	funasr/datasets/large_datasets/utils/padding.py	18 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史
	funasr/quick_start.md	4 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史
	funasr/quick_start_zh.md	4 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史
	runtime/docs/SDK_advanced_guide_offline.md	4 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史
	runtime/docs/SDK_advanced_guide_offline_en.md	4 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史
	runtime/docs/SDK_advanced_guide_offline_en_zh.md	4 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史
	runtime/docs/SDK_advanced_guide_offline_zh.md	7 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史
	runtime/docs/SDK_advanced_guide_online.md	4 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史
	runtime/docs/SDK_advanced_guide_online_zh.md	7 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史
	runtime/python/websocket/README.md	2 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史
	runtime/python/websocket/funasr_wss_server.py	4 ●●●●● 补丁 \| 查看 \| 原始文档 \| blame \| 历史

 funasr/datasets/large_datasets/utils/padding.py

@@ -32,7 +32,7 @@
            batch[data_name] = tensor_pad
            batch[data_name + "_lengths"] = tensor_lengths

    # DHA, EAHC NOT INCLUDED
    # SAC LABEL INCLUDE
    if "hotword_indxs" in batch:
        # if hotword indxs in batch
        # use it to slice hotwords out
@@ -41,28 +41,25 @@
        text = batch['text']
        text_lengths = batch['text_lengths']
        hotword_indxs = batch['hotword_indxs']
        num_hw = sum([int(i) for i in batch['hotword_indxs_lengths'] if i != 1]) // 2
        B, t1 = text.shape
        dha_pad = torch.ones_like(text) * -1
        _, t1 = text.shape
        t1 += 1  # TODO: as parameter which is same as predictor_bias
        ideal_attn = torch.zeros(B, t1, num_hw+1)
        nth_hw = 0
        for b, (hotword_indx, one_text, length) in enumerate(zip(hotword_indxs, text, text_lengths)):
            ideal_attn[b][:,-1] = 1
            dha_pad[b][:length] = 8405
            if hotword_indx[0] != -1:
                start, end = int(hotword_indx[0]), int(hotword_indx[1])
                hotword = one_text[start: end+1]
                hotword_list.append(hotword)
                hotword_lengths.append(end-start+1)
                ideal_attn[b][start:end+1, nth_hw] = 1
                ideal_attn[b][start:end+1, -1] = 0
                dha_pad[b][start: end+1] = one_text[start: end+1]
                nth_hw += 1
                if len(hotword_indx) == 4 and hotword_indx[2] != -1:
                    # the second hotword if exist
                    start, end = int(hotword_indx[2]), int(hotword_indx[3])
                    hotword_list.append(one_text[start: end+1])
                    hotword_lengths.append(end-start+1)
                    ideal_attn[b][start:end+1, nth_hw-1] = 1
                    ideal_attn[b][start:end+1, -1] = 0
                    dha_pad[b][start: end+1] = one_text[start: end+1]
                    nth_hw += 1
        hotword_list.append(torch.tensor([1]))
        hotword_lengths.append(1)
@@ -71,8 +68,7 @@
                                padding_value=0)
        batch["hotword_pad"] = hotword_pad
        batch["hotword_lengths"] = torch.tensor(hotword_lengths, dtype=torch.int32)
        batch['ideal_attn'] = ideal_attn
        batch['dha_pad'] = dha_pad
        del batch['hotword_indxs']
        del batch['hotword_indxs_lengths']

    return keys, batch

 funasr/quick_start.md

@@ -16,7 +16,7 @@
#### Server Deployment

```shell
cd funasr/runtime/python/websocket
cd runtime/python/websocket
python funasr_wss_server.py --port 10095
```

@@ -161,4 +161,4 @@
cd egs/aishell/paraformer
. ./run.sh --CUDA_VISIBLE_DEVICES="0,1" --gpu_num=2
```
More examples could be found in [docs](https://alibaba-damo-academy.github.io/FunASR/en/modelscope_pipeline/quick_start.html)
More examples could be found in [docs](https://alibaba-damo-academy.github.io/FunASR/en/modelscope_pipeline/quick_start.html)

 funasr/quick_start_zh.md

@@ -17,7 +17,7 @@

##### 服务端部署
```shell
cd funasr/runtime/python/websocket
cd runtime/python/websocket
python funasr_wss_server.py --port 10095
```

@@ -161,4 +161,4 @@
. ./run.sh --CUDA_VISIBLE_DEVICES="0,1" --gpu_num=2
```

更多例子可以参考（[点击此处](https://alibaba-damo-academy.github.io/FunASR/en/academic_recipe/asr_recipe.html)）
更多例子可以参考（[点击此处](https://alibaba-damo-academy.github.io/FunASR/en/academic_recipe/asr_recipe.html)）

 runtime/docs/SDK_advanced_guide_offline.md

@@ -94,7 +94,9 @@
--punc-quant: True for quantized PUNC model, False for non-quantized PUNC model. Default is True.
--itn-dir modelscope model ID or local model path.
--port: Port number that the server listens on. Default is 10095.
--decoder-thread-num: Number of inference threads that the server starts. Default is 8.
--decoder-thread-num: The number of thread pools on the server side that can handle concurrent requests. The default value is 8.
--model-thread-num: The number of internal threads for each recognition route to control the parallelism of the ONNX model. 
        The default value is 1. It is recommended that decoder-thread-num * model-thread-num equals the total number of threads.
--io-thread-num: Number of IO threads that the server starts. Default is 1.
--certfile <string>: SSL certificate file. Default is ../../../ssl_key/server.crt. If you want to close ssl，set 0
--keyfile <string>: SSL key file. Default is ../../../ssl_key/server.key. 

 runtime/docs/SDK_advanced_guide_offline_en.md

@@ -73,7 +73,9 @@
--punc-quant: True for quantized PUNC model, False for non-quantized PUNC model. Default is True.
--itn-dir modelscope model ID or local model path.
--port: Port number that the server listens on. Default is 10095.
--decoder-thread-num: Number of inference threads that the server starts. Default is 8.
--decoder-thread-num: The number of thread pools on the server side that can handle concurrent requests. The default value is 8.
--model-thread-num: The number of internal threads for each recognition route to control the parallelism of the ONNX model. 
        The default value is 1. It is recommended that decoder-thread-num * model-thread-num equals the total number of threads.
--io-thread-num: Number of IO threads that the server starts. Default is 1.
--certfile <string>: SSL certificate file. Default is ../../../ssl_key/server.crt. If you want to close ssl，set 0
--keyfile <string>: SSL key file. Default is ../../../ssl_key/server.key. 

 runtime/docs/SDK_advanced_guide_offline_en_zh.md

@@ -158,7 +158,9 @@
--punc-quant   True为量化PUNC模型，False为非量化PUNC模型，默认是True
--itn-dir modelscope model ID 或者 本地模型路径
--port  服务端监听的端口号，默认为 10095
--decoder-thread-num  服务端启动的推理线程数，默认为 8
--decoder-thread-num  服务端线程池个数(支持的最大并发路数)，默认为 8
--model-thread-num  每路识别的内部线程数(控制ONNX模型的并行)，默认为 1，
                    其中建议 decoder-thread-num*model-thread-num 等于总线程数
--io-thread-num  服务端启动的IO线程数，默认为 1
--certfile  ssl的证书文件，默认为：../../../ssl_key/server.crt，如果需要关闭ssl，参数设置为0
--keyfile   ssl的密钥文件，默认为：../../../ssl_key/server.key

 runtime/docs/SDK_advanced_guide_offline_zh.md

@@ -175,11 +175,14 @@
--lm-dir modelscope model ID 或者 本地模型路径
--itn-dir modelscope model ID 或者 本地模型路径
--port  服务端监听的端口号，默认为 10095
--decoder-thread-num  服务端启动的推理线程数，默认为 8
--decoder-thread-num  服务端线程池个数(支持的最大并发路数)，默认为 8
--model-thread-num  每路识别的内部线程数(控制ONNX模型的并行)，默认为 1，
                    其中建议 decoder-thread-num*model-thread-num 等于总线程数
--io-thread-num  服务端启动的IO线程数，默认为 1
--certfile  ssl的证书文件，默认为：../../../ssl_key/server.crt，如果需要关闭ssl，参数设置为0
--keyfile   ssl的密钥文件，默认为：../../../ssl_key/server.key
--hotword   热词文件路径，每行一个热词，格式：热词 权重(例如:阿里巴巴 20)，如果客户端提供热词，则与客户端提供的热词合并一起使用。
--hotword   热词文件路径，每行一个热词，格式：热词 权重(例如:阿里巴巴 20)，
            如果客户端提供热词，则与客户端提供的热词合并一起使用，服务端热词全局生效，客户端热词只针对对应客户端生效。
```

### 关闭FunASR服务

 runtime/docs/SDK_advanced_guide_online.md

@@ -111,7 +111,9 @@
--punc-quant: True for quantized PUNC model, False for non-quantized PUNC model. Default is True.
--itn-dir modelscope model ID or local model path.
--port: Port number that the server listens on. Default is 10095.
--decoder-thread-num: Number of inference threads that the server starts. Default is 8.
--decoder-thread-num: The number of thread pools on the server side that can handle concurrent requests. The default value is 8.
--model-thread-num: The number of internal threads for each recognition route to control the parallelism of the ONNX model. 
        The default value is 1. It is recommended that decoder-thread-num * model-thread-num equals the total number of threads.
--io-thread-num: Number of IO threads that the server starts. Default is 1.
--certfile <string>: SSL certificate file. Default is ../../../ssl_key/server.crt. If you want to close ssl，set 0
--keyfile <string>: SSL key file. Default is ../../../ssl_key/server.key. 

 runtime/docs/SDK_advanced_guide_online_zh.md

@@ -120,11 +120,14 @@
--punc-quant   True为量化PUNC模型，False为非量化PUNC模型，默认是True
--itn-dir modelscope model ID 或者 本地模型路径
--port  服务端监听的端口号，默认为 10095
--decoder-thread-num  服务端启动的推理线程数，默认为 8
--decoder-thread-num  服务端线程池个数(支持的最大并发路数)，默认为 8
--model-thread-num  每路识别的内部线程数(控制ONNX模型的并行)，默认为 1，
                    其中建议 decoder-thread-num*model-thread-num 等于总线程数
--io-thread-num  服务端启动的IO线程数，默认为 1
--certfile  ssl的证书文件，默认为：../../../ssl_key/server.crt，如果需要关闭ssl，参数设置为0
--keyfile   ssl的密钥文件，默认为：../../../ssl_key/server.key
--hotword   热词文件路径，每行一个热词，格式：热词 权重(例如:阿里巴巴 20)，如果客户端提供热词，则与客户端提供的热词合并一起使用。
--hotword   热词文件路径，每行一个热词，格式：热词 权重(例如:阿里巴巴 20)，
            如果客户端提供热词，则与客户端提供的热词合并一起使用，服务端热词全局生效，客户端热词只针对对应客户端生效。
```

### 关闭FunASR服务

 runtime/python/websocket/README.md

@@ -16,7 +16,7 @@
### Install the requirements for server

```shell
cd funasr/runtime/python/websocket
cd runtime/python/websocket
pip install -r requirements_server.txt
```


 runtime/python/websocket/funasr_wss_server.py

@@ -53,13 +53,13 @@
                    help="cpu cores")
parser.add_argument("--certfile",
                    type=str,
                    default="../ssl_key/server.crt",
                    default="../../ssl_key/server.crt",
                    required=False,
                    help="certfile for ssl")

parser.add_argument("--keyfile",
                    type=str,
                    default="../ssl_key/server.key",
                    default="../../ssl_key/server.key",
                    required=False,
                    help="keyfile for ssl")
args = parser.parse_args()

			@@ -32,7 +32,7 @@
			batch[data_name] = tensor_pad
			batch[data_name + "_lengths"] = tensor_lengths

			# DHA, EAHC NOT INCLUDED
			# SAC LABEL INCLUDE
			if "hotword_indxs" in batch:
			# if hotword indxs in batch
			# use it to slice hotwords out
			@@ -41,28 +41,25 @@
			text = batch['text']
			text_lengths = batch['text_lengths']
			hotword_indxs = batch['hotword_indxs']
			num_hw = sum([int(i) for i in batch['hotword_indxs_lengths'] if i != 1]) // 2
			B, t1 = text.shape
			dha_pad = torch.ones_like(text) * -1
			_, t1 = text.shape
			t1 += 1 # TODO: as parameter which is same as predictor_bias
			ideal_attn = torch.zeros(B, t1, num_hw+1)
			nth_hw = 0
			for b, (hotword_indx, one_text, length) in enumerate(zip(hotword_indxs, text, text_lengths)):
			ideal_attn[b][:,-1] = 1
			dha_pad[b][:length] = 8405
			if hotword_indx[0] != -1:
			start, end = int(hotword_indx[0]), int(hotword_indx[1])
			hotword = one_text[start: end+1]
			hotword_list.append(hotword)
			hotword_lengths.append(end-start+1)
			ideal_attn[b][start:end+1, nth_hw] = 1
			ideal_attn[b][start:end+1, -1] = 0
			dha_pad[b][start: end+1] = one_text[start: end+1]
			nth_hw += 1
			if len(hotword_indx) == 4 and hotword_indx[2] != -1:
			# the second hotword if exist
			start, end = int(hotword_indx[2]), int(hotword_indx[3])
			hotword_list.append(one_text[start: end+1])
			hotword_lengths.append(end-start+1)
			ideal_attn[b][start:end+1, nth_hw-1] = 1
			ideal_attn[b][start:end+1, -1] = 0
			dha_pad[b][start: end+1] = one_text[start: end+1]
			nth_hw += 1
			hotword_list.append(torch.tensor([1]))
			hotword_lengths.append(1)
			@@ -71,8 +68,7 @@
			padding_value=0)
			batch["hotword_pad"] = hotword_pad
			batch["hotword_lengths"] = torch.tensor(hotword_lengths, dtype=torch.int32)
			batch['ideal_attn'] = ideal_attn
			batch['dha_pad'] = dha_pad
			del batch['hotword_indxs']
			del batch['hotword_indxs_lengths']

			return keys, batch

			@@ -16,7 +16,7 @@
			#### Server Deployment

			```shell
			cd funasr/runtime/python/websocket
			cd runtime/python/websocket
			python funasr_wss_server.py --port 10095
			```

			@@ -161,4 +161,4 @@
			cd egs/aishell/paraformer
			. ./run.sh --CUDA_VISIBLE_DEVICES="0,1" --gpu_num=2
			```
			More examples could be found in [docs](https://alibaba-damo-academy.github.io/FunASR/en/modelscope_pipeline/quick_start.html)
			More examples could be found in [docs](https://alibaba-damo-academy.github.io/FunASR/en/modelscope_pipeline/quick_start.html)

			@@ -17,7 +17,7 @@

			##### 服务端部署
			```shell
			cd funasr/runtime/python/websocket
			cd runtime/python/websocket
			python funasr_wss_server.py --port 10095
			```

			@@ -161,4 +161,4 @@
			. ./run.sh --CUDA_VISIBLE_DEVICES="0,1" --gpu_num=2
			```

			更多例子可以参考（[点击此处](https://alibaba-damo-academy.github.io/FunASR/en/academic_recipe/asr_recipe.html)）
			更多例子可以参考（[点击此处](https://alibaba-damo-academy.github.io/FunASR/en/academic_recipe/asr_recipe.html)）

			@@ -94,7 +94,9 @@
			--punc-quant: True for quantized PUNC model, False for non-quantized PUNC model. Default is True.
			--itn-dir modelscope model ID or local model path.
			--port: Port number that the server listens on. Default is 10095.
			--decoder-thread-num: Number of inference threads that the server starts. Default is 8.
			--decoder-thread-num: The number of thread pools on the server side that can handle concurrent requests. The default value is 8.
			--model-thread-num: The number of internal threads for each recognition route to control the parallelism of the ONNX model.
			The default value is 1. It is recommended that decoder-thread-num * model-thread-num equals the total number of threads.
			--io-thread-num: Number of IO threads that the server starts. Default is 1.
			--certfile <string>: SSL certificate file. Default is ../../../ssl_key/server.crt. If you want to close ssl，set 0
			--keyfile <string>: SSL key file. Default is ../../../ssl_key/server.key.

			@@ -73,7 +73,9 @@
			--punc-quant: True for quantized PUNC model, False for non-quantized PUNC model. Default is True.
			--itn-dir modelscope model ID or local model path.
			--port: Port number that the server listens on. Default is 10095.
			--decoder-thread-num: Number of inference threads that the server starts. Default is 8.
			--decoder-thread-num: The number of thread pools on the server side that can handle concurrent requests. The default value is 8.
			--model-thread-num: The number of internal threads for each recognition route to control the parallelism of the ONNX model.
			The default value is 1. It is recommended that decoder-thread-num * model-thread-num equals the total number of threads.
			--io-thread-num: Number of IO threads that the server starts. Default is 1.
			--certfile <string>: SSL certificate file. Default is ../../../ssl_key/server.crt. If you want to close ssl，set 0
			--keyfile <string>: SSL key file. Default is ../../../ssl_key/server.key.

			@@ -158,7 +158,9 @@
			--punc-quant True为量化PUNC模型，False为非量化PUNC模型，默认是True
			--itn-dir modelscope model ID 或者本地模型路径
			--port 服务端监听的端口号，默认为 10095
			--decoder-thread-num 服务端启动的推理线程数，默认为 8
			--decoder-thread-num 服务端线程池个数(支持的最大并发路数)，默认为 8
			--model-thread-num 每路识别的内部线程数(控制ONNX模型的并行)，默认为 1，
			其中建议 decoder-thread-num*model-thread-num 等于总线程数
			--io-thread-num 服务端启动的IO线程数，默认为 1
			--certfile ssl的证书文件，默认为：../../../ssl_key/server.crt，如果需要关闭ssl，参数设置为0
			--keyfile ssl的密钥文件，默认为：../../../ssl_key/server.key

			@@ -175,11 +175,14 @@
			--lm-dir modelscope model ID 或者本地模型路径
			--itn-dir modelscope model ID 或者本地模型路径
			--port 服务端监听的端口号，默认为 10095
			--decoder-thread-num 服务端启动的推理线程数，默认为 8
			--decoder-thread-num 服务端线程池个数(支持的最大并发路数)，默认为 8
			--model-thread-num 每路识别的内部线程数(控制ONNX模型的并行)，默认为 1，
			其中建议 decoder-thread-num*model-thread-num 等于总线程数
			--io-thread-num 服务端启动的IO线程数，默认为 1
			--certfile ssl的证书文件，默认为：../../../ssl_key/server.crt，如果需要关闭ssl，参数设置为0
			--keyfile ssl的密钥文件，默认为：../../../ssl_key/server.key
			--hotword 热词文件路径，每行一个热词，格式：热词权重(例如:阿里巴巴 20)，如果客户端提供热词，则与客户端提供的热词合并一起使用。
			--hotword 热词文件路径，每行一个热词，格式：热词权重(例如:阿里巴巴 20)，
			如果客户端提供热词，则与客户端提供的热词合并一起使用，服务端热词全局生效，客户端热词只针对对应客户端生效。
			```

			### 关闭FunASR服务

			@@ -111,7 +111,9 @@
			--punc-quant: True for quantized PUNC model, False for non-quantized PUNC model. Default is True.
			--itn-dir modelscope model ID or local model path.
			--port: Port number that the server listens on. Default is 10095.
			--decoder-thread-num: Number of inference threads that the server starts. Default is 8.
			--decoder-thread-num: The number of thread pools on the server side that can handle concurrent requests. The default value is 8.
			--model-thread-num: The number of internal threads for each recognition route to control the parallelism of the ONNX model.
			The default value is 1. It is recommended that decoder-thread-num * model-thread-num equals the total number of threads.
			--io-thread-num: Number of IO threads that the server starts. Default is 1.
			--certfile <string>: SSL certificate file. Default is ../../../ssl_key/server.crt. If you want to close ssl，set 0
			--keyfile <string>: SSL key file. Default is ../../../ssl_key/server.key.

			@@ -120,11 +120,14 @@
			--punc-quant True为量化PUNC模型，False为非量化PUNC模型，默认是True
			--itn-dir modelscope model ID 或者本地模型路径
			--port 服务端监听的端口号，默认为 10095
			--decoder-thread-num 服务端启动的推理线程数，默认为 8
			--decoder-thread-num 服务端线程池个数(支持的最大并发路数)，默认为 8
			--model-thread-num 每路识别的内部线程数(控制ONNX模型的并行)，默认为 1，
			其中建议 decoder-thread-num*model-thread-num 等于总线程数
			--io-thread-num 服务端启动的IO线程数，默认为 1
			--certfile ssl的证书文件，默认为：../../../ssl_key/server.crt，如果需要关闭ssl，参数设置为0
			--keyfile ssl的密钥文件，默认为：../../../ssl_key/server.key
			--hotword 热词文件路径，每行一个热词，格式：热词权重(例如:阿里巴巴 20)，如果客户端提供热词，则与客户端提供的热词合并一起使用。
			--hotword 热词文件路径，每行一个热词，格式：热词权重(例如:阿里巴巴 20)，
			如果客户端提供热词，则与客户端提供的热词合并一起使用，服务端热词全局生效，客户端热词只针对对应客户端生效。
			```

			### 关闭FunASR服务

			@@ -16,7 +16,7 @@
			### Install the requirements for server

			```shell
			cd funasr/runtime/python/websocket
			cd runtime/python/websocket
			pip install -r requirements_server.txt
			```

			@@ -53,13 +53,13 @@
			help="cpu cores")
			parser.add_argument("--certfile",
			type=str,
			default="../ssl_key/server.crt",
			default="../../ssl_key/server.crt",
			required=False,
			help="certfile for ssl")

			parser.add_argument("--keyfile",
			type=str,
			default="../ssl_key/server.key",
			default="../../ssl_key/server.key",
			required=False,
			help="keyfile for ssl")
			args = parser.parse_args()