python/FunASR-XL.git

			@@ -1,9 +1,7 @@
			import pyaudio
			# import websocket  # unlike the server side, the client here would use the websocket-client library
			# -*- encoding: utf-8 -*-
			import time
			import websockets
			import asyncio
			from queue import Queue
			# import threading
			import argparse
			import json
			@@ -30,12 +28,13 @@

			args = parser.parse_args()

			# voices = asyncio.Queue()
			from queue import Queue
			voices = Queue()



			# Other functions can send data by calling send(data), for example:
			async def record():
			async def record_microphone():
			import pyaudio
			#print("2")
			global voices
			FORMAT = pyaudio.paInt16
			@@ -50,17 +49,60 @@
			rate=RATE,
			input=True,
			frames_per_buffer=CHUNK)

			is_speaking = True
			while True:

			data = stream.read(CHUNK)
			data = data.decode('ISO-8859-1')
			message = json.dumps({"chunk": args.chunk_size, "is_speaking": is_speaking, "audio": data})

			voices.put(data)
			voices.put(message)
			#print(voices.qsize())

			await asyncio.sleep(0.01)

			await asyncio.sleep(0.005)

			# Other functions can send data by calling send(data), for example:
			async def record_from_scp():
			    """Read audio from a wav file or an .scp list and queue it chunk by chunk.

			    ``args.audio_in`` is either a single wav path or, when it ends with
			    ``.scp``, a text file with one entry per line. Each entry is
			    ``<path>`` or ``<key> <path>``; when more than one whitespace-separated
			    token is present the second one is used as the path.

			    Every wav is cut into pieces covering ``args.chunk_size`` milliseconds.
			    Each piece is wrapped in a JSON message with the keys ``chunk``,
			    ``is_speaking`` and ``audio`` and put on the global ``voices`` queue.
			    ``is_speaking`` is ``False`` only on the last piece of a file. After
			    each piece the coroutine sleeps for the chunk duration.

			    Raises:
			        ValueError: if ``args.chunk_size`` is too small to yield at least
			            one byte per chunk.
			    """
			    import wave
			    global voices

			    # NOTE(review): the chunk size in bytes assumes 16 kHz, 16-bit mono PCM;
			    # the wav header is not checked against this -- confirm with the server.
			    sample_rate = 16000
			    bytes_per_sample = 2

			    if args.audio_in.endswith(".scp"):
			        # Close the list file as soon as it has been read.
			        with open(args.audio_in) as f_scp:
			            wavs = f_scp.readlines()
			    else:
			        wavs = [args.audio_in]

			    for wav in wavs:
			        wav_splits = wav.strip().split()
			        if not wav_splits:
			            # Blank line in the list: nothing to send.
			            continue
			        wav_path = wav_splits[1] if len(wav_splits) > 1 else wav_splits[0]

			        # readframes() returns only the sample data, without the wav header.
			        with wave.open(wav_path, "rb") as wav_file:
			            audio_bytes = wav_file.readframes(wav_file.getnframes())

			        # Bytes per chunk: milliseconds -> seconds -> samples -> bytes.
			        stride = int(args.chunk_size / 1000 * sample_rate * bytes_per_sample)
			        if stride <= 0:
			            raise ValueError(
			                "chunk_size of {} ms is too small to form an audio chunk".format(
			                    args.chunk_size
			                )
			            )
			        # Ceiling division, so a trailing partial chunk is still sent.
			        chunk_num = (len(audio_bytes) - 1) // stride + 1
			        print(stride)

			        is_speaking = True
			        for i in range(chunk_num):
			            if i == chunk_num - 1:
			                # Flag the last chunk of this file in the message.
			                is_speaking = False
			            beg = i * stride
			            data = audio_bytes[beg:beg + stride]
			            # ISO-8859-1 maps each byte to one code point, so the raw audio
			            # can be carried inside a JSON string.
			            data = data.decode('ISO-8859-1')
			            message = json.dumps({"chunk": args.chunk_size, "is_speaking": is_speaking, "audio": data})
			            voices.put(message)

			            # Pace the producer at one chunk per chunk duration.
			            await asyncio.sleep(args.chunk_size / 1000)


			async def ws_send():
			global voices
			@@ -74,8 +116,8 @@
			await websocket.send(data) # 通过ws对象发送数据
			except Exception as e:
			print('Exception occurred:', e)
			await asyncio.sleep(0.01)
			await asyncio.sleep(0.01)
			await asyncio.sleep(0.005)
			await asyncio.sleep(0.005)



			@@ -97,7 +139,10 @@
			uri = "ws://{}:{}".format(args.host, args.port)
			#ws = await websockets.connect(uri, subprotocols=["binary"]) # 创建一个长连接
			async for websocket in websockets.connect(uri, subprotocols=["binary"], ping_interval=None):
			task = asyncio.create_task(record()) # 创建一个后台任务录音
			if args.audio_in is not None:
			task = asyncio.create_task(record_from_scp()) # 创建一个后台任务录音
			else:
			task = asyncio.create_task(record_microphone()) # 创建一个后台任务录音
			task2 = asyncio.create_task(ws_send()) # 创建一个后台任务发送
			task3 = asyncio.create_task(message()) # 创建一个后台接收消息的任务
			await asyncio.gather(task, task2, task3)