GlocKieHuan
2023-08-29 682919c502c543198f566ebcc63340e16062c135
Supports hotwords and timestamps (#900)

* add cshape client

* delete

* Add wss-client

* Supports hot words and time stamps

Supports hot words and time stamps

* Update README.md

* Add files via upload

* Add files via upload
3个文件已修改
1个文件已添加
102 ■■■■■ 已修改文件
funasr/runtime/wss-client/FunASRWSClient_Offline/Program.cs 30 ●●●●● 补丁 | 查看 | 原始文档 | blame | 历史
funasr/runtime/wss-client/FunASRWSClient_Offline/README.md 4 ●●● 补丁 | 查看 | 原始文档 | blame | 历史
funasr/runtime/wss-client/FunASRWSClient_Offline/WebScoketClient.cs 65 ●●●●● 补丁 | 查看 | 原始文档 | blame | 历史
funasr/runtime/wss-client/confg/hotword.txt 3 ●●●●● 补丁 | 查看 | 原始文档 | blame | 历史
funasr/runtime/wss-client/FunASRWSClient_Offline/Program.cs
@@ -19,11 +19,13 @@
    {
        public static string host = "0.0.0.0";
        public static string port = "10095";
        public static string hotword = null;
        private static CWebSocketClient m_websocketclient = new CWebSocketClient();
        [STAThread]
        public async void FunASR_Main()
        {
            loadconfig();
            loadhotword();
            //初始化通信连接
            string errorStatus = string.Empty;
            string commstatus = ClientConnTest();
@@ -72,6 +74,34 @@
                    }
                }
            }
        }
        static void loadhotword()
        {
            string filePath = "hotword.txt";
            try
            {
                // 使用 StreamReader 打开文本文件
                using (StreamReader sr = new StreamReader(filePath))
                {
                    string line;
                    // 逐行读取文件内容
                    while ((line = sr.ReadLine()) != null)
                    {
                        hotword += line;
                        hotword += " ";
                    }
                }
            }
            catch (Exception ex)
            {
                Console.WriteLine("读取文件时发生错误:" + ex.Message);
            }
            finally
            {
                if (hotword.Length > 0 && hotword[hotword.Length - 1] == ' ')
                    hotword = hotword.Substring(0,hotword.Length - 1);
            }
        }
        private static string ClientConnTest()
        {
funasr/runtime/wss-client/FunASRWSClient_Offline/README.md
@@ -6,4 +6,6 @@
配置好服务端ip和端口号,在vs中打开需添加Websocket.Client的Nuget程序包后,可直接进行测试,按照控制台提示操作即可。
注:本客户端暂支持wav文件,在win11下完成测试,编译环境VS2022。
更新:支持热词和时间戳,热词需将config文件夹下的hotword.txt放置在执行路径下。
注:运行后台须注意热词和时间戳为不同模型,本客户端在win11下完成测试,编译环境VS2022。
funasr/runtime/wss-client/FunASRWSClient_Offline/WebScoketClient.cs
@@ -2,6 +2,7 @@
using System.Text.Json;
using System.Reactive.Linq;
using FunASRWSClient_Offline;
using System.Text.RegularExpressions;
namespace WebSocketSpace
{
@@ -45,15 +46,31 @@
        public async Task<Task> ClientSendFileFunc(string file_name)//文件转录
        {
            string fileExtension = Path.GetExtension(file_name);
            fileExtension = fileExtension.Replace(".", "");
            if (!(fileExtension == "mp3" || fileExtension == "mp4" || fileExtension == "wav" || fileExtension == "pcm"))
                return Task.CompletedTask;
            try
            {
                if (client.IsRunning)
                {
                    if (fileExtension == "wav")
                    {
                    var exitEvent = new ManualResetEvent(false);
                    string path = Path.GetFileName(file_name);
                    string firstbuff = string.Format("{{\"mode\": \"offline\", \"wav_name\": \"{0}\", \"is_speaking\": true}}", Path.GetFileName(file_name));
                        string firstbuff = string.Format("{{\"mode\": \"offline\", \"wav_name\": \"{0}\", \"is_speaking\": true,\"hotwords\":\"{1}\"}}", Path.GetFileName(file_name), WSClient_Offline.hotword);
                    client.Send(firstbuff);
                    showWAVForm(client, file_name);
                    }
                    else
                    {
                        var exitEvent = new ManualResetEvent(false);
                        string path = Path.GetFileName(file_name);
                        string firstbuff = string.Format("{{\"mode\": \"offline\", \"wav_name\": \"{0}\", \"is_speaking\": true,\"hotwords\":\"{1}\", \"wav_format\":\"{2}\"}}", Path.GetFileName(file_name), WSClient_Offline.hotword, fileExtension);
                        client.Send(firstbuff);
                        showWAVForm_All(client, file_name);
                    }
                }
            }
            catch (Exception ex)
@@ -69,15 +86,42 @@
            {
                try
                {
                    string timestamp = string.Empty;
                    JsonDocument jsonDoc = JsonDocument.Parse(message);
                    JsonElement root = jsonDoc.RootElement;
                    string mode = root.GetProperty("mode").GetString();
                    string text = root.GetProperty("text").GetString();
                    string name = root.GetProperty("wav_name").GetString();
                    if(name == "asr_stream")
                        Console.WriteLine($"实时识别内容: {text}");
                    if (message.IndexOf("timestamp") != -1)
                    {
                        Console.WriteLine($"文件名称:{name}");
                        //识别内容处理
                        text = text.Replace(",", "。");
                        text = text.Replace("?", "。");
                        List<string> sens = text.Split("。").ToList();
                        //时间戳处理
                        timestamp = root.GetProperty("timestamp").GetString();
                        List<List<int>> data = new List<List<int>>();
                        string pattern = @"\[(\d+),(\d+)\]";
                        foreach (Match match in Regex.Matches(timestamp, pattern))
                        {
                            int start = int.Parse(match.Groups[1].Value);
                            int end = int.Parse(match.Groups[2].Value);
                            data.Add(new List<int> { start, end });
                        }
                        int count = 0;
                        for (int i = 0; i< sens.Count;  i++)
                        {
                            if (sens[i].Length == 0)
                                continue;
                            Console.WriteLine(string.Format($"[{data[count][0]}-{data[count + sens[i].Length - 1][1]}]:{sens[i]}"));
                            count += sens[i].Length;
                        }
                    }
                    else
                        Console.WriteLine($"文件名称:{name} 文件转录内容: {text}");
                    {
                        Console.WriteLine($"文件名称:{name} 文件转录内容: {text} 时间戳:{timestamp}");
                    }
                }
                catch (JsonException ex)
                {
@@ -100,6 +144,19 @@
            client.Send("{\"is_speaking\": false}");
        }
        private void showWAVForm_All(WebsocketClient client, string file_name)
        {
            byte[] getbyte = FileToByte(file_name).ToArray();
            for (int i = 0; i < getbyte.Length; i += 1024000)
            {
                byte[] send = getbyte.Skip(i).Take(1024000).ToArray();
                client.Send(send);
                Thread.Sleep(5);
            }
            Thread.Sleep(10);
            client.Send("{\"is_speaking\": false}");
        }
        public byte[] FileToByte(string fileUrl)
        {
            try
funasr/runtime/wss-client/confg/hotword.txt
New file
@@ -0,0 +1,3 @@
阿里巴巴
达摩院
FunASR