feat(engine): 重构字幕引擎，新增 Sherpa-ONNX SenseVoice 语音识别模型

- 重构字幕引擎，将音频采集改为在新线程上进行 - 重构 audio2text 中的类，调整运行逻辑 - 更新 main 函数，添加对 Sosv 模型的支持 - 修改 AudioStream 类，默认使用 16000Hz 采样率
2026-02-04 04:14:42 +08:00 · 2025-09-06 20:49:46 +08:00
parent 2b7ce06f04
commit eba2c5ca45
14 changed files with 377 additions and 112 deletions
--- a/engine/utils/server.py
+++ b/engine/utils/server.py
@@ -1,13 +1,12 @@
 import socket
 import threading
 import json
-# import time
-from utils import thread_data, stdout_cmd, stderr
+from utils import shared_data, stdout_cmd, stderr


 def handle_client(client_socket):
-    global thread_data
-    while thread_data.status == 'running':
+    global shared_data
+    while shared_data.status == 'running':
        try:
            data = client_socket.recv(4096).decode('utf-8')
            if not data:
@@ -15,13 +14,13 @@ def handle_client(client_socket):
            data = json.loads(data)

            if data['command'] == 'stop':
-                thread_data.status = 'stop'
+                shared_data.status = 'stop'
                break
        except Exception as e:
            stderr(f'Communication error: {e}')
            break
    
-    thread_data.status = 'stop'
+    shared_data.status = 'stop'
    client_socket.close()


@@ -34,7 +33,6 @@ def start_server(port: int):
        stderr(str(e))
        stdout_cmd('kill')
        return
-    # time.sleep(20)
    stdout_cmd('connect')

    client, addr = server.accept()