refactor(项目): 尝试 Python 语音识别和内容发送

This commit is contained in:
himeditator
2025-06-17 21:26:16 +08:00
parent 1e83ad2199
commit d1bee65ae1
11 changed files with 158 additions and 357 deletions

View File

@@ -1,17 +1,23 @@
import asyncio
from sysaudio.win import LoopbackStream, mergeStreamChannels
from audio2text.gummy import GummyTranslator
def main():
    """Forward captured loopback audio to the Gummy translator.

    Opens a ``LoopbackStream``, starts a ``GummyTranslator`` built from the
    stream's ``RATE`` and the ``"zh"`` / ``"en"`` arguments, then reads a
    fixed number of chunks from the stream, merges their channels with
    ``mergeStreamChannels`` and sends each merged frame to the translator.

    The translator is always stopped and the stream always closed once they
    have been started/opened, even when reading or sending raises.
    """
    loopback = LoopbackStream()
    loopback.openStream()
    try:
        # NOTE(review): "zh" / "en" are presumably the source and target
        # languages -- confirm against GummyTranslator's signature.
        gummy = GummyTranslator(loopback.RATE, "zh", "en")
        gummy.translator.start()
        try:
            # Fixed-length trial run: 400 chunk reads, then shut down.
            for _ in range(400):
                # No usable stream object: skip this iteration rather than
                # calling read() on a falsy value.
                if not loopback.stream:
                    continue
                data = loopback.stream.read(loopback.CHUNK)
                data = mergeStreamChannels(data, loopback.CHANNELS)
                gummy.translator.send_audio_frame(data)
        finally:
            gummy.translator.stop()
    finally:
        # Runs even if creating, starting or stopping the translator fails,
        # so the opened stream is not leaked.
        loopback.closeStream()


if __name__ == "__main__":
    main()