From 699ae46f06af0a04f0fd5cface2ccb8b7dc29e59 Mon Sep 17 00:00:00 2001 From: Jake Wilkinson Date: Fri, 24 Oct 2025 10:27:05 +0000 Subject: [PATCH] realtime.py voice-to-text added, needs to be integrated --- .gitignore | 1 + realtime.py | 26 ++++++++++++++++++++++++++ 2 files changed, 27 insertions(+) create mode 100644 .gitignore create mode 100644 realtime.py diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..1373935 --- /dev/null +++ b/.gitignore @@ -0,0 +1 @@ +vosk-model-small-en-us-0.15/ diff --git a/realtime.py b/realtime.py new file mode 100644 index 0000000..896c9e6 --- /dev/null +++ b/realtime.py @@ -0,0 +1,26 @@ +import sounddevice as sd +import queue +import sys +import json +from vosk import Model, KaldiRecognizer +model = Model("./vosk-model-small-en-us-0.15") + +rec = KaldiRecognizer(model, 16000) +q = queue.Queue() + +def callback(indata, frames, time, status): + if status: + print(status, file=sys.stderr) + q.put(bytes(indata)) + +with sd.RawInputStream(samplerate=16000, blocksize=8000, dtype='int16', + channels=1, callback=callback): + print("Listening... Speak into the mic.") + while True: + data = q.get() + if rec.AcceptWaveform(data): + result = json.loads(rec.Result()) + print(".", result) + else: + partial = json.loads(rec.PartialResult()) + print("...", partial, end='\r')