From ede3d963f512d47b781b6fa726a684030bed998f Mon Sep 17 00:00:00 2001 From: "dingfeng.wong" Date: Wed, 23 Jul 2025 13:56:00 +0800 Subject: [PATCH] a --- pyproject.toml | 5 +- realtimesst.log | 183 ++++++++++++++++++++++++++++++++++++++++++++++++ uv.lock | 22 ++++-- 3 files changed, 204 insertions(+), 6 deletions(-) diff --git a/pyproject.toml b/pyproject.toml index 2ec0a18..66e8af7 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -14,8 +14,8 @@ dependencies = [ "typer>=0.12.0", "rich>=13.0.0", "rumps>=0.4.0", - "realtimestt>=0.3.104", "pynput>=1.7.6", + "realtimestt", ] [project.optional-dependencies] @@ -44,3 +44,6 @@ build-backend = "hatchling.build" dev = [ "open-webui>=0.6.5", ] + +[tool.uv.sources] +realtimestt = { path = "../../projects/RealtimeSTT" } diff --git a/realtimesst.log b/realtimesst.log index a8b4b77..ed972a4 100644 --- a/realtimesst.log +++ b/realtimesst.log @@ -1789,3 +1789,186 @@ ValueError: unsupported device mps 2025-07-23 12:45:21.659 - RealTimeSTT: realtimestt - INFO - Setting listen time 2025-07-23 12:45:21.659 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'listening' 2025-07-23 12:45:21.659 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording start +2025-07-23 12:45:43.020 - RealTimeSTT: realtimestt - INFO - voice activity detected +2025-07-23 12:45:43.020 - RealTimeSTT: realtimestt - INFO - recording started +2025-07-23 12:45:43.020 - RealTimeSTT: realtimestt - INFO - State changed from 'listening' to 'recording' +2025-07-23 12:45:43.021 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording stop +2025-07-23 12:45:43.043 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 16896 +2025-07-23 12:45:43.385 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: 2. +2025-07-23 12:45:43.385 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 22016 +2025-07-23 12:45:43.722 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: So don't... +2025-07-23 12:45:43.722 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 27136 +2025-07-23 12:45:44.097 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: soon on next one +2025-07-23 12:45:44.097 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 33280 +2025-07-23 12:45:44.556 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: So don't make so much of it. +2025-07-23 12:45:44.621 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 42496 +2025-07-23 12:45:44.997 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: So don't make so much review. +2025-07-23 12:45:44.997 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 47616 +2025-07-23 12:45:45.399 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: So don't make so much review switch. +2025-07-23 12:45:45.643 - RealTimeSTT: realtimestt - INFO - recording stopped +2025-07-23 12:45:45.644 - RealTimeSTT: realtimestt - DEBUG - No samples removed, final audio length: 58368 +2025-07-23 12:45:45.644 - RealTimeSTT: realtimestt - INFO - State changed from 'recording' to 'inactive' +2025-07-23 12:45:45.648 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'transcribing' +2025-07-23 12:45:45.648 - RealTimeSTT: realtimestt - DEBUG - Adding transcription request, no early transcription started +2025-07-23 12:45:45.649 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:45:45.758 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:45:45.862 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:45:45.963 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:45:46.064 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:45:46.166 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:45:46.198 - RealTimeSTT: realtimestt - INFO - State changed from 'transcribing' to 'inactive' +2025-07-23 12:45:46.226 - RealTimeSTT: realtimestt - DEBUG - Model base completed transcription in 0.58 seconds +2025-07-23 12:45:46.237 - RealTimeSTT: realtimestt - INFO - Setting listen time +2025-07-23 12:45:46.237 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'listening' +2025-07-23 12:45:46.237 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording start +2025-07-23 12:45:58.523 - RealTimeSTT: realtimestt - INFO - voice activity detected +2025-07-23 12:45:58.526 - RealTimeSTT: realtimestt - INFO - recording started +2025-07-23 12:45:58.526 - RealTimeSTT: realtimestt - INFO - State changed from 'listening' to 'recording' +2025-07-23 12:45:58.526 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording stop +2025-07-23 12:45:58.548 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 16896 +2025-07-23 12:46:00.542 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: Shit. +2025-07-23 12:46:00.543 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 48640 +2025-07-23 12:46:02.346 - RealTimeSTT: realtimestt - INFO - recording stopped +2025-07-23 12:46:02.349 - RealTimeSTT: realtimestt - DEBUG - No samples removed, final audio length: 77824 +2025-07-23 12:46:02.350 - RealTimeSTT: realtimestt - INFO - State changed from 'recording' to 'inactive' +2025-07-23 12:46:02.448 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'transcribing' +2025-07-23 12:46:02.450 - RealTimeSTT: realtimestt - DEBUG - Adding transcription request, no early transcription started +2025-07-23 12:46:02.462 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:02.601 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:02.756 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:02.823 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: Sudo next OS +2025-07-23 12:46:02.857 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:02.958 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:03.053 - RealTimeSTT: realtimestt - INFO - State changed from 'transcribing' to 'inactive' +2025-07-23 12:46:03.062 - RealTimeSTT: realtimestt - DEBUG - Model base completed transcription in 0.61 seconds +2025-07-23 12:46:03.086 - RealTimeSTT: realtimestt - INFO - Setting listen time +2025-07-23 12:46:03.086 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'listening' +2025-07-23 12:46:03.087 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording start +2025-07-23 12:46:10.411 - RealTimeSTT: realtimestt - INFO - voice activity detected +2025-07-23 12:46:10.411 - RealTimeSTT: realtimestt - INFO - recording started +2025-07-23 12:46:10.411 - RealTimeSTT: realtimestt - INFO - State changed from 'listening' to 'recording' +2025-07-23 12:46:10.411 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording stop +2025-07-23 12:46:10.425 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 16896 +2025-07-23 12:46:11.907 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: S. +2025-07-23 12:46:11.908 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 40448 +2025-07-23 12:46:13.683 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: pseudo nixo +2025-07-23 12:46:14.122 - RealTimeSTT: realtimestt - INFO - recording stopped +2025-07-23 12:46:14.126 - RealTimeSTT: realtimestt - DEBUG - No samples removed, final audio length: 75776 +2025-07-23 12:46:14.126 - RealTimeSTT: realtimestt - INFO - State changed from 'recording' to 'inactive' +2025-07-23 12:46:14.155 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'transcribing' +2025-07-23 12:46:14.156 - RealTimeSTT: realtimestt - DEBUG - Adding transcription request, no early transcription started +2025-07-23 12:46:14.183 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:14.352 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:14.474 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:14.575 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:14.676 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:14.776 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:14.785 - RealTimeSTT: realtimestt - INFO - State changed from 'transcribing' to 'inactive' +2025-07-23 12:46:14.834 - RealTimeSTT: realtimestt - DEBUG - Model base completed transcription in 0.68 seconds +2025-07-23 12:46:14.857 - RealTimeSTT: realtimestt - INFO - Setting listen time +2025-07-23 12:46:14.857 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'listening' +2025-07-23 12:46:14.857 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording start +2025-07-23 12:46:34.926 - RealTimeSTT: realtimestt - INFO - voice activity detected +2025-07-23 12:46:34.926 - RealTimeSTT: realtimestt - INFO - recording started +2025-07-23 12:46:34.926 - RealTimeSTT: realtimestt - INFO - State changed from 'listening' to 'recording' +2025-07-23 12:46:34.926 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording stop +2025-07-23 12:46:34.929 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 16896 +2025-07-23 12:46:36.854 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: Forty +2025-07-23 12:46:36.855 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 47616 +2025-07-23 12:46:37.871 - RealTimeSTT: realtimestt - INFO - recording stopped +2025-07-23 12:46:37.875 - RealTimeSTT: realtimestt - DEBUG - No samples removed, final audio length: 63488 +2025-07-23 12:46:37.875 - RealTimeSTT: realtimestt - INFO - State changed from 'recording' to 'inactive' +2025-07-23 12:46:37.893 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'transcribing' +2025-07-23 12:46:37.894 - RealTimeSTT: realtimestt - DEBUG - Adding transcription request, no early transcription started +2025-07-23 12:46:37.901 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:38.195 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:38.296 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:38.401 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:38.505 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:46:38.542 - RealTimeSTT: realtimestt - INFO - State changed from 'transcribing' to 'inactive' +2025-07-23 12:46:38.560 - RealTimeSTT: realtimestt - DEBUG - Model base completed transcription in 0.67 seconds +2025-07-23 12:46:38.611 - RealTimeSTT: realtimestt - INFO - Setting listen time +2025-07-23 12:46:38.611 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'listening' +2025-07-23 12:46:38.612 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording start +2025-07-23 12:46:38.988 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: for the STT status bar +2025-07-23 12:46:54.442 - RealTimeSTT: realtimestt - INFO - voice activity detected +2025-07-23 12:46:54.442 - RealTimeSTT: realtimestt - INFO - recording started +2025-07-23 12:46:54.442 - RealTimeSTT: realtimestt - INFO - State changed from 'listening' to 'recording' +2025-07-23 12:46:54.445 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording stop +2025-07-23 12:46:54.457 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 16896 +2025-07-23 12:46:56.312 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: Huh? +2025-07-23 12:46:56.312 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 46592 +2025-07-23 12:46:57.880 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: How can I use your body? +2025-07-23 12:46:57.880 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 71168 +2025-07-23 12:46:59.693 - RealTimeSTT: realtimestt - INFO - recording stopped +2025-07-23 12:46:59.700 - RealTimeSTT: realtimestt - DEBUG - No samples removed, final audio length: 100352 +2025-07-23 12:46:59.700 - RealTimeSTT: realtimestt - INFO - State changed from 'recording' to 'inactive' +2025-07-23 12:46:59.780 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'transcribing' +2025-07-23 12:46:59.782 - RealTimeSTT: realtimestt - DEBUG - Adding transcription request, no early transcription started +2025-07-23 12:46:59.805 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:47:00.095 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:47:00.197 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:47:00.198 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: How can I use Yabai SK hit? +2025-07-23 12:47:00.298 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:47:00.399 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:47:00.401 - RealTimeSTT: realtimestt - INFO - State changed from 'transcribing' to 'inactive' +2025-07-23 12:47:00.405 - RealTimeSTT: realtimestt - DEBUG - Model base completed transcription in 0.62 seconds +2025-07-23 12:47:00.453 - RealTimeSTT: realtimestt - INFO - Setting listen time +2025-07-23 12:47:00.453 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'listening' +2025-07-23 12:47:00.455 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording start +2025-07-23 12:47:02.765 - RealTimeSTT: realtimestt - INFO - voice activity detected +2025-07-23 12:47:02.766 - RealTimeSTT: realtimestt - INFO - recording started +2025-07-23 12:47:02.766 - RealTimeSTT: realtimestt - INFO - State changed from 'listening' to 'recording' +2025-07-23 12:47:02.766 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording stop +2025-07-23 12:47:02.774 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 16896 +2025-07-23 12:47:04.603 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: Paul. +2025-07-23 12:47:04.877 - RealTimeSTT: realtimestt - INFO - recording stopped +2025-07-23 12:47:04.879 - RealTimeSTT: realtimestt - DEBUG - No samples removed, final audio length: 50176 +2025-07-23 12:47:04.879 - RealTimeSTT: realtimestt - INFO - State changed from 'recording' to 'inactive' +2025-07-23 12:47:04.904 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'transcribing' +2025-07-23 12:47:04.905 - RealTimeSTT: realtimestt - DEBUG - Adding transcription request, no early transcription started +2025-07-23 12:47:04.916 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:47:05.194 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:47:05.296 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:47:05.397 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:47:05.416 - RealTimeSTT: realtimestt - INFO - State changed from 'transcribing' to 'inactive' +2025-07-23 12:47:05.464 - RealTimeSTT: realtimestt - DEBUG - Model base completed transcription in 0.56 seconds +2025-07-23 12:47:05.487 - RealTimeSTT: realtimestt - INFO - Setting listen time +2025-07-23 12:47:05.487 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'listening' +2025-07-23 12:47:05.488 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording start +2025-07-23 12:47:12.042 - RealTimeSTT: realtimestt - INFO - voice activity detected +2025-07-23 12:47:12.042 - RealTimeSTT: realtimestt - INFO - recording started +2025-07-23 12:47:12.043 - RealTimeSTT: realtimestt - INFO - State changed from 'listening' to 'recording' +2025-07-23 12:47:12.043 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording stop +2025-07-23 12:47:12.088 - RealTimeSTT: realtimestt - DEBUG - Current realtime buffer size: 16896 +2025-07-23 12:47:13.706 - RealTimeSTT: realtimestt - INFO - recording stopped +2025-07-23 12:47:13.708 - RealTimeSTT: realtimestt - DEBUG - No samples removed, final audio length: 43008 +2025-07-23 12:47:13.708 - RealTimeSTT: realtimestt - INFO - State changed from 'recording' to 'inactive' +2025-07-23 12:47:13.775 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'transcribing' +2025-07-23 12:47:13.776 - RealTimeSTT: realtimestt - DEBUG - Adding transcription request, no early transcription started +2025-07-23 12:47:13.796 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:47:14.100 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:47:14.168 - RealTimeSTT: realtimestt - DEBUG - Realtime text detected: This +2025-07-23 12:47:14.202 - RealTimeSTT: realtimestt - DEBUG - Receive from parent_transcription_pipe after sendiung transcription request, transcribe_count: 1 +2025-07-23 12:47:14.283 - RealTimeSTT: realtimestt - INFO - State changed from 'transcribing' to 'inactive' +2025-07-23 12:47:14.308 - RealTimeSTT: realtimestt - DEBUG - Model base completed transcription in 0.53 seconds +2025-07-23 12:47:14.372 - RealTimeSTT: realtimestt - INFO - Setting listen time +2025-07-23 12:47:14.372 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'listening' +2025-07-23 12:47:14.373 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording start +2025-07-23 12:48:23.629 - RealTimeSTT: realtimestt - DEBUG - No samples removed, final audio length: 0 +2025-07-23 12:48:23.631 - RealTimeSTT: realtimestt - INFO - State changed from 'listening' to 'inactive' +2025-07-23 12:55:04.678 - RealTimeSTT: realtimestt - INFO - Starting RealTimeSTT +2025-07-23 12:55:04.680 - RealTimeSTT: realtimestt - INFO - Using Apple Metal Performance Shaders (MPS) +2025-07-23 12:55:04.690 - RealTimeSTT: realtimestt - INFO - Initializing audio recording (creating pyAudio input stream, sample rate: 16000 buffer size: 512 +2025-07-23 12:55:04.695 - RealTimeSTT: realtimestt - INFO - Initializing faster_whisper realtime transcription model tiny, default device: mps, compute type: default, device index: 0, download root: None +2025-07-23 12:55:05.423 - RealTimeSTT: realtimestt - DEBUG - Faster_whisper realtime speech to text transcription model initialized successfully +2025-07-23 12:55:05.423 - RealTimeSTT: realtimestt - INFO - Initializing WebRTC voice with Sensitivity 3 +2025-07-23 12:55:05.423 - RealTimeSTT: realtimestt - DEBUG - WebRTC VAD voice activity detection engine initialized successfully +2025-07-23 12:55:06.044 - RealTimeSTT: realtimestt - DEBUG - Silero VAD voice activity detection engine initialized successfully +2025-07-23 12:55:06.044 - RealTimeSTT: realtimestt - DEBUG - Starting realtime worker +2025-07-23 12:55:06.044 - RealTimeSTT: realtimestt - DEBUG - Waiting for main transcription model to start +2025-07-23 12:55:09.657 - RealTimeSTT: realtimestt - DEBUG - Main transcription model ready +2025-07-23 12:55:09.658 - RealTimeSTT: realtimestt - DEBUG - RealtimeSTT initialization completed successfully +2025-07-23 12:55:09.658 - RealTimeSTT: realtimestt - INFO - Setting listen time +2025-07-23 12:55:09.658 - RealTimeSTT: realtimestt - INFO - State changed from 'inactive' to 'listening' +2025-07-23 12:55:09.659 - RealTimeSTT: realtimestt - DEBUG - Waiting for recording start diff --git a/uv.lock b/uv.lock index 5d4e5f8..55bb145 100644 --- a/uv.lock +++ b/uv.lock @@ -5566,7 +5566,7 @@ wheels = [ [[package]] name = "realtimestt" version = "0.3.104" -source = { registry = "https://pypi.org/simple" } +source = { directory = "../../projects/RealtimeSTT" } dependencies = [ { name = "faster-whisper" }, { name = "halo" }, @@ -5581,9 +5581,21 @@ dependencies = [ { name = "websocket-client" }, { name = "websockets" }, ] -sdist = { url = "https://files.pythonhosted.org/packages/29/15/70c63317462a153ae46a1857e35b21c4de94729f56d8f1b899fbc5ff3b52/realtimestt-0.3.104.tar.gz", hash = "sha256:96bafae0e839c3b60729462cf760c5fc104569c9839fc1071b5afecc1a2b351f", size = 118257, upload-time = "2025-05-03T21:47:33.78Z" } -wheels = [ - { url = "https://files.pythonhosted.org/packages/cf/24/df28da0f3c5f0d4760e1492e7cee937e0aa72897d4cc41a36ee8c46af5c1/realtimestt-0.3.104-py3-none-any.whl", hash = "sha256:d0a4030551afa3d54b729d94f8a23cca800ef0b21e7778e84ab7ece014c9135f", size = 110633, upload-time = "2025-05-03T21:47:32.59Z" }, + +[package.metadata] +requires-dist = [ + { name = "faster-whisper", specifier = "==1.1.1" }, + { name = "halo", specifier = "==0.0.31" }, + { name = "openwakeword", specifier = ">=0.4.0" }, + { name = "pvporcupine", specifier = "==1.9.5" }, + { name = "pyaudio", specifier = "==0.2.14" }, + { name = "scipy", specifier = "==1.15.2" }, + { name = "soundfile", specifier = "==0.13.1" }, + { name = "torch", specifier = ">=2.7.1" }, + { name = "torchaudio", specifier = ">=2.7.1" }, + { name = "webrtcvad-wheels", specifier = "==2.0.14" }, + { name = "websocket-client", specifier = "==1.8.0" }, + { name = "websockets", specifier = "==15.0.1" }, ] [[package]] @@ -6377,7 +6389,7 @@ requires-dist = [ { name = "pyscreenshot", marker = "extra == 'screenshot-all'", specifier = ">=3.1" }, { name = "pyscreenshot", marker = "extra == 'screenshot-multi'", specifier = ">=3.1" }, { name = "python-doctr", specifier = ">=0.8.0" }, - { name = "realtimestt", specifier = ">=0.3.104" }, + { name = "realtimestt", directory = "../../projects/RealtimeSTT" }, { name = "rich", specifier = ">=13.0.0" }, { name = "rumps", specifier = ">=0.4.0" }, { name = "typer", specifier = ">=0.12.0" },