onyedikachi-david · January 3, 2025 13:24 · Nov 3, 2024 · Nov 3, 2024 · Nov 3, 2024
diff --git a/mlx_whisper_realtime.py b/mlx_whisper_realtime.py
@@ -1,6 +1,10 @@
-# Required packages:
-# pip install SpeechRecognition mlx-whisper pyaudio
-# Note: This script requires Apple Silicon Mac for MLX Whisper
+# /// script
+# dependencies = [
+#   "SpeechRecognition",
+#   "mlx-whisper",
+#   "pyaudio",
+# ]
+# ///
 
 import speech_recognition as sr
 import numpy as np

diff --git a/gistfile1.txt b/mlx_whisper_realtime.py
diff --git a/gistfile1.txt b/gistfile1.txt
@@ -0,0 +1,30 @@
+# Required packages:
+# pip install SpeechRecognition mlx-whisper pyaudio
+# Note: This script requires Apple Silicon Mac for MLX Whisper
+
+import speech_recognition as sr
+import numpy as np
+import mlx_whisper
+
+r = sr.Recognizer()
+mic = sr.Microphone(sample_rate=16000)
+
+print("Listening...")
+
+try:
+    with mic as source:
+        r.adjust_for_ambient_noise(source)
+        while True:
+            audio = r.listen(source)
+            # Interpret the raw bytes as int16 samples and scale them to float32 in [-1.0, 1.0)
+            audio_data = np.frombuffer(audio.get_raw_data(), dtype=np.int16).astype(np.float32) / 32768.0
+
+            # Transcribe the audio with MLX Whisper using the mlx-community/whisper-large-v3-turbo model
+            result = mlx_whisper.transcribe(audio_data, path_or_hf_repo="mlx-community/whisper-large-v3-turbo")["text"]
+
+            # Print the transcribed text
+            print(result)
+
+except KeyboardInterrupt:
+    print("Stopped listening.")
+