Use microphone default sample rate (#20)

2024-06-29 21:20:00 +02:00 · 2022-10-04 20:41:23 +01:00 · 2022-10-04 20:41:23 +01:00 · 14765badc6
parent 67b280718c
commit 14765badc6
3 changed files with 22 additions and 5 deletions
--- a/2
+++ b/2
@@ -9,7 +9,7 @@ bundle_windows:
 	tar -czf dist/buzz-${version}-windows.tar.gz dist/Buzz

 test:
-	pytest --cov --cov-fail-under=73
+	pytest --cov --cov-fail-under=75

 bundle_mac:
 	make buzz
--- a/transcriber.py
+++ b/transcriber.py
@@ -3,7 +3,7 @@ import logging
 import os
 import queue
 from threading import Thread
-from typing import Callable, Optional
+from typing import Any, Callable, Optional

 import numpy as np
 import sounddevice
@@ -41,9 +41,10 @@ class Transcriber:
    def start_recording(self, block_duration=10, input_device_index: Optional[int] = None):
        logging.debug("Recording... language: \"%s\", model: \"%s\", task: \"%s\", device: \"%s\", block duration: \"%s\"" %
                      (self.language, self.model_name, self.task, input_device_index, block_duration))
+        sample_rate = self.get_device_sample_rate(device_id=input_device_index)
        self.current_stream = sounddevice.InputStream(
-            samplerate=whisper.audio.SAMPLE_RATE,
-            blocksize=block_duration * whisper.audio.SAMPLE_RATE,
+            samplerate=sample_rate,
+            blocksize=block_duration * sample_rate,
            device=input_device_index, dtype="float32",
            channels=1, callback=self.stream_callback)
        self.current_stream.start()
@@ -62,10 +63,15 @@ class Transcriber:
                result = self.model.transcribe(
                    audio=block, language=self.language, task=self.task)
                logging.debug("Received next result: \"%s\"" % result["text"])
-                self.text_callback(result["text"])
+                self.text_callback(result["text"])  # type: ignore
            except queue.Empty:
                continue

+    def get_device_sample_rate(self, device_id: Optional[int]) -> int:
+        """Return the input device's default sample rate; None selects the default input device."""
+        info: Any = sounddevice.query_devices(device=device_id, kind='input')  # kind => always a dict
+        return int(info.get('default_samplerate', whisper.audio.SAMPLE_RATE))
+
    def stream_callback(self, in_data, frame_count, time_info, status):
        # Try to enqueue the next block. If the queue is already full, drop the block.
        try:
--- a/transcriber_test.py
+++ b/transcriber_test.py
@@ -0,0 +1,11 @@
+from transcriber import Transcriber
+
+
+class TestTranscriber:
+    def test_transcriber(self):
+        """Smoke test: constructing a Transcriber with the 'tiny' model yields an object."""
+        def text_callback(text: str):
+            pass  # the callback's output is not inspected by this test
+        transcriber = Transcriber(model_name='tiny', language='en',
+                                  text_callback=text_callback, task=Transcriber.Task.TRANSCRIBE)
+        assert transcriber is not None