mirror of
https://github.com/chidiwilliams/buzz.git
synced 2024-06-29 13:10:26 +02:00
88 lines
3.7 KiB
Python
88 lines
3.7 KiB
Python
import os
|
|
import time
|
|
from threading import Thread
|
|
from typing import Callable, Any
|
|
from unittest.mock import MagicMock
|
|
|
|
import numpy as np
|
|
import sounddevice
|
|
import whisper
|
|
|
|
# Canned device table used by the tests in place of a real audio device query
# (presumably the return value of ``sounddevice.query_devices()`` -- confirm
# against the tests that patch it). Each entry carries the same ten keys.
# Entries 4 and 6 have ``max_input_channels == 0``, i.e. they are output-only.
mock_query_devices = [
    {
        'name': 'Background Music', 'index': 0, 'hostapi': 0,
        'max_input_channels': 2, 'max_output_channels': 2,
        'default_low_input_latency': 0.01,
        'default_low_output_latency': 0.008,
        'default_high_input_latency': 0.1,
        'default_high_output_latency': 0.064,
        'default_samplerate': 8000.0,
    },
    {
        'name': 'Background Music (UI Sounds)', 'index': 1, 'hostapi': 0,
        'max_input_channels': 2, 'max_output_channels': 2,
        'default_low_input_latency': 0.01,
        'default_low_output_latency': 0.008,
        'default_high_input_latency': 0.1,
        'default_high_output_latency': 0.064,
        'default_samplerate': 8000.0,
    },
    {
        'name': 'BlackHole 2ch', 'index': 2, 'hostapi': 0,
        'max_input_channels': 2, 'max_output_channels': 2,
        'default_low_input_latency': 0.01,
        'default_low_output_latency': 0.0013333333333333333,
        'default_high_input_latency': 0.1,
        'default_high_output_latency': 0.010666666666666666,
        'default_samplerate': 48000.0,
    },
    {
        'name': 'MacBook Pro Microphone', 'index': 3, 'hostapi': 0,
        'max_input_channels': 1, 'max_output_channels': 0,
        'default_low_input_latency': 0.034520833333333334,
        'default_low_output_latency': 0.01,
        'default_high_input_latency': 0.043854166666666666,
        'default_high_output_latency': 0.1,
        'default_samplerate': 48000.0,
    },
    {
        'name': 'MacBook Pro Speakers', 'index': 4, 'hostapi': 0,
        'max_input_channels': 0, 'max_output_channels': 2,
        'default_low_input_latency': 0.01,
        'default_low_output_latency': 0.0070416666666666666,
        'default_high_input_latency': 0.1,
        'default_high_output_latency': 0.016375,
        'default_samplerate': 48000.0,
    },
    {
        'name': 'Null Audio Device', 'index': 5, 'hostapi': 0,
        'max_input_channels': 2, 'max_output_channels': 2,
        'default_low_input_latency': 0.01,
        'default_low_output_latency': 0.0014512471655328798,
        'default_high_input_latency': 0.1,
        'default_high_output_latency': 0.011609977324263039,
        'default_samplerate': 44100.0,
    },
    {
        'name': 'Multi-Output Device', 'index': 6, 'hostapi': 0,
        'max_input_channels': 0, 'max_output_channels': 2,
        'default_low_input_latency': 0.01,
        'default_low_output_latency': 0.0033333333333333335,
        'default_high_input_latency': 0.1,
        'default_high_output_latency': 0.012666666666666666,
        'default_samplerate': 48000.0,
    },
]
|
|
|
|
|
|
class MockInputStream(MagicMock):
    """Stand-in for ``sounddevice.InputStream`` that replays a recorded file.

    Instead of reading from an audio device, a background thread loads
    ``../testdata/whisper-french.mp3`` (relative to this module) and hands it
    to ``callback`` in one-second chunks, wrapping around to the start when
    fewer than one full chunk remains.
    """

    # True while the feeder thread should keep delivering chunks.
    running = False
    thread: Thread

    def __init__(self, callback: Callable[[np.ndarray, int, Any, sounddevice.CallbackFlags], None], *args, **kwargs):
        """Create the mock stream.

        Args:
            callback: Invoked from the feeder thread as
                ``callback(chunk, 0, None, sounddevice.CallbackFlags())``.
            *args: Accepted for signature compatibility and ignored.
            **kwargs: Accepted for signature compatibility and ignored.
        """
        super().__init__(spec=sounddevice.InputStream)
        self.thread = Thread(target=self.target)
        self.callback = callback

    def start(self):
        """Start the feeder thread."""
        # Raise the flag *before* launching the thread. If the thread set it
        # itself (after the slow audio load), a stop() issued in the meantime
        # would be overwritten and join() would block forever.
        self.running = True
        self.thread.start()

    def target(self):
        """Feeder-thread body: load the fixture and emit chunks until stopped.

        The loop is gated on ``self.running``, which ``start()`` sets and
        ``stop()`` clears.
        """
        sample_rate = whisper.audio.SAMPLE_RATE
        file_path = os.path.join(os.path.dirname(__file__), '../testdata/whisper-french.mp3')
        audio = whisper.load_audio(file_path, sr=sample_rate)

        chunk_duration_secs = 1
        num_samples_in_chunk = chunk_duration_secs * sample_rate
        seek = 0

        while self.running:
            # Pace delivery at one chunk per chunk-duration of wall time.
            time.sleep(chunk_duration_secs)
            chunk = audio[seek:seek + num_samples_in_chunk]
            self.callback(chunk, 0, None, sounddevice.CallbackFlags())
            seek += num_samples_in_chunk

            # loop back around
            if seek + num_samples_in_chunk > audio.size:
                seek = 0

    def stop(self):
        """Ask the feeder thread to finish and wait for it to exit.

        Safe to call on a stream that was never started or has already been
        stopped; in that case there is nothing to join.
        """
        self.running = False
        # Thread.join() raises RuntimeError on a thread that was never started.
        if self.thread.is_alive():
            self.thread.join()

    def close(self):
        """No-op: the mock holds no device resources."""
        pass

    def __enter__(self):
        """Start the stream and return it, so ``with ... as stream`` works."""
        self.start()
        return self

    def __exit__(self, exc_type, exc_val, exc_tb):
        """Stop and close the stream when leaving the ``with`` block."""
        self.stop()
        self.close()
|