buzz/tests/mock_sounddevice.py

import os
import time
from threading import Thread
from typing import Callable, Any
from unittest.mock import MagicMock

import numpy as np
import sounddevice
import whisper

mock_query_devices = [
    {'name': 'Background Music', 'index': 0, 'hostapi': 0, 'max_input_channels': 2, 'max_output_channels': 2,
     'default_low_input_latency': 0.01,
     'default_low_output_latency': 0.008, 'default_high_input_latency': 0.1, 'default_high_output_latency': 0.064,
     'default_samplerate': 8000.0},
    {'name': 'Background Music (UI Sounds)', 'index': 1, 'hostapi': 0, 'max_input_channels': 2,
     'max_output_channels': 2, 'default_low_input_latency': 0.01,
     'default_low_output_latency': 0.008, 'default_high_input_latency': 0.1, 'default_high_output_latency': 0.064,
     'default_samplerate': 8000.0},
    {'name': 'BlackHole 2ch', 'index': 2, 'hostapi': 0, 'max_input_channels': 2, 'max_output_channels': 2,
     'default_low_input_latency': 0.01,
     'default_low_output_latency': 0.0013333333333333333, 'default_high_input_latency': 0.1,
     'default_high_output_latency': 0.010666666666666666, 'default_samplerate': 48000.0},
    {'name': 'MacBook Pro Microphone', 'index': 3, 'hostapi': 0, 'max_input_channels': 1, 'max_output_channels': 0,
     'default_low_input_latency': 0.034520833333333334,
     'default_low_output_latency': 0.01, 'default_high_input_latency': 0.043854166666666666,
     'default_high_output_latency': 0.1, 'default_samplerate': 48000.0},
    {'name': 'MacBook Pro Speakers', 'index': 4, 'hostapi': 0, 'max_input_channels': 0, 'max_output_channels': 2,
     'default_low_input_latency': 0.01,
     'default_low_output_latency': 0.0070416666666666666, 'default_high_input_latency': 0.1,
     'default_high_output_latency': 0.016375, 'default_samplerate': 48000.0},
    {'name': 'Null Audio Device', 'index': 5, 'hostapi': 0, 'max_input_channels': 2, 'max_output_channels': 2,
     'default_low_input_latency': 0.01,
     'default_low_output_latency': 0.0014512471655328798, 'default_high_input_latency': 0.1,
     'default_high_output_latency': 0.011609977324263039, 'default_samplerate': 44100.0},
    {'name': 'Multi-Output Device', 'index': 6, 'hostapi': 0, 'max_input_channels': 0, 'max_output_channels': 2,
     'default_low_input_latency': 0.01,
     'default_low_output_latency': 0.0033333333333333335, 'default_high_input_latency': 0.1,
     'default_high_output_latency': 0.012666666666666666, 'default_samplerate': 48000.0},
]


class MockInputStream(MagicMock):
    running = False
    thread: Thread

    def __init__(self, callback: Callable[[np.ndarray, int, Any, sounddevice.CallbackFlags], None], *args, **kwargs):
        super().__init__(spec=sounddevice.InputStream)
        self.thread = Thread(target=self.target)
        self.callback = callback

    def start(self):
        self.thread.start()

    def target(self):
        sample_rate = whisper.audio.SAMPLE_RATE
        file_path = os.path.join(os.path.dirname(__file__), '../testdata/whisper-french.mp3')
        audio = whisper.load_audio(file_path, sr=sample_rate)

        chunk_duration_secs = 1

        self.running = True
        seek = 0
        num_samples_in_chunk = chunk_duration_secs * sample_rate

        while self.running:
            time.sleep(chunk_duration_secs)
            chunk = audio[seek:seek + num_samples_in_chunk]
            self.callback(chunk, 0, None, sounddevice.CallbackFlags())
            seek += num_samples_in_chunk

            # loop back around
            if seek + num_samples_in_chunk > audio.size:
                seek = 0

    def stop(self):
        self.running = False
        self.thread.join()

    def close(self):
        pass

    def __enter__(self):
        self.start()

    def __exit__(self, exc_type, exc_val, exc_tb):
        self.stop()