aider/tests/basic/test_voice.py

import os
import queue
from unittest.mock import Mock, patch

import numpy as np
import pytest

from aider.voice import SoundDeviceError, Voice


@pytest.fixture
def mock_sounddevice():
    with patch("sounddevice.query_devices") as mock_query:
        mock_query.return_value = [
            {"name": "test_device", "max_input_channels": 2},
            {"name": "another_device", "max_input_channels": 1},
        ]
        yield mock_query


@pytest.fixture
def mock_soundfile():
    with patch("soundfile.SoundFile") as mock_sf:
        yield mock_sf


def test_voice_init_default_device(mock_sounddevice):
    voice = Voice()
    assert voice.device_id is None
    assert voice.audio_format == "wav"


def test_voice_init_specific_device(mock_sounddevice):
    voice = Voice(device_name="test_device")
    assert voice.device_id == 0


def test_voice_init_invalid_device(mock_sounddevice):
    with pytest.raises(ValueError) as exc:
        Voice(device_name="nonexistent_device")
    assert "Device" in str(exc.value)
    assert "not found" in str(exc.value)


def test_voice_init_invalid_format():
    with pytest.raises(ValueError) as exc:
        Voice(audio_format="invalid")
    assert "Unsupported audio format" in str(exc.value)


def test_callback_processing():
    voice = Voice()
    voice.q = queue.Queue()

    # Test with silence (low amplitude)
    test_data = np.zeros((1000, 1))
    voice.callback(test_data, None, None, None)
    assert voice.pct == 0.5  # When range is too small (<=0.001), pct is set to 0.5

    # Test with loud signal (high amplitude)
    test_data = np.ones((1000, 1))
    voice.callback(test_data, None, None, None)
    assert voice.pct > 0.9

    # Verify data is queued
    assert not voice.q.empty()


@patch("aider.voice.litellm")
def test_record_and_transcribe(mock_litellm, mock_soundfile):
    voice = Voice()

    # Mock the recording process
    with patch("sounddevice.InputStream") as mock_stream:
        # Set up the mock stream to simulate some audio data
        mock_data = np.zeros((1000, 1))
        mock_stream.return_value.__enter__.return_value = mock_data

        # Mock prompt_toolkit's prompt function more completely
        with patch("prompt_toolkit.shortcuts.prompt") as mock_prompt:
            mock_prompt.return_value = ""  # Simulate pressing Enter

            # Mock the transcription response
            mock_litellm.transcription.return_value = Mock(text="Hello, world!")

            result = voice.record_and_transcribe()

            assert result == "Hello, world!"
            mock_litellm.transcription.assert_called_once()


def test_get_prompt():
    voice = Voice()
    voice.start_time = voice.start_time = os.times().elapsed
    voice.pct = 0.5  # 50% volume level

    prompt = voice.get_prompt()
    assert "Recording" in prompt
    assert "sec" in prompt
    assert "█" in prompt  # Should contain some filled blocks
    assert "░" in prompt  # Should contain some empty blocks


@patch("sounddevice.InputStream")
def test_record_and_transcribe_keyboard_interrupt(mock_stream):
    voice = Voice()
    mock_stream.side_effect = KeyboardInterrupt()

    result = voice.record_and_transcribe()
    assert result is None


@patch("sounddevice.InputStream")
def test_record_and_transcribe_device_error(mock_stream):
    voice = Voice()
    mock_stream.side_effect = SoundDeviceError("Test error")

    result = voice.record_and_transcribe()
    assert result is None