MyTTSClient/src/commands/audio.py

import sounddevice as sd
import numpy as np
import os
from typing import Optional, List

from ..devices import get_audio_devices_windows, install_audio_cmdlets, get_audio_devices_windows_from_pnp_devices, \
  get_audio_devices_linux
from ..core.utils import *
from ..config import AppConfig


def _detect_wsl() -> bool:
  """Detect if running under Windows Subsystem for Linux."""
  try:
    # Method 1: Check /proc/version for Microsoft
    if os.path.exists('/proc/version'):
      with open('/proc/version', 'r') as f:
        version_info = f.read().lower()
        if 'microsoft' in version_info or 'wsl' in version_info:
          return True

    # Method 2: Check WSL environment variables
    if os.getenv('WSL_DISTRO_NAME') or os.getenv('WSLENV'):
      return True

    # Method 3: Check if powershell.exe is available
    try:
      subprocess.run(['powershell.exe', '-Command', 'echo test'],
                     capture_output=True, timeout=2, check=True)
      return True
    except (subprocess.SubprocessError, FileNotFoundError):
      pass

    return False
  except Exception:
    return False


def _get_device_type(instance_id: str) -> str:
  """Categorize device type based on InstanceId."""
  instance_lower = instance_id.lower()
  if '0.0.1.00000000' in instance_lower:
    return "Recording"
  elif '0.0.0.00000000' in instance_lower:
    return "Playback"
  else:
    return "Unknown"


def _get_short_device_id(instance_id: str) -> str:
  """Get device name based on InstanceId."""
  if len(instance_id) == 68:
    return instance_id[31:-1]
  elif len(instance_id) == 55:
    return instance_id[18:-1]
  else:
    return instance_id


def _get_colored_bool(status: bool) -> str:
  """Get colored status string based on status."""
  if status:
    return f"[green]{status}[/green]"
  else:
    return str(status)


def _get_colored_status(status: str) -> str:
  """Get colored status string based on status."""
  if status == "Unknown":
    return f"[red]{status}[/red]"
  else:
    return str(status)


def list_devices(
    device: Optional[int] = typer.Argument(default=None, help="Show details of a device, by its Id"),
    pulse: bool = typer.Option(False, "--pulse", help="Show PulseAudio sources"),
    native: bool = typer.Option(False, "--native", help="Force native Linux view (WSL only)"),
    all_devices: bool = typer.Option(False, "--all", help="Display all devices, even those not connected"),
    sort_info: Optional[str] = typer.Option(None, "--sort", help="Sort by column"),
    desc_info: bool = typer.Option(False, "--desc", help="Set the sorting order to descending"),
    filter_info: Optional[str] = typer.Option(None, "--filter", help="Filter by a column value. Use column=value"),
    config_file: Optional[str] = typer.Option(None, "--config", "-c", help="Path to config file")
):
  """List audio devices."""

  # Load configuration for context
  config = AppConfig.load(config_file)

  # Determine title based on environment and options
  is_wsl = _detect_wsl()
  if is_wsl and not native:
    typer.echo(typer.style("WSL detected, showing Windows audio devices (use --native for WSL view)",
                           fg=typer.colors.BLUE))
    result = get_audio_devices_windows_from_pnp_devices() if all_devices else get_audio_devices_windows()
    if not check_result(result):
      return

    windows_devices = get_results(result.stdout)
    if all_devices:
      select_conf = [
          SelectConf(attr="Index", default=""),
          SelectConf(attr="InstanceId", to="ID", formatter=lambda item: _get_short_device_id(item.InstanceId)),
          SelectConf(attr="FriendlyName", to="Name"),
          SelectConf(attr="Type", formatter=lambda item: _get_device_type(item.InstanceId)),
          SelectConf(attr="Status", formatter=lambda item: _get_colored_status(item.Status)),
      ]
    else:
      select_conf = [
          SelectConf(attr="Index"),
          SelectConf(attr="ID", formatter=lambda item: _get_short_device_id(item.ID)),
          SelectConf(attr="Name"),
          SelectConf(attr="Type"),
          SelectConf(attr="Default", formatter=lambda item: _get_colored_bool(item.Default)),
      ]
    windows_devices = select(windows_devices, select_conf)

    # apply sorting and filtering
    windows_devices = filter_and_sort(windows_devices, filter_info, sort_info, desc_info)

    display_as_table(windows_devices)


  else:
    if native and not is_wsl:
      typer.echo(typer.style("Native is applicable only when WSL is detected.", fg=typer.colors.RED))
      return

    if all_devices and native:
      typer.echo(typer.style("All devices is not applicable with native mode.", fg=typer.colors.RED))
      return

    result = get_audio_devices_linux()
    if not check_result(result):
      return

    linux_devices = result.result
    # apply sorting and filtering
    linux_devices = filter_and_sort(linux_devices, filter_info, sort_info, desc_info)

    display_as_table(linux_devices)

  # Show legend
  typer.echo(f"\nLegend:")
  typer.echo(typer.style("   * = Configured device", fg=typer.colors.YELLOW))
  typer.echo(f"   IN/OUT = Input/Output channel count")


def install():
  result = install_audio_cmdlets()
  if not check_result(result):
    return

  typer.echo(result.stdout)


def display_linux_devices(devices: list,
                          config: AppConfig,
                          show_pulse: bool = False,
                          sort_conf: Optional[SortConf] = None) -> None:
  """Display Linux audio devices with existing formatting logic."""

  if not devices:
    typer.echo(typer.style("No audio devices found!", fg=typer.colors.RED))
    return

  # Display header
  typer.echo(f"\nFound {typer.style(str(len(devices)), fg=typer.colors.CYAN, bold=True)} devices:")
  typer.echo(f"{'ID':<3} {'Name':<35} {'IN':<3} {'OUT':<3} {'Rate':<8} {'Host API'}")
  typer.echo("-" * 70)

  # Display devices
  for device in devices:
    rate = int(device.default_samplerate)
    is_configured = (config.audio.device == device.device_id)
    marker = " *" if is_configured else ""

    device_line = (f"{device.device_id:<3} {device.name:<35} {device.max_input_channels:<3} "
                   f"{device.max_output_channels:<3} {rate:<8} {device.hostapi_name}{marker}")
    typer.echo(typer.style(device_line, bold=is_configured))

  # Show default devices info
  typer.echo(f"\nDefault devices:")
  try:
    default_device = sd.default.device
    default_input = int(default_device[0])
    default_output = int(default_device[1])

    input_device = next((d for d in devices if d.device_id == default_input), None)
    if input_device:
      typer.echo(f"   Input:  [{default_input}] {input_device.name}")
    output_device = next((d for d in devices if d.device_id == default_output), None)
    if output_device:
      typer.echo(f"   Output: [{default_output}] {output_device.name}")
  except Exception as e:
    typer.echo(typer.style(f"   Error getting defaults: {e}", fg=typer.colors.RED))

  # Show PulseAudio sources if requested
  if show_pulse:
    typer.echo(f"\nPulseAudio sources:")
    pulse_sources = get_pulseaudio_sources()
    if pulse_sources:
      for source in pulse_sources:
        typer.echo(f"   {source['id']:2}: {source['name']}")
    else:
      typer.echo(typer.style("   Could not retrieve PulseAudio sources", fg=typer.colors.RED))


# Legacy function for backwards compatibility
# def get_audio_devices():
#   """Get comprehensive information about audio devices."""
#   try:
#     devices = sd.query_devices()
#     return devices
#   except Exception as e:
#     typer.echo(typer.style(f"Error querying audio devices: {e}", fg=typer.colors.RED, bold=True))
#     raise typer.Exit(1)


def get_pulseaudio_sources():
  """Get PulseAudio sources for comparison."""
  try:
    result = subprocess.run(['pactl', 'list', 'sources', 'short'],
                            capture_output=True, text=True, timeout=5)
    if result.returncode == 0:
      sources = []
      for line in result.stdout.strip().split('\n'):
        if line.strip():
          parts = line.split('\t')
          if len(parts) >= 2:
            sources.append({'id': parts[0], 'name': parts[1]})
      return sources
    else:
      return None
  except Exception:
    return None


def test_device(
    device: Optional[int] = typer.Option(None, "--device", "-d", help="Device ID to test (default: configured device)"),
    duration: float = typer.Option(3.0, "--duration", help="Recording duration in seconds"),
    save: bool = typer.Option(False, "--save", help="Save recording to WAV file"),
    play: bool = typer.Option(False, "--play", help="Play recorded audio through default speakers"),
    config_file: Optional[str] = typer.Option(None, "--config", "-c", help="Path to config file")
):
  """Test audio recording from a specific device."""

  # Load configuration
  config = AppConfig.load(config_file)

  # Determine device to use
  test_device_id = device if device is not None else config.audio.device

  typer.echo(typer.style("Audio Device Test", fg=typer.colors.BLUE, bold=True))
  typer.echo("=" * 20)

  # Get device info
  result = get_audio_devices_linux()
  if not check_result(result):
    return

  devices_list = result.result

  if test_device_id is not None:
    if test_device_id >= len(devices_list):
      typer.echo(typer.style(f"Error: Device {test_device_id} not found!", fg=typer.colors.RED))
      raise typer.Exit(1)

    device_info = devices_list[test_device_id]
    if device_info['max_input_channels'] == 0:
      typer.echo(typer.style(f"Error: Device {test_device_id} has no input channels!", fg=typer.colors.RED))
      raise typer.Exit(1)

    typer.echo(f"Testing device [{test_device_id}]: {device_info['name']}")
  else:
    typer.echo("Testing default input device")

  typer.echo(f"Recording for {duration} seconds...")
  typer.echo("Starting in 3... 2... 1...")

  try:
    # Record audio
    typer.echo(typer.style("Recording...", fg=typer.colors.GREEN, bold=True))

    audio_data = sd.rec(
      int(duration * config.audio.sample_rate),
      samplerate=config.audio.sample_rate,
      channels=config.audio.channels,
      device=test_device_id,
      dtype='float32'
    )
    sd.wait()

    # Analyze the recording
    audio_int16 = (audio_data.flatten() * 32767).astype(np.int16)
    max_amplitude = np.max(np.abs(audio_int16))
    rms_level = np.sqrt(np.mean(audio_int16.astype(np.float32) ** 2))

    typer.echo(typer.style("Recording completed!", fg=typer.colors.GREEN))
    typer.echo(f"\nAnalysis:")
    typer.echo(f"   Duration: {duration:.1f}s")
    typer.echo(f"   Samples: {len(audio_int16)}")
    typer.echo(f"   Max amplitude: {max_amplitude} / 32767 ({max_amplitude / 32767 * 100:.1f}%)")
    typer.echo(f"   RMS level: {rms_level:.1f}")

    # Signal quality assessment
    if max_amplitude < 100:
      typer.echo(typer.style("   Status: Very low signal - check microphone", fg=typer.colors.RED))
    elif max_amplitude < 1000:
      typer.echo(typer.style("   Status: Low signal - may need to speak louder", fg=typer.colors.YELLOW))
    elif max_amplitude > 30000:
      typer.echo(typer.style("   Status: Very high signal - may be clipping", fg=typer.colors.YELLOW))
    else:
      typer.echo(typer.style("   Status: Good signal level", fg=typer.colors.GREEN))

    # Play recorded audio if requested
    if play:
      typer.echo(f"\n{typer.style('Playing recorded audio...', fg=typer.colors.CYAN, bold=True)}")
      sd.play(audio_data, samplerate=config.audio.sample_rate)
      sd.wait()
      typer.echo(typer.style("Playback completed!", fg=typer.colors.CYAN))

    # Save if requested
    if save:
      filename = f"test_device_{test_device_id or 'default'}_{int(duration)}s.wav"
      from scipy.io import wavfile
      wavfile.write(filename, config.audio.sample_rate, audio_int16)
      typer.echo(typer.style(f"Audio saved to: {filename}", fg=typer.colors.MAGENTA, bold=True))

  except Exception as e:
    typer.echo(typer.style(f"Recording failed: {e}", fg=typer.colors.RED, bold=True))
    raise typer.Exit(1)