Working on testing the server

2025-09-08 22:59:12 +02:00
parent 2ce6d22f89
commit ddcc5f5e04
6 changed files with 190 additions and 99 deletions
--- a/requirements.txt
+++ b/requirements.txt
@@ -0,0 +1,23 @@
 cffi==1.17.1
 click==8.2.1
 comtypes==1.4.12
 iniconfig==2.1.0
 markdown-it-py==4.0.0
 mdurl==0.1.2
 numpy==2.3.2
 packaging==25.0
 pluggy==1.6.0
 psutil==7.0.0
 PyAudio==0.2.14
 pycaw==20240210
 pycparser==2.22
 Pygments==2.19.2
 pytest==8.4.1
 PyYAML==6.0.2
 rich==14.1.0
 scipy==1.16.1
 shellingham==1.5.4
 sounddevice==0.5.2
 typer==0.17.3
 typing_extensions==4.15.0
 wyoming==1.7.2
--- a/src/cli.py
+++ b/src/cli.py
@@ -9,15 +9,14 @@ audio_app = typer.Typer(help="Audio device operations")
 # Add commands to subcommands
 server_app.command("check")(server.check)
 server_app.command("test")(server.test)
 audio_app.command("list")(audio.list_devices)
 audio_app.command("test")(audio.test_device)
 audio_app.command("config")(audio.config_info)
 audio_app.command("install")(audio.install)
 # Register subcommands
 app.add_typer(server_app, name="server")
 app.add_typer(audio_app, name="audio")
 if __name__ == "__main__":
  app()
--- a/src/commands/audio.py
+++ b/src/commands/audio.py
@@ -3,7 +3,8 @@ import numpy as np
 import os
 from typing import Optional, List
-from ..devices import get_audio_devices_windows, install_audio_cmdlets, get_audio_devices_windows_from_pnp_devices
+from ..devices import get_audio_devices_windows, install_audio_cmdlets, get_audio_devices_windows_from_pnp_devices, \
  get_audio_devices_linux
 from ..core.utils import *
 from ..config import AppConfig
@@ -48,8 +49,6 @@ def _get_device_type(instance_id: str) -> str:
 def _get_short_device_id(instance_id: str) -> str:
  """Get device name based on InstanceId."""
  "SWD\MMDEVAPI\{0.0.0.00000000}.{20434736-BDB3-4CE2-A56B-5DF61D4DD593}"
  if len(instance_id) == 68:
    return instance_id[31:-1]
  elif len(instance_id) == 55:
@@ -124,8 +123,23 @@ def list_devices(
  else:
-    linux_devices = get_linux_audio_devices()
+    if native and not is_wsl:
-    display_linux_devices(linux_devices, config, pulse, sort_config)
+      typer.echo(typer.style("Native is applicable only when WSL is detected.", fg=typer.colors.RED))
      return
    if all_devices and native:
      typer.echo(typer.style("All devices is not applicable with native mode.", fg=typer.colors.RED))
      return
    result = get_audio_devices_linux()
    if not check_result(result):
      return
    linux_devices = result.result
    # apply sorting and filtering
    linux_devices = filter_and_sort(linux_devices, filter_info, sort_info, desc_info)
    display_as_table(linux_devices)
  # Show legend
  typer.echo(f"\nLegend:")
@@ -141,30 +155,6 @@ def install():
  typer.echo(result.stdout)
 def get_linux_audio_devices() -> list:
  """Get Linux audio devices using sounddevice."""
  try:
    devices = sd.query_devices()
    linux_devices = []
    for i, device in enumerate(devices):
      hostapi_name = sd.query_hostapis(device['hostapi'])['name']
      linux_devices.append(LinuxAudioDevice(
        device_id=i,
        name=device['name'],
        max_input_channels=device['max_input_channels'],
        max_output_channels=device['max_output_channels'],
        default_samplerate=device['default_samplerate'],
        hostapi_name=hostapi_name
      ))
    return linux_devices
  except Exception as e:
    typer.echo(typer.style(f"Error querying Linux audio devices: {e}", fg=typer.colors.RED, bold=True))
    raise typer.Exit(1)
 def display_linux_devices(devices: list,
                          config: AppConfig,
                          show_pulse: bool = False,
@@ -251,6 +241,7 @@ def test_device(
    device: Optional[int] = typer.Option(None, "--device", "-d", help="Device ID to test (default: configured device)"),
    duration: float = typer.Option(3.0, "--duration", help="Recording duration in seconds"),
    save: bool = typer.Option(False, "--save", help="Save recording to WAV file"),
    play: bool = typer.Option(False, "--play", help="Play recorded audio through default speakers"),
    config_file: Optional[str] = typer.Option(None, "--config", "-c", help="Path to config file")
 ):
  """Test audio recording from a specific device."""
@@ -265,7 +256,11 @@ def test_device(
  typer.echo("=" * 20)
  # Get device info
-  devices_list = get_linux_audio_devices()
+  result = get_audio_devices_linux()
  if not check_result(result):
    return
  devices_list = result.result
  if test_device_id is not None:
    if test_device_id >= len(devices_list):
@@ -319,72 +314,20 @@ def test_device(
    else:
      typer.echo(typer.style("   Status: Good signal level", fg=typer.colors.GREEN))
    # Play recorded audio if requested
    if play:
      typer.echo(f"\n{typer.style('Playing recorded audio...', fg=typer.colors.CYAN, bold=True)}")
      sd.play(audio_data, samplerate=config.audio.sample_rate)
      sd.wait()
      typer.echo(typer.style("Playback completed!", fg=typer.colors.CYAN))
    # Save if requested
    if save:
      filename = f"test_device_{test_device_id or 'default'}_{int(duration)}s.wav"
-      # Note: WyomingAudioRecorder is not defined in the current code
+      from scipy.io import wavfile
-      # This would need to be implemented or the save functionality modified
+      wavfile.write(filename, config.audio.sample_rate, audio_int16)
-      typer.echo(f"   Save functionality needs to be implemented")
+      typer.echo(typer.style(f"Audio saved to: {filename}", fg=typer.colors.MAGENTA, bold=True))
  except Exception as e:
    typer.echo(typer.style(f"Recording failed: {e}", fg=typer.colors.RED, bold=True))
    raise typer.Exit(1)
 def config_info(
    config_file: Optional[str] = typer.Option(None, "--config", "-c", help="Path to config file")
 ):
  """Show current audio configuration."""
  # Load configuration
  config = AppConfig.load(config_file)
  typer.echo(typer.style("Audio Configuration", fg=typer.colors.BLUE, bold=True))
  typer.echo("=" * 21)
  # Show current settings
  typer.echo(f"\nCurrent settings:")
  typer.echo(f"   Sample rate: {typer.style(f'{config.audio.sample_rate} Hz', fg=typer.colors.CYAN)}")
  typer.echo(f"   Channels: {typer.style(str(config.audio.channels), fg=typer.colors.CYAN)}")
  if config.audio.device is not None:
    typer.echo(f"   Device: {typer.style(str(config.audio.device), fg=typer.colors.CYAN)}")
    # Show device details
    try:
      devices_list = get_linux_audio_devices()
      if config.audio.device < len(devices_list):
        device = devices_list[config.audio.device]
        typer.echo(f"\nConfigured device details:")
        typer.echo(f"   Name: {device['name']}")
        typer.echo(f"   Input channels: {device['max_input_channels']}")
        typer.echo(f"   Default rate: {int(device['default_samplerate'])} Hz")
        if device['max_input_channels'] == 0:
          typer.echo(typer.style("   Warning: This device has no input channels!", fg=typer.colors.RED))
      else:
        typer.echo(typer.style(f"   Warning: Configured device {config.audio.device} not found!",
                               fg=typer.colors.RED, bold=True))
    except Exception as e:
      typer.echo(typer.style(f"   Error getting device info: {e}", fg=typer.colors.RED))
  else:
    typer.echo(f"   Device: {typer.style('default', fg=typer.colors.CYAN)}")
    # Show default device info
    try:
      default_device = sd.default.device
      if hasattr(default_device, '__len__') and len(default_device) >= 2:
        default_input = int(default_device[0])
      else:
        default_input = int(default_device)
      devices_list = get_linux_audio_devices()
      device = devices_list[default_input]
      typer.echo(f"\nDefault input device:")
      typer.echo(f"   ID: {default_input}")
      typer.echo(f"   Name: {device['name']}")
      typer.echo(f"   Input channels: {device['max_input_channels']}")
    except Exception as e:
      typer.echo(typer.style(f"   Error getting default device: {e}", fg=typer.colors.RED))
  # Show configuration source info
--- a/src/commands/server.py
+++ b/src/commands/server.py
@@ -4,7 +4,61 @@ from contextlib import closing
 import typer
 from typing import Optional
 from wyoming.audio import AudioStart, AudioChunk, AudioStop
 from ..config import AppConfig
 import io
 import wave
 import numpy as np
 import sounddevice as sd
 import asyncio
 from wyoming.client import AsyncTcpClient
 from wyoming.asr import Transcribe, Transcript
 async def _async_transcribe(host: str, port: int, timeout: float, pcm_bytes: bytes, lang: str) -> Optional[str]:
  """Stream raw PCM data to Wyoming ASR and return transcript text."""
  # Instantiate the async TCP client
  client = AsyncTcpClient(host, port)
  # Audio parameters
  rate = 16000
  width = 2  # 16-bit
  channels = 1
  # The client instance is an async context manager.
  async with client:
    # 1. Send transcription request
    await client.write_event(Transcribe(language=lang).event())
    # 2. Start the audio stream
    await client.write_event(AudioStart(rate, width, channels).event())
    # 3. Send audio chunks
    chunk_size = 2048  # A reasonable chunk size
    for i in range(0, len(pcm_bytes), chunk_size):
      chunk_bytes = pcm_bytes[i:i + chunk_size]
      await client.write_event(AudioChunk(audio=chunk_bytes, rate=rate, width=width, channels=channels).event())
    # 4. Stop the audio stream
    await client.write_event(AudioStop().event())
    # 5. Read events until a transcript arrives
    transcript_text = None
    try:
      while True:
        event = await asyncio.wait_for(client.read_event(), timeout=timeout)
        if event is None:
          break
        if Transcript.is_type(event):
          tr = Transcript.from_event(event)
          transcript_text = tr.text
          break
    except asyncio.TimeoutError:
      typer.echo(typer.style("Connection timed out waiting for transcript.", fg=typer.colors.YELLOW))
    return transcript_text
 def check_wyoming_server(host: str, port: int, timeout: float = 3.0) -> tuple[bool, float | None, str | None]:
@@ -58,3 +112,66 @@ def check(
    typer.echo(f"Server: {final_host}:{final_port}")
    typer.echo(typer.style(f"Error: {error}", fg=typer.colors.RED))
    raise typer.Exit(1)
 def test(
    duration: float = typer.Option(3.0, "--duration", help="Recording duration in seconds"),
    lang: str = typer.Option("fr", "--lang", help="Language code: 'fr' or 'en'"),
    host: Optional[str] = typer.Option(None, "--host", "-h", help="Wyoming server host"),
    port: Optional[int] = typer.Option(None, "--port", "-p", help="Wyoming server port"),
    timeout: Optional[float] = typer.Option(None, "--timeout", "-t", help="Connection timeout in seconds"),
    config_file: Optional[str] = typer.Option(None, "--config", "-c", help="Path to config file")
 ):
  """Record from default microphone, send to Wyoming ASR server, and print transcription."""
  # Load configuration
  config = AppConfig.load(config_file)
  final_host = host or config.server.host
  final_port = port or config.server.port
  final_timeout = timeout or config.server.timeout
  # Validate language (two-letter code)
  lang = (lang or "fr").strip().lower()
  if lang not in ("fr", "en"):
    typer.echo(typer.style("Invalid --lang. Use 'fr' or 'en'.", fg=typer.colors.RED))
    raise typer.Exit(2)
  # Check server reachability first
  reachable, latency, err = check_wyoming_server(final_host, final_port, final_timeout)
  if not reachable:
    typer.echo(typer.style(f"Cannot reach Wyoming server at {final_host}:{final_port}: {err}", fg=typer.colors.RED))
    raise typer.Exit(1)
  # Record audio (16 kHz mono float32)
  sample_rate = 16000
  channels = 1
  typer.echo(typer.style("Recording...", fg=typer.colors.GREEN, bold=True))
  try:
    frames = int(duration * sample_rate)
    audio = sd.rec(frames, samplerate=sample_rate, channels=channels, dtype="float32")
    sd.wait()
  except Exception as e:
    typer.echo(typer.style(f"Audio recording failed: {e}", fg=typer.colors.RED))
    raise typer.Exit(1)
  # Convert to PCM16 bytes directly, no need for WAV wrapper
  audio_int16 = np.clip(audio.flatten() * 32767.0, -32768, 32767).astype(np.int16)
  pcm_bytes = audio_int16.tobytes()
  # Send to Wyoming ASR (async)
  try:
    typer.echo(typer.style(f"Connecting to {final_host}:{final_port} (lang={lang})...", fg=typer.colors.CYAN))
    # Run the async helper
    transcript_text = asyncio.run(
      _async_transcribe(final_host, final_port, final_timeout, pcm_bytes, lang)
    )
    if transcript_text:
      typer.echo(typer.style("\nTranscription:", fg=typer.colors.GREEN, bold=True))
      typer.echo(transcript_text)
    else:
      typer.echo(typer.style("No transcription received.", fg=typer.colors.YELLOW))
  except Exception as e:
    typer.echo(typer.style(f"ASR request failed: {e}", fg=typer.colors.RED))
    raise typer.Exit(1)
--- a/src/core/Expando.py
+++ b/src/core/Expando.py
@@ -8,8 +8,10 @@ class Expando:
  You can then access the property using dot '.' (ex. obj.prop1.prop2)
  """
-  def __init__(self, props):
+  def __init__(self, props=None, **kwargs):
-    self._props = props
+    self._props = props.copy() if props else {}
    if kwargs:
      self._props.update(kwargs)
  def __getattr__(self, item):
    if item not in self._props:
--- a/src/core/utils.py
+++ b/src/core/utils.py
@@ -51,6 +51,13 @@ class ProcessResult:
  result: Any
  error: str = None
  @property
  def stderr(self):
    return self.error
  @property
  def returncode(self):
    return 0 if self.result is not None else 1
 def sort_by(items: list[Expando], sort_conf: SortConf):
  """Sort a list of items by a given property."""