{
  "timestamp": 1780745173,
  "stt_text": "Mars 正在測試 M4A 最小文字橋接，請回覆一句短句。",
  "llm_model": "gpt-4o-mini",
  "llm_text": "",
  "tts_candidates": [
    "/opt/ai-avatar-demo/data/tts_outputs/gate602_m2_mandy_clone_validation.wav",
    "/opt/ai-avatar-demo/data/tts_outputs/yuka_intro_mandy_clone_gate7m_a_r3.wav",
    "/opt/ai-avatar-demo/services/livekit-agent/.venv/lib/python3.12/site-packages/livekit/agents/inference/tts.py",
    "/opt/ai-avatar-demo/services/livekit-agent/.venv/lib/python3.12/site-packages/livekit/agents/tts/tts.py",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/modelscope/preprocessors/tts.py",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/modelscope/tools/speech_tts_autolabel.py",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/modelscope/trainers/audio/tts_trainer.py",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/modelscope/utils/audio/tts_exceptions.py",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-1234Hz-le-1ch-10S-20bit-extra.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-2ch-32bit-float-be.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-2ch-32bit-float-le.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-be-1ch-4bytes.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes-early-eof-no-data.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes-early-eof.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes-incomplete-chunk.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes-rf64.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-48000Hz-2ch-64bit-float-le-wavex.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-be-3ch-5S-24bit.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-1ch-1byte-ulaw.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-2ch-1byteu.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-24bit-inconsistent.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-24bit-rf64.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-24bit.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-36bit.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-45bit.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-53bit.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-64bit.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-4ch-9S-12bit.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-5ch-9S-5bit.wav",
    "/opt/ai-avatar-demo/services/sglang/.venv/lib/python3.12/site-packages/torchaudio/datasets/libritts.py",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-1234Hz-le-1ch-10S-20bit-extra.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-2ch-32bit-float-be.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-2ch-32bit-float-le.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-be-1ch-4bytes.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes-early-eof-no-data.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes-early-eof.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes-incomplete-chunk.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes-rf64.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-48000Hz-2ch-64bit-float-le-wavex.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-be-3ch-5S-24bit.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-1ch-1byte-ulaw.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-2ch-1byteu.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-24bit-inconsistent.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-24bit-rf64.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-24bit.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-36bit.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-45bit.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-53bit.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-3ch-5S-64bit.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-4ch-9S-12bit.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-le-5ch-9S-5bit.wav",
    "/opt/ai-avatar-demo/services/stt/.venv/lib/python3.12/site-packages/torchaudio/datasets/libritts.py",
    "/opt/ai-avatar-demo/services/torch-smoke/.venv/lib/python3.12/site-packages/torchaudio/datasets/libritts.py",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/gradio/media_assets/audio/audio_sample.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/gradio/media_assets/audio/cantina.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/gradio/media_assets/audio/recording1.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/gradio/media_assets/audio/sax.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/gradio/test_data/test_audio.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/qwen_tts/core/models/configuration_qwen3_tts.py",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/qwen_tts/core/models/modeling_qwen3_tts.py",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/qwen_tts/core/models/processing_qwen3_tts.py",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/qwen_tts/core/tokenizer_12hz/configuration_qwen3_tts_tokenizer_v2.py",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/qwen_tts/core/tokenizer_12hz/modeling_qwen3_tts_tokenizer_v2.py",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/qwen_tts/core/tokenizer_25hz/configuration_qwen3_tts_tokenizer_v1.py",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/qwen_tts/core/tokenizer_25hz/modeling_qwen3_tts_tokenizer_v1.py",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/qwen_tts/inference/qwen3_tts_model.py",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/qwen_tts/inference/qwen3_tts_tokenizer.py",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-1234Hz-le-1ch-10S-20bit-extra.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-2ch-32bit-float-be.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-2ch-32bit-float-le.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-be-1ch-4bytes.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes-early-eof-no-data.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes-early-eof.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes-incomplete-chunk.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes-rf64.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-44100Hz-le-1ch-4bytes.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-48000Hz-2ch-64bit-float-le-wavex.wav",
    "/opt/ai-avatar-demo/services/tts/.venv/lib/python3.12/site-packages/scipy/io/tests/data/test-8000Hz-be-3ch-5S-24bit.wav"
  ],
  "recommended_tts_callable_if_identified": "/opt/ai-avatar-demo/work/gate7m_a_qwen3_tts_customvoice_smoke.py",
  "tts_audio_path": null,
  "tts_status": "TTS_CALLABLE_IDENTIFIED_BUT_NOT_INVOKED_IN_M4A_MINIMAL_SKELETON",
  "livekit_status": "LIVEKIT_BINDING_PENDING; no active LiveKit server port found in recon"
}