# Agent behavior configuration (safe to edit per profile) # This file only controls agent-side behavior (VAD/LLM/TTS/ASR providers). # Infra/server/network settings should stay in .env. agent: vad: type: silero model_path: data/vad/silero_vad.onnx threshold: 0.5 min_speech_duration_ms: 100 eou_threshold_ms: 800 llm: # provider: openai | openai_compatible | siliconflow provider: openai_compatible model: deepseek-v3 temperature: 0.7 # Required: no fallback. You can still reference env explicitly. api_key: sk-fc4d59b360475f53401a864db8ce0985010acc4e696723d20a90d6569f38d80a # Optional for OpenAI-compatible endpoints: api_url: https://api.qnaigc.com/v1 tts: # provider: edge | openai_compatible | siliconflow | dashscope # dashscope defaults (if omitted): provider: dashscope api_url: wss://dashscope.aliyuncs.com/api-ws/v1/realtime model: qwen3-tts-flash-realtime api_key: sk-391f5126d18345d497c6e8717c8c9ad7 mode: commit voice: Cherry speed: 1.0 # provider: openai_compatible # api_key: sk-thmzysdpqqmhqxxshyqoxvjeiflexjdgaftyufrsgrhpjnyx # api_url: https://api.siliconflow.cn/v1/audio/speech # model: FunAudioLLM/CosyVoice2-0.5B # voice: anna # speed: 1.0 asr: # provider: buffered | openai_compatible | siliconflow provider: openai_compatible api_key: sk-thmzysdpqqmhqxxshyqoxvjeiflexjdgaftyufrsgrhpjnyx api_url: https://api.siliconflow.cn/v1/audio/transcriptions model: FunAudioLLM/SenseVoiceSmall interim_interval_ms: 500 min_audio_ms: 300 start_min_speech_ms: 160 pre_speech_ms: 240 final_tail_ms: 120 duplex: enabled: true system_prompt: You are a helpful, friendly voice assistant. Keep your responses concise and conversational. barge_in: min_duration_ms: 200 silence_tolerance_ms: 60 tools: - calculator - current_time