Update the default.yaml speech agent configuration: raise min_speech_duration_ms from 100 to 120 ms and eou_threshold_ms from 800 to 1300 ms. Also adjust the audio model parameters for improved audio processing: lower start_min_speech_ms from 160 to 100 ms, raise pre_speech_ms from 240 to 360 ms, and raise final_tail_ms from 120 to 180 ms.
This commit is contained in:
@@ -7,8 +7,8 @@ agent:
|
||||
type: silero
|
||||
model_path: data/vad/silero_vad.onnx
|
||||
threshold: 0.5
|
||||
min_speech_duration_ms: 100
|
||||
eou_threshold_ms: 800
|
||||
min_speech_duration_ms: 120
|
||||
eou_threshold_ms: 1300
|
||||
|
||||
llm:
|
||||
# provider: openai | openai_compatible | siliconflow
|
||||
@@ -45,9 +45,9 @@ agent:
|
||||
model: FunAudioLLM/SenseVoiceSmall
|
||||
interim_interval_ms: 500
|
||||
min_audio_ms: 300
|
||||
start_min_speech_ms: 160
|
||||
pre_speech_ms: 240
|
||||
final_tail_ms: 120
|
||||
start_min_speech_ms: 100
|
||||
pre_speech_ms: 360
|
||||
final_tail_ms: 180
|
||||
|
||||
duplex:
|
||||
enabled: true
|
||||
|
||||
Reference in New Issue
Block a user