diff --git a/packages/services/voice-agent/src/agent.py b/packages/services/voice-agent/src/agent.py index b77d0dd..b0b98a1 100644 --- a/packages/services/voice-agent/src/agent.py +++ b/packages/services/voice-agent/src/agent.py @@ -203,6 +203,14 @@ async def entrypoint(ctx: JobContext) -> None: language=settings.whisper_language, client=_oai_client, use_realtime=True, + # Increase silence_duration_ms so Chinese speech isn't chopped + # into tiny fragments (default 350ms is too aggressive). + turn_detection={ + "type": "server_vad", + "threshold": 0.6, + "prefix_padding_ms": 600, + "silence_duration_ms": 800, + }, ) else: stt = LocalWhisperSTT(