From 853e1558b1ba532c73998d5dd5836e70eb0ec5c8 Mon Sep 17 00:00:00 2001 From: Xin Wang Date: Wed, 17 Dec 2025 22:40:11 +0800 Subject: [PATCH] Fix realtime mode requiring one push-to-talk press before it works --- agents/my_basic_agent_1_2_9.py | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/agents/my_basic_agent_1_2_9.py b/agents/my_basic_agent_1_2_9.py index caaeca9..e6a9a58 100644 --- a/agents/my_basic_agent_1_2_9.py +++ b/agents/my_basic_agent_1_2_9.py @@ -1192,6 +1192,8 @@ async def entrypoint(ctx: JobContext, avatar_dispatcher_url: str = None, vision_ session.input.set_audio_enabled(False) logger.info("Setting audio enabled to False (PTT mode)") else: + # When switching to realtime mode, clear user turn state to ensure proper initialization + session.clear_user_turn() session.input.set_audio_enabled(True) logger.info("Setting audio enabled to True (realtime mode)") @@ -1204,6 +1206,8 @@ async def entrypoint(ctx: JobContext, avatar_dispatcher_url: str = None, vision_ if _talking_mode == "push_to_talk": session.input.set_audio_enabled(False) else: + # When switching to realtime mode, clear user turn state + session.clear_user_turn() session.input.set_audio_enabled(True) return json.dumps({"success": True, "mode": _talking_mode})