diff --git a/changelog/3228.changed.md b/changelog/3228.changed.md new file mode 100644 index 000000000..5444eef28 --- /dev/null +++ b/changelog/3228.changed.md @@ -0,0 +1,4 @@ +- Updated default models for: + + - `GeminiLiveLLMService` to `gemini-2.5-flash-native-audio-preview-12-2025`. + - `GeminiLiveVertexLLMService` to `gemini-live-2.5-flash-native-audio`. diff --git a/src/pipecat/services/google/gemini_live/llm.py b/src/pipecat/services/google/gemini_live/llm.py index ec608c311..129d9d224 100644 --- a/src/pipecat/services/google/gemini_live/llm.py +++ b/src/pipecat/services/google/gemini_live/llm.py @@ -563,18 +563,18 @@ class InputParams(BaseModel): context_window_compression: Context compression settings. Defaults to None. thinking: Thinking settings. Defaults to None. Note that these settings may require specifying a model that - supports them, e.g. "gemini-2.5-flash-native-audio-preview-09-2025". + supports them, e.g. "gemini-2.5-flash-native-audio-preview-12-2025". enable_affective_dialog: Enable affective dialog, which allows Gemini to adapt to expression and tone. Defaults to None. Note that these settings may require specifying a model that - supports them, e.g. "gemini-2.5-flash-native-audio-preview-09-2025". + supports them, e.g. "gemini-2.5-flash-native-audio-preview-12-2025". Also note that this setting may require specifying an API version that supports it, e.g. HttpOptions(api_version="v1alpha"). proactivity: Proactivity settings, which allows Gemini to proactively decide how to behave, such as whether to avoid responding to content that is not relevant. Defaults to None. Note that these settings may require specifying a model that - supports them, e.g. "gemini-2.5-flash-native-audio-preview-09-2025". + supports them, e.g. "gemini-2.5-flash-native-audio-preview-12-2025". Also note that this setting may require specifying an API version that supports it, e.g. HttpOptions(api_version="v1alpha"). extra: Additional parameters. Defaults to empty dict. @@ -615,7 +615,7 @@ class GeminiLiveLLMService(LLMService): *, api_key: str, base_url: Optional[str] = None, - model="models/gemini-2.0-flash-live-001", + model="models/gemini-2.5-flash-native-audio-preview-12-2025", voice_id: str = "Charon", start_audio_paused: bool = False, start_video_paused: bool = False, @@ -638,7 +638,7 @@ class GeminiLiveLLMService(LLMService): Please use `http_options` to customize requests made by the API client. - model: Model identifier to use. Defaults to "models/gemini-2.0-flash-live-001". + model: Model identifier to use. Defaults to "models/gemini-2.5-flash-native-audio-preview-12-2025". voice_id: TTS voice identifier. Defaults to "Charon". start_audio_paused: Whether to start with audio input paused. Defaults to False. start_video_paused: Whether to start with video input paused. Defaults to False.