Add thinking settings to GeminiMultimodalLiveLLMService

2025-10-07 09:56:55 -04:00
parent 566af6b0b8
commit 48e92a22fe
1 changed files with 13 additions and 0 deletions
--- a/src/pipecat/services/gemini_multimodal_live/gemini.py
+++ b/src/pipecat/services/gemini_multimodal_live/gemini.py
@@ -99,6 +99,7 @@ try:
        SlidingWindow,
        SpeechConfig,
        StartSensitivity,
+        ThinkingConfig,
        VoiceConfig,
    )
 except ModuleNotFoundError as e:
@@ -454,6 +455,9 @@ class ContextWindowCompressionParams(BaseModel):
    )  # None = use default (80% of context window)


+ThinkingParams = ThinkingConfig
+
+
 class InputParams(BaseModel):
    """Input parameters for Gemini Multimodal Live generation.

@@ -469,6 +473,9 @@ class InputParams(BaseModel):
        media_resolution: Media resolution setting. Defaults to UNSPECIFIED.
        vad: Voice activity detection parameters. Defaults to None.
        context_window_compression: Context compression settings. Defaults to None.
+        thinking: Thinking settings. Defaults to None.
+            Note that these settings aren't accepted by all models, including
+            the current default one.
        extra: Additional parameters. Defaults to empty dict.
    """

@@ -487,6 +494,7 @@ class InputParams(BaseModel):
    )
    vad: Optional[GeminiVADParams] = Field(default=None)
    context_window_compression: Optional[ContextWindowCompressionParams] = Field(default=None)
+    thinking: Optional[ThinkingParams] = Field(default=None)
    extra: Optional[Dict[str, Any]] = Field(default_factory=dict)


@@ -613,6 +621,7 @@ class GeminiMultimodalLiveLLMService(LLMService):
            "context_window_compression": params.context_window_compression.model_dump()
            if params.context_window_compression
            else {},
+            "thinking": params.thinking or {},
            "extra": params.extra if isinstance(params.extra, dict) else {},
        }

@@ -875,6 +884,10 @@ class GeminiMultimodalLiveLLMService(LLMService):

                config.context_window_compression = compression_config

+            # Add thinking configuration to configuration, if provided
+            if self._settings.get("thinking"):
+                config.thinking_config = self._settings["thinking"]
+
            # Add VAD configuration to configuration, if provided
            if self._settings.get("vad"):
                vad_config = AutomaticActivityDetection()