From 6664c492ac6019631b15c1fb8724bf577fc42719 Mon Sep 17 00:00:00 2001
From: Mert Sefa AKGUN
Date: Thu, 9 Jan 2025 15:38:33 +0300
Subject: [PATCH] feat(gemini): enable audio transcription in live text example

Add options to transcribe both user and model audio during the
GeminiMultimodalLiveLLMService setup in the
26d-gemini-multimodal-live-text.py example.
---
 examples/foundational/26d-gemini-multimodal-live-text.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/examples/foundational/26d-gemini-multimodal-live-text.py b/examples/foundational/26d-gemini-multimodal-live-text.py
index deca5dbf1..f70ba4eca 100644
--- a/examples/foundational/26d-gemini-multimodal-live-text.py
+++ b/examples/foundational/26d-gemini-multimodal-live-text.py
@@ -56,6 +56,8 @@ async def main():
         llm = GeminiMultimodalLiveLLMService(
             api_key=os.getenv("GOOGLE_API_KEY"),
             # system_instruction="Talk like a pirate."
+            transcribe_user_audio=True,
+            transcribe_model_audio=True,
         )
         llm.set_model_modalities(
             GeminiMultimodalModalities.TEXT