Add sensor-controller multi-task example

A voice agent talking to a worker that owns a simulated temperature sensor. Demonstrates two ``PipelineTask`` instances side by side communicating purely via ``BusJobRequestMessage`` / ``BusJobResponseMessage`` — the worker is a plain ``PipelineTask`` (no ``LLMTask`` subclassing, not bridged) whose pipeline runs both an autonomous sensor tick loop and its own tool-calling LLM: SensorReader -> SensorStats -> user_agg -> llm -> assistant_agg The voice agent's LLM has a single tool, ``ask_controller(question)``, that forwards the user's request verbatim to the worker and speaks back the controller's reply. The worker LLM has direct tools to read the current temperature, inspect rolling stats, set the target, or change the response rate; the sensor simulation drifts toward the target with a first-order lag plus Gaussian noise. Job responses are paired with completed LLM turns via the assistant aggregator's ``on_assistant_turn_stopped`` event, skipping empty turn-stopped events that fire between a tool call and its result.
2026-05-15 09:48:03 -07:00
parent f22350ce2f
commit 410190dabb
2 changed files with 520 additions and 0 deletions
--- a/examples/multi-task/sensor-controller/sensor-controller.py
+++ b/examples/multi-task/sensor-controller/sensor-controller.py
@@ -0,0 +1,334 @@
+#
+# Copyright (c) 2026, Daily
+#
+# SPDX-License-Identifier: BSD 2-Clause License
+#
+
+"""Voice agent + sensor-controller worker, both as plain PipelineTasks.
+
+Two ``PipelineTask`` instances run side by side:
+
+- The **voice agent** is built inline in ``run_bot`` — a standard
+  transport + STT + LLM + TTS pipeline. Its LLM has a single tool,
+  ``ask_controller(question)``, which forwards the user's request to
+  the controller over the bus and speaks back the response.
+- The **sensor controller** (``build_sensor_controller``) is a
+  ``PipelineTask`` whose pipeline runs a simulated temperature sensor
+  (see ``sensor.py``) alongside its own LLM. The worker LLM has tool
+  access to read the current reading, inspect rolling stats, and
+  mutate the simulated sensor's target temperature and response rate.
+
+The worker does **not** subclass ``LLMTask`` and is **not** bridged.
+The voice agent and the controller communicate exclusively through
+``BusJobRequestMessage`` / ``BusJobResponseMessage``. The controller
+collects responses by listening to the assistant aggregator's
+``on_assistant_turn_stopped`` event and pairing each LLM completion
+with the in-flight job id.
+
+Requirements:
+
+- OPENAI_API_KEY
+- DEEPGRAM_API_KEY
+- CARTESIA_API_KEY
+- DAILY_API_KEY (for Daily transport)
+
+Example voice exchange::
+
+    User: What's the temperature?
+    Controller: 22.1°C, holding steady.
+
+    User: Make it warmer.
+    Controller: I set the target to 26°C. Give it about 20 seconds.
+
+    User: Is it stable yet?
+    Controller: It's at 25.4°C and still climbing — almost there.
+
+    User: Why is it slow?
+    Controller: The response rate is 5%. I sped it up to 20%; it'll settle faster now.
+"""
+
+import os
+
+from dotenv import load_dotenv
+from loguru import logger
+from sensor import SensorReader, SensorStats
+
+from pipecat.adapters.schemas.tools_schema import ToolsSchema
+from pipecat.audio.vad.silero import SileroVADAnalyzer
+from pipecat.bus import BusJobRequestMessage
+from pipecat.frames.frames import LLMMessagesAppendFrame, LLMRunFrame
+from pipecat.pipeline.pipeline import Pipeline
+from pipecat.pipeline.runner import PipelineRunner
+from pipecat.pipeline.task import PipelineParams, PipelineTask
+from pipecat.processors.aggregators.llm_context import LLMContext
+from pipecat.processors.aggregators.llm_response_universal import (
+    AssistantTurnStoppedMessage,
+    LLMContextAggregatorPair,
+    LLMUserAggregatorParams,
+)
+from pipecat.runner.types import RunnerArguments
+from pipecat.runner.utils import create_transport
+from pipecat.services.cartesia.tts import CartesiaTTSService
+from pipecat.services.deepgram.stt import DeepgramSTTService
+from pipecat.services.llm_service import FunctionCallParams
+from pipecat.services.openai.llm import OpenAILLMService
+from pipecat.transports.base_transport import BaseTransport, TransportParams
+from pipecat.transports.daily.transport import DailyParams
+
+load_dotenv(override=True)
+
+
+transport_params = {
+    "daily": lambda: DailyParams(
+        audio_in_enabled=True,
+        audio_out_enabled=True,
+    ),
+    "webrtc": lambda: TransportParams(
+        audio_in_enabled=True,
+        audio_out_enabled=True,
+    ),
+}
+
+
+def build_sensor_controller() -> PipelineTask:
+    """Build the controller worker as a plain :class:`PipelineTask`.
+
+    The pipeline shape is::
+
+        SensorReader -> SensorStats -> user_agg -> llm -> assistant_agg
+
+    ``SensorReader`` runs an autonomous tick loop that emits a
+    :class:`SensorReadingFrame` every second; ``SensorStats`` consumes
+    those readings and exposes rolling statistics. The LLM has four
+    direct tools that read or mutate the sensor.
+
+    Jobs arrive via the ``on_job_request`` event handler. The handler
+    stores the active ``job_id``, then queues an
+    :class:`LLMMessagesAppendFrame` with the user's question and runs
+    the LLM. When the assistant turn finishes (signalled by the
+    assistant aggregator's ``on_assistant_turn_stopped`` event), the
+    handler sends a :class:`BusJobResponseMessage` carrying the LLM's
+    answer back to the voice agent.
+    """
+    sensor = SensorReader()
+    stats = SensorStats()
+
+    async def get_current_reading(params: FunctionCallParams):
+        """Read the sensor's current temperature in degrees Celsius."""
+        await params.result_callback({"temperature": round(sensor.current, 2)})
+
+    async def get_stats(params: FunctionCallParams):
+        """Rolling minimum, maximum, average, and trend of the temperature."""
+        await params.result_callback(
+            {
+                "min": round(stats.min, 2),
+                "max": round(stats.max, 2),
+                "avg": round(stats.avg, 2),
+                "trend": stats.trend,
+            }
+        )
+
+    async def set_target_temperature(params: FunctionCallParams, target_celsius: float):
+        """Adjust the target temperature; the sensor will drift toward it.
+
+        Args:
+            target_celsius (float): The new target temperature in degrees Celsius.
+        """
+        sensor.set_target(target_celsius)
+        await params.result_callback({"ok": True, "new_target": target_celsius})
+
+    async def set_response_rate(params: FunctionCallParams, rate: float):
+        """Set how aggressively the sensor approaches the target.
+
+        Args:
+            rate (float): Response rate between 0.01 (slow) and 0.3 (fast).
+        """
+        sensor.set_response_rate(rate)
+        await params.result_callback({"ok": True, "new_rate": rate})
+
+    llm = OpenAILLMService(
+        api_key=os.environ["OPENAI_API_KEY"],
+        settings=OpenAILLMService.Settings(
+            system_instruction=(
+                "You are a temperature sensor controller. You manage a single "
+                "thermometer and answer the user's questions about it. Use the "
+                "provided tools to read the current temperature, inspect rolling "
+                "statistics, change the target temperature, or change how fast "
+                "the sensor responds. When the user asks for a vague change "
+                "('make it warmer', 'cooler'), pick a sensible target and call "
+                "set_target_temperature. Always answer in one or two short "
+                "sentences — your reply is spoken aloud."
+            ),
+        ),
+    )
+    llm.register_direct_function(get_current_reading)
+    llm.register_direct_function(get_stats)
+    llm.register_direct_function(set_target_temperature)
+    llm.register_direct_function(set_response_rate)
+
+    context = LLMContext(
+        tools=ToolsSchema(
+            standard_tools=[
+                get_current_reading,
+                get_stats,
+                set_target_temperature,
+                set_response_rate,
+            ]
+        )
+    )
+    aggregators = LLMContextAggregatorPair(context)
+
+    pipeline = Pipeline(
+        [
+            sensor,
+            stats,
+            aggregators.user(),
+            llm,
+            aggregators.assistant(),
+        ]
+    )
+
+    worker = PipelineTask(pipeline, name="controller")
+
+    # The controller handles one job at a time (the LLM pipeline can only
+    # run one turn at a time). ``state["job_id"]`` pairs the in-flight
+    # job with the next ``on_assistant_turn_stopped`` event.
+    state: dict[str, str | None] = {"job_id": None}
+
+    @worker.event_handler("on_job_request")
+    async def on_request(_task, message: BusJobRequestMessage):
+        question = message.payload["question"]
+        logger.info(f"Controller: received question '{question}'")
+        state["job_id"] = message.job_id
+        await worker.queue_frame(
+            LLMMessagesAppendFrame(
+                messages=[{"role": "user", "content": question}],
+                run_llm=True,
+            )
+        )
+
+    @aggregators.assistant().event_handler("on_assistant_turn_stopped")
+    async def on_assistant_turn_stopped(_aggregator, message: AssistantTurnStoppedMessage):
+        # The aggregator fires this event on every ``LLMFullResponseEndFrame``,
+        # including the tool-call round that precedes the tool result and has
+        # no spoken text. Skip those so we only forward the LLM's final
+        # response to the voice agent.
+        if not message.content:
+            return
+        if state["job_id"] is None:
+            return
+        job_id, state["job_id"] = state["job_id"], None
+        logger.info(f"Controller: answering job {job_id[:8]}")
+        await worker.send_job_response(job_id, response={"answer": message.content})
+
+    return worker
+
+
+async def run_bot(transport: BaseTransport, runner_args: RunnerArguments):
+    logger.info("Starting sensor-controller bot")
+
+    # Voice agent: standard transport + STT + LLM + TTS pipeline. The
+    # only tool the voice LLM has is ``ask_controller`` — it does not
+    # know anything about temperatures, trends, or response rates.
+    stt = DeepgramSTTService(api_key=os.environ["DEEPGRAM_API_KEY"])
+    tts = CartesiaTTSService(
+        api_key=os.environ["CARTESIA_API_KEY"],
+        settings=CartesiaTTSService.Settings(
+            voice="9626c31c-bec5-4cca-baa8-f8ba9e84c8bc",  # Jacqueline
+        ),
+    )
+
+    async def ask_controller(params: FunctionCallParams, question: str):
+        """Ask the temperature sensor controller anything about the sensor.
+
+        Forward the user's request verbatim and speak back the answer.
+
+        Args:
+            question (str): The user's question or instruction to forward to the controller.
+        """
+        logger.info(f"Voice agent: forwarding to controller: '{question}'")
+        async with params.pipeline_task.job(
+            "controller", payload={"question": question}, timeout=30
+        ) as t:
+            pass
+        await params.result_callback(t.response["answer"])
+
+    llm = OpenAILLMService(
+        api_key=os.environ["OPENAI_API_KEY"],
+        settings=OpenAILLMService.Settings(
+            system_instruction=(
+                "You are a friendly voice assistant with access to a temperature "
+                "sensor controller. For ANY request about the temperature — "
+                "reading it, adjusting it, checking trends, changing how fast it "
+                "responds — call the ask_controller tool. Forward the user's "
+                "request verbatim. Then speak the controller's answer back. "
+                "Keep responses brief; do not add extra commentary."
+            ),
+        ),
+    )
+    llm.register_direct_function(ask_controller, timeout_secs=60)
+
+    context = LLMContext(tools=ToolsSchema(standard_tools=[ask_controller]))
+    aggregators = LLMContextAggregatorPair(
+        context,
+        user_params=LLMUserAggregatorParams(vad_analyzer=SileroVADAnalyzer()),
+    )
+
+    pipeline = Pipeline(
+        [
+            transport.input(),
+            stt,
+            aggregators.user(),
+            llm,
+            tts,
+            transport.output(),
+            aggregators.assistant(),
+        ]
+    )
+
+    task = PipelineTask(
+        pipeline,
+        params=PipelineParams(
+            enable_metrics=True,
+            enable_usage_metrics=True,
+        ),
+        idle_timeout_secs=runner_args.pipeline_idle_timeout_secs,
+    )
+
+    runner = PipelineRunner(handle_sigint=runner_args.handle_sigint)
+
+    @transport.event_handler("on_client_connected")
+    async def on_client_connected(transport, client):
+        logger.info("Client connected")
+        context.add_message(
+            {
+                "role": "developer",
+                "content": (
+                    "Greet the user and let them know you can read or adjust a "
+                    "temperature sensor on their behalf."
+                ),
+            }
+        )
+        await task.queue_frame(LLMRunFrame())
+
+    @transport.event_handler("on_client_disconnected")
+    async def on_client_disconnected(transport, client):
+        logger.info("Client disconnected")
+        await runner.cancel()
+
+    await runner.spawn(build_sensor_controller())
+    await runner.spawn(task)
+
+    await runner.run()
+
+
+async def bot(runner_args: RunnerArguments):
+    """Main bot entry point compatible with Pipecat Cloud."""
+    transport = await create_transport(runner_args, transport_params)
+    await run_bot(transport, runner_args)
+
+
+if __name__ == "__main__":
+    from pipecat.runner.run import main
+
+    main()