workflow_test working except for text_input node

hackathon demo
2024-11-01 21:56:30 -07:00 · 2024-10-21 22:35:20 -07:00
6 changed files with 225 additions and 0 deletions
--- a/src/pipecat/workflow/.gitignore
+++ b/src/pipecat/workflow/.gitignore
@@ -0,0 +1 @@
 *.json
--- a/src/pipecat/workflow/README.md
+++ b/src/pipecat/workflow/README.md
@@ -0,0 +1 @@
 python -m pipecat.workflow.workflow_test to run 
--- a/src/pipecat/workflow/init.py
+++ b/src/pipecat/workflow/init.py
--- a/src/pipecat/workflow/workflow_mapping.py
+++ b/src/pipecat/workflow/workflow_mapping.py
@@ -0,0 +1,18 @@
 from ..services.cartesia import CartesiaTTSService
 from ..services.openai import OpenAILLMService
 from ..services.deepgram import DeepgramSTTService
 from ..transports.services.daily import DailyTransport
 from ..processors.frame_processor import FrameProcessor
 # Map workflow types to their corresponding Python classes
 WORKFLOW_MAPPING = {
    "inputs/audio_input": DailyTransport,
    "processors/speech_to_text": DeepgramSTTService,
    "processors/llm": OpenAILLMService,
    "processors/text_to_speech": CartesiaTTSService,
    "outputs/audio_output": DailyTransport,
 }
 def get_processor_class(node_type: str) -> type[FrameProcessor]:
    return WORKFLOW_MAPPING.get(node_type, FrameProcessor)
--- a/src/pipecat/workflow/workflow_test.py
+++ b/src/pipecat/workflow/workflow_test.py
@@ -0,0 +1,65 @@
 import asyncio
 import os
 from dotenv import load_dotenv
 from ..pipeline.pipeline import Pipeline
 from ..pipeline.runner import PipelineRunner
 from ..pipeline.task import PipelineTask, PipelineParams
 from .workflow_translator import translate_workflow
 from ..services.openai import OpenAIUserContextAggregator
 load_dotenv(override=True)
 async def main():
    print("Starting workflow test")
    # Update the path to the workflow.json file
    script_dir = os.path.dirname(os.path.abspath(__file__))
    workflow_path = os.path.join(script_dir, "workflow.json")
    print(f"Workflow path: {workflow_path}")
    # Translate the workflow to a list of processors
    print("Translating workflow to processors")
    processors, daily_transport = translate_workflow(workflow_path)
    print(f"Processors created: {processors}")
    # Create a pipeline from the processors
    print("Creating pipeline")
    pipeline = Pipeline(processors)
    print(f"Pipeline created: {pipeline}")
    # Create a pipeline task
    print("Creating pipeline task")
    task = PipelineTask(pipeline, PipelineParams(allow_interruptions=True))
    print(f"Pipeline task created: {task}")
    # Create a pipeline runner
    print("Creating pipeline runner")
    runner = PipelineRunner()
    print(f"Pipeline runner created: {runner}")
    user_context_aggregator = next(
        p for p in processors if isinstance(p, OpenAIUserContextAggregator)
    )
    @daily_transport.event_handler("on_first_participant_joined")
    async def on_first_participant_joined(transport, participant):
        transport.capture_participant_transcription(participant["id"])
        await task.queue_frames([user_context_aggregator.get_context_frame()])
    # Run the pipeline
    print("Running the pipeline")
    try:
        await runner.run(task)
        print("Pipeline execution completed successfully")
    except Exception as e:
        print(f"Error during pipeline execution: {e}")
    print("Workflow test completed")
 if __name__ == "__main__":
    print("Starting main execution")
    asyncio.run(main())
    print("Main execution completed")
--- a/src/pipecat/workflow/workflow_translator.py
+++ b/src/pipecat/workflow/workflow_translator.py
@@ -0,0 +1,140 @@
 import json
 import os
 from typing import Any, Dict, List, Tuple
 from .workflow_mapping import get_processor_class
 from ..processors.frame_processor import FrameProcessor
 from ..transports.services.daily import DailyParams
 from ..processors.aggregators.openai_llm_context import OpenAILLMContext
 from ..audio.vad.silero import SileroVADAnalyzer
 from ..transports.base_transport import BaseTransport
 def load_workflow(file_path: str) -> Dict[str, Any]:
    print(f"Loading workflow from file: {file_path}")
    try:
        with open(file_path, "r") as f:
            workflow = json.load(f)
        print(f"Workflow loaded successfully: {workflow}")
        return workflow
    except Exception as e:
        print(f"Error loading workflow: {e}")
        raise
 def create_processor(node: Dict[str, Any], next_node: Dict[str, Any] = None) -> FrameProcessor:
    print(f"Creating processor for node: {node['id']} of type: {node['type']}")
    processor_class = get_processor_class(node["type"])
    print(f"Processor class: {processor_class}")
    # Extract relevant properties for initialization
    init_params = {}
    if node["type"] == "inputs/audio_input":
        init_params = {
            "room_url": os.getenv("DAILY_SAMPLE_ROOM_URL"),
            "token": "",
            "bot_name": "PipecatBot",
            "params": DailyParams(
                audio_out_enabled=True,
                vad_enabled=True,
                vad_audio_passthrough=True,
                vad_analyzer=SileroVADAnalyzer(),
            ),
        }
    elif node["type"] == "processors/speech_to_text":
        init_params = {
            "api_key": os.getenv("DEEPGRAM_API_KEY"),
        }
    elif node["type"] == "processors/text_to_speech":
        init_params = {
            "api_key": os.getenv("CARTESIA_API_KEY"),
            "voice_id": "79a125e8-cd45-4c13-8a67-188112f4dd22",
        }
    print(f"Initialization parameters: {init_params}")
    processor = processor_class(**init_params)
    print(f"Processor created: {processor}")
    return processor
 def create_pipeline(workflow: Dict[str, Any]) -> Tuple[List[FrameProcessor], BaseTransport]:
    print("Creating pipeline from workflow")
    nodes = {node["id"]: node for node in workflow["nodes"]}
    links = workflow["links"]
    print(f"Nodes: {nodes}")
    print(f"Links: {links}")
    # Create a dictionary to store processors
    processors = {}
    daily_transport = None
    llm_service = None
    context_aggregator = None
    # Create processors for each node
    for node_id, node in nodes.items():
        print(f"Creating processor for node: {node_id}")
        if node["type"] == "inputs/audio_input":
            daily_transport = create_processor(node)
            processors[node_id] = {"processor": daily_transport, "type": node["type"]}
        elif node["type"] == "outputs/audio_output":
            if daily_transport is None:
                raise ValueError("Audio output transport node found before audio input node")
            processors[node_id] = {"processor": daily_transport, "type": node["type"]}
        elif node["type"] == "processors/llm":
            llm_service = create_processor(node)
            processors[node_id] = {"processor": llm_service, "type": node["type"]}
            context = OpenAILLMContext(
                [
                    {
                        "role": "system",
                        "content": "You are a helpful assistant. Your name is Housecat. You are participating in a voice conversation. Keep your answers brief. For punctuation use only period, comma, and question mark.",
                    },
                    {"role": "user", "content": "Introduce yourself."},
                ]
            )
            context_aggregator = llm_service.create_context_aggregator(context)
            print(f"Context aggregator created: {context_aggregator}")
        else:
            processors[node_id] = {"processor": create_processor(node), "type": node["type"]}
    # Create the pipeline based on the links
    pipeline = []
    for link in links:
        source_id, _, _, target_id, _, _ = link
        print(f"Processing link: {source_id} -> {target_id}")
        if processors[source_id]["processor"] not in pipeline:
            print(f"Adding source processor: {source_id}, {processors[source_id]['processor']}")
            if processors[source_id]["type"] == "inputs/audio_input":
                pipeline.append(processors[source_id]["processor"].input())
            else:
                pipeline.append(processors[source_id]["processor"])
        if processors[target_id]["processor"] not in pipeline and target_id in processors:
            print(f"Adding target processor: {target_id} {processors[target_id]['processor']}")
            if processors[target_id]["type"] == "outputs/audio_output":
                pipeline.append(processors[target_id]["processor"].output())
            elif processors[target_id]["type"] == "processors/llm":
                print("TRYING TO LINK AGGREGATOR")
                if context_aggregator:
                    print("AGGREGATOR FOUND")
                    pipeline.append(context_aggregator.user())
                pipeline.append(processors[target_id]["processor"])
            else:
                pipeline.append(processors[target_id]["processor"])
    print(f"Pipeline created with {len(pipeline)} processors")
    print(f"Pipeline: {pipeline}")
    return pipeline, daily_transport
 def translate_workflow(file_path: str) -> Tuple[List[FrameProcessor], BaseTransport]:
    print(f"Translating workflow from file: {file_path}")
    workflow = load_workflow(file_path)
    pipeline, transport = create_pipeline(workflow)
    print("Workflow translation completed")
    return pipeline, transport
Author	SHA1	Message	Date
Kwindla Hultman Kramer	b20687e32a	workflow_test working except for text_input node	2024-11-01 21:56:30 -07:00
hyypeman	388b3a239b	hackathon demo	2024-10-21 22:35:20 -07:00
		`@@ -0,0 +1 @@`
							`python -m pipecat.workflow.workflow_test to run`