Spaces:

Deadmon
/

pipecat

Runtime error

App Files Files Community

Deadmon commited on May 10

Commit

1366db9

verified ·

1 Parent(s): 95c84ab

Upload 12 files

Browse files

Files changed (12) hide show

.gitignore +165 -0
bot_constants.py +23 -0
bot_definitions.py +55 -0
bot_registry.py +137 -0
bot_runner.py +247 -0
bot_runner_helpers.py +211 -0
call_connection_manager.py +608 -0
call_transfer.py +465 -0
image.png +0 -0
simple_dialin.py +192 -0
simple_dialout.py +184 -0
voicemail_detection.py +449 -0

.gitignore ADDED Viewed

	@@ -0,0 +1,165 @@

+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+# C extensions
+*.so
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+share/python-wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+# PyInstaller
+#  Usually these files are written by a python script from a template
+#  before PyInstaller builds the exe, so as to inject date/other infos into it.
+*.manifest
+*.spec
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.nox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+*.py,cover
+.hypothesis/
+.pytest_cache/
+cover/
+# Translations
+*.mo
+*.pot
+# Django stuff:
+*.log
+local_settings.py
+db.sqlite3
+db.sqlite3-journal
+# Flask stuff:
+instance/
+.webassets-cache
+# Scrapy stuff:
+.scrapy
+# Sphinx documentation
+docs/_build/
+# PyBuilder
+.pybuilder/
+target/
+# Jupyter Notebook
+.ipynb_checkpoints
+# IPython
+profile_default/
+ipython_config.py
+# pyenv
+#   For a library or package, you might want to ignore these files since the code is
+#   intended to run in multiple environments; otherwise, check them in:
+# .python-version
+# pipenv
+#   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
+#   However, in case of collaboration, if having platform-specific dependencies or dependencies
+#   having no cross-platform support, pipenv may install dependencies that don't work, or not
+#   install all needed dependencies.
+#Pipfile.lock
+# poetry
+#   Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control.
+#   This is especially recommended for binary packages to ensure reproducibility, and is more
+#   commonly ignored for libraries.
+#   https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control
+#poetry.lock
+# pdm
+#   Similar to Pipfile.lock, it is generally recommended to include pdm.lock in version control.
+#pdm.lock
+#   pdm stores project-wide configurations in .pdm.toml, but it is recommended to not include it
+#   in version control.
+#   https://pdm.fming.dev/#use-with-ide
+.pdm.toml
+# PEP 582; used by e.g. github.com/David-OConnor/pyflow and github.com/pdm-project/pdm
+__pypackages__/
+# Celery stuff
+celerybeat-schedule
+celerybeat.pid
+# SageMath parsed files
+*.sage.py
+# Environments
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+# Spyder project settings
+.spyderproject
+.spyproject
+# Rope project settings
+.ropeproject
+# mkdocs documentation
+/site
+# mypy
+.mypy_cache/
+.dmypy.json
+dmypy.json
+# Pyre type checker
+.pyre/
+# pytype static type analyzer
+.pytype/
+# Cython debug symbols
+cython_debug/
+# PyCharm
+#  JetBrains specific template is maintained in a separate JetBrains.gitignore that can
+#  be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore
+#  and can be added to the global gitignore or merged into this file.  For a more nuclear
+#  option (not recommended) you can uncomment the following to ignore the entire idea folder.
+#.idea/
+runpod.toml
+# custom script to recursively upgrade items in requirements.py
+upgrade_requirements.py
+.DS_Store

bot_constants.py ADDED Viewed

	@@ -0,0 +1,23 @@

+# bot_constants.py
+"""Constants used across the bot runner application."""
+# Maximum session time
+MAX_SESSION_TIME = 5 * 60  # 5 minutes
+# Required environment variables
+REQUIRED_ENV_VARS = [
+    "OPENAI_API_KEY",
+    "GOOGLE_API_KEY",
+    "DAILY_API_KEY",
+    "CARTESIA_API_KEY",
+    "DEEPGRAM_API_KEY",
+]
+# Default example to use when handling dialin webhooks - determines which bot type to run
+DEFAULT_DIALIN_EXAMPLE = "call_transfer"  # Options: call_transfer, simple_dialin
+# Call transfer configuration constants
+DEFAULT_CALLTRANSFER_MODE = "dialout"
+DEFAULT_SPEAK_SUMMARY = True  # Speak a summary of the call to the operator
+DEFAULT_STORE_SUMMARY = False  # Store summary of the call (for future implementation)
+DEFAULT_TEST_IN_PREBUILT = False  # Test in prebuilt mode (bypasses need to dial in/out)

bot_definitions.py ADDED Viewed

	@@ -0,0 +1,55 @@

+# bot_definitions.py
+"""Definitions of different bot types for the bot registry."""
+from bot_registry import BotRegistry, BotType
+from bot_runner_helpers import (
+    create_call_transfer_settings,
+    create_simple_dialin_settings,
+    create_simple_dialout_settings,
+)
+# Create and configure the bot registry
+bot_registry = BotRegistry()
+# Register bot types
+bot_registry.register(
+    BotType(
+        name="call_transfer",
+        settings_creator=create_call_transfer_settings,
+        required_settings=["dialin_settings"],
+        incompatible_with=["simple_dialin", "simple_dialout", "voicemail_detection"],
+        auto_add_settings={"dialin_settings": {}},
+    )
+)
+bot_registry.register(
+    BotType(
+        name="simple_dialin",
+        settings_creator=create_simple_dialin_settings,
+        required_settings=["dialin_settings"],
+        incompatible_with=["call_transfer", "simple_dialout", "voicemail_detection"],
+        auto_add_settings={"dialin_settings": {}},
+    )
+)
+bot_registry.register(
+    BotType(
+        name="simple_dialout",
+        settings_creator=create_simple_dialout_settings,
+        required_settings=["dialout_settings"],
+        incompatible_with=["call_transfer", "simple_dialin", "voicemail_detection"],
+        auto_add_settings={"dialout_settings": [{}]},
+    )
+)
+bot_registry.register(
+    BotType(
+        name="voicemail_detection",
+        settings_creator=lambda body: body.get(
+            "voicemail_detection", {}
+        ),  # No creator function in original code
+        required_settings=["dialout_settings"],
+        incompatible_with=["call_transfer", "simple_dialin", "simple_dialout"],
+        auto_add_settings={"dialout_settings": [{}]},
+    )
+)

bot_registry.py ADDED Viewed

	@@ -0,0 +1,137 @@

+# bot_registry.py
+"""Bot registry pattern for managing different bot types."""
+from typing import Any, Callable, Dict, List, Optional
+from bot_constants import DEFAULT_DIALIN_EXAMPLE
+from bot_runner_helpers import ensure_dialout_settings_array
+from fastapi import HTTPException
+class BotType:
+    """Bot type configuration and handling."""
+    def __init__(
+        self,
+        name: str,
+        settings_creator: Callable[[Dict[str, Any]], Dict[str, Any]],
+        required_settings: list = None,
+        incompatible_with: list = None,
+        auto_add_settings: dict = None,
+    ):
+        """Initialize a bot type.
+        Args:
+            name: Name of the bot type
+            settings_creator: Function to create/update settings for this bot type
+            required_settings: List of settings this bot type requires
+            incompatible_with: List of bot types this one cannot be used with
+            auto_add_settings: Settings to add if this bot is being run in test mode
+        """
+        self.name = name
+        self.settings_creator = settings_creator
+        self.required_settings = required_settings or []
+        self.incompatible_with = incompatible_with or []
+        self.auto_add_settings = auto_add_settings or {}
+    def has_test_mode(self, body: Dict[str, Any]) -> bool:
+        """Check if this bot type is configured for test mode."""
+        return self.name in body and body[self.name].get("testInPrebuilt", False)
+    def create_settings(self, body: Dict[str, Any]) -> Dict[str, Any]:
+        """Create or update settings for this bot type."""
+        body[self.name] = self.settings_creator(body)
+        return body
+    def prepare_for_test(self, body: Dict[str, Any]) -> Dict[str, Any]:
+        """Add required settings for test mode if they don't exist."""
+        for setting, default_value in self.auto_add_settings.items():
+            if setting not in body:
+                body[setting] = default_value
+        return body
+class BotRegistry:
+    """Registry for managing different bot types."""
+    def __init__(self):
+        self.bots = {}
+        self.bot_validation_rules = []
+    def register(self, bot_type: BotType):
+        """Register a bot type."""
+        self.bots[bot_type.name] = bot_type
+        return self
+    def get_bot(self, name: str) -> BotType:
+        """Get a bot type by name."""
+        return self.bots.get(name)
+    def detect_bot_type(self, body: Dict[str, Any]) -> Optional[str]:
+        """Detect which bot type to use based on configuration."""
+        # First check for test mode bots
+        for name, bot in self.bots.items():
+            if bot.has_test_mode(body):
+                return name
+        # Then check for specific combinations of settings
+        for name, bot in self.bots.items():
+            if name in body and all(req in body for req in bot.required_settings):
+                return name
+        # Default for dialin settings
+        if "dialin_settings" in body:
+            return DEFAULT_DIALIN_EXAMPLE
+        return None
+    def validate_bot_combination(self, body: Dict[str, Any]) -> List[str]:
+        """Validate that bot types in the configuration are compatible."""
+        errors = []
+        bot_types_in_config = [name for name in self.bots.keys() if name in body]
+        # Check each bot type against its incompatible list
+        for bot_name in bot_types_in_config:
+            bot = self.bots[bot_name]
+            for incompatible in bot.incompatible_with:
+                if incompatible in body:
+                    errors.append(
+                        f"Cannot have both '{bot_name}' and '{incompatible}' in the same configuration"
+                    )
+        return errors
+    def setup_configuration(self, body: Dict[str, Any]) -> Dict[str, Any]:
+        """Set up bot configuration based on detected bot type."""
+        # Ensure dialout_settings is an array if present
+        body = ensure_dialout_settings_array(body)
+        # Detect which bot type to use
+        bot_type_name = self.detect_bot_type(body)
+        if not bot_type_name:
+            raise HTTPException(
+                status_code=400, detail="Configuration doesn't match any supported scenario"
+            )
+        # If we have a dialin scenario but no explicit bot type, add the default
+        if "dialin_settings" in body and bot_type_name == DEFAULT_DIALIN_EXAMPLE:
+            if bot_type_name not in body:
+                body[bot_type_name] = {}
+        # Get the bot type object
+        bot_type = self.get_bot(bot_type_name)
+        # Create/update settings for the bot type
+        body = bot_type.create_settings(body)
+        # If in test mode, add any required settings
+        if bot_type.has_test_mode(body):
+            body = bot_type.prepare_for_test(body)
+        # Validate bot combinations
+        errors = self.validate_bot_combination(body)
+        if errors:
+            error_message = "Invalid configuration: " + "; ".join(errors)
+            raise HTTPException(status_code=400, detail=error_message)
+        return body

bot_runner.py ADDED Viewed

	@@ -0,0 +1,247 @@

+import argparse
+import json
+import os
+import shlex
+import subprocess
+from contextlib import asynccontextmanager
+from typing import Any, Dict
+import aiohttp
+from bot_constants import (
+    MAX_SESSION_TIME,
+    REQUIRED_ENV_VARS,
+)
+from bot_definitions import bot_registry
+from bot_runner_helpers import (
+    determine_room_capabilities,
+    ensure_prompt_config,
+    process_dialin_request,
+)
+from dotenv import load_dotenv
+from fastapi import FastAPI, HTTPException, Request
+from fastapi.middleware.cors import CORSMiddleware
+from fastapi.responses import JSONResponse
+from pipecat.transports.services.helpers.daily_rest import (
+    DailyRESTHelper,
+    DailyRoomParams,
+    DailyRoomProperties,
+    DailyRoomSipParams,
+)
+load_dotenv(override=True)
+daily_helpers = {}
+# ----------------- Daily Room Management ----------------- #
+async def create_daily_room(room_url: str = None, config_body: Dict[str, Any] = None):
+    """Create or retrieve a Daily room with appropriate properties based on the configuration.
+    Args:
+        room_url: Optional existing room URL
+        config_body: Optional configuration that determines room capabilities
+    Returns:
+        Dict containing room URL, token, and SIP endpoint
+    """
+    if not room_url:
+        # Get room capabilities based on the configuration
+        capabilities = determine_room_capabilities(config_body)
+        # Configure SIP parameters if dialin is needed
+        sip_params = None
+        if capabilities["enable_dialin"]:
+            sip_params = DailyRoomSipParams(
+                display_name="dialin-user", video=False, sip_mode="dial-in", num_endpoints=2
+            )
+        # Create the properties object with the appropriate settings
+        properties = DailyRoomProperties(sip=sip_params)
+        # Set dialout capability if needed
+        if capabilities["enable_dialout"]:
+            properties.enable_dialout = True
+        # Log the capabilities being used
+        capability_str = ", ".join([f"{k}={v}" for k, v in capabilities.items()])
+        print(f"Creating room with capabilities: {capability_str}")
+        params = DailyRoomParams(properties=properties)
+        print("Creating new room...")
+        room = await daily_helpers["rest"].create_room(params=params)
+    else:
+        # Check if passed room URL exists
+        try:
+            room = await daily_helpers["rest"].get_room_from_url(room_url)
+        except Exception:
+            raise HTTPException(status_code=500, detail=f"Room not found: {room_url}")
+    print(f"Daily room: {room.url} {room.config.sip_endpoint}")
+    # Get token for the agent
+    token = await daily_helpers["rest"].get_token(room.url, MAX_SESSION_TIME)
+    if not room or not token:
+        raise HTTPException(status_code=500, detail="Failed to get room or token")
+    return {"room": room.url, "token": token, "sip_endpoint": room.config.sip_endpoint}
+# ----------------- Bot Process Management ----------------- #
+async def start_bot(room_details: Dict[str, str], body: Dict[str, Any], example: str) -> bool:
+    """Start a bot process with the given configuration.
+    Args:
+        room_details: Room URL and token
+        body: Bot configuration
+        example: Example script to run
+    Returns:
+        Boolean indicating success
+    """
+    room_url = room_details["room"]
+    token = room_details["token"]
+    # Properly format body as JSON string for command line
+    body_json = json.dumps(body).replace('"', '\\"')
+    print(f"++++ Body JSON: {body_json}")
+    # Modified to use non-LLM-specific bot module names
+    bot_proc = f'python3 -m {example} -u {room_url} -t {token} -b "{body_json}"'
+    print(f"Starting bot. Example: {example}, Room: {room_url}")
+    try:
+        command_parts = shlex.split(bot_proc)
+        subprocess.Popen(command_parts, bufsize=1, cwd=os.path.dirname(os.path.abspath(__file__)))
+        return True
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=f"Failed to start subprocess: {e}")
+# ----------------- API Setup ----------------- #
+@asynccontextmanager
+async def lifespan(app: FastAPI):
+    aiohttp_session = aiohttp.ClientSession()
+    daily_helpers["rest"] = DailyRESTHelper(
+        daily_api_key=os.getenv("DAILY_API_KEY", ""),
+        daily_api_url=os.getenv("DAILY_API_URL", "https://api.daily.co/v1"),
+        aiohttp_session=aiohttp_session,
+    )
+    yield
+    await aiohttp_session.close()
+app = FastAPI(lifespan=lifespan)
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=True,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+# ----------------- API Endpoints ----------------- #
+@app.post("/start")
+async def handle_start_request(request: Request) -> JSONResponse:
+    """Unified endpoint to handle bot configuration for different scenarios."""
+    # Get default room URL from environment
+    room_url = os.getenv("DAILY_SAMPLE_ROOM_URL", None)
+    try:
+        data = await request.json()
+        # Handle webhook test
+        if "test" in data:
+            return JSONResponse({"test": True})
+        # Handle direct dialin webhook from Daily
+        if all(key in data for key in ["From", "To", "callId", "callDomain"]):
+            body = await process_dialin_request(data)
+        # Handle body-based request
+        elif "config" in data:
+            # Use the registry to set up the bot configuration
+            body = bot_registry.setup_configuration(data["config"])
+        else:
+            raise HTTPException(status_code=400, detail="Invalid request format")
+        # Ensure prompt configuration
+        body = ensure_prompt_config(body)
+        # Detect which bot type to use
+        bot_type_name = bot_registry.detect_bot_type(body)
+        if not bot_type_name:
+            raise HTTPException(
+                status_code=400, detail="Configuration doesn't match any supported scenario"
+            )
+        # Create the Daily room
+        room_details = await create_daily_room(room_url, body)
+        # Start the bot
+        await start_bot(room_details, body, bot_type_name)
+        # Get the bot type
+        bot_type = bot_registry.get_bot(bot_type_name)
+        # Build the response
+        response = {"status": "Bot started", "bot_type": bot_type_name}
+        # Add room URL for test mode
+        if bot_type.has_test_mode(body):
+            response["room_url"] = room_details["room"]
+            # Remove llm_model from response as it's no longer relevant
+            if "llm" in body:
+                response["llm_provider"] = body["llm"]  # Optionally keep track of provider
+        # Add dialout info for dialout scenarios
+        if "dialout_settings" in body and len(body["dialout_settings"]) > 0:
+            first_setting = body["dialout_settings"][0]
+            if "phoneNumber" in first_setting:
+                response["dialing_to"] = f"phone:{first_setting['phoneNumber']}"
+            elif "sipUri" in first_setting:
+                response["dialing_to"] = f"sip:{first_setting['sipUri']}"
+        return JSONResponse(response)
+    except json.JSONDecodeError:
+        raise HTTPException(status_code=400, detail="Invalid JSON in request body")
+    except Exception as e:
+        raise HTTPException(status_code=400, detail=f"Request processing error: {str(e)}")
+# ----------------- Main ----------------- #
+if __name__ == "__main__":
+    # Check environment variables
+    for env_var in REQUIRED_ENV_VARS:
+        if env_var not in os.environ:
+            raise Exception(f"Missing environment variable: {env_var}.")
+    parser = argparse.ArgumentParser(description="Pipecat Bot Runner")
+    parser.add_argument(
+        "--host", type=str, default=os.getenv("HOST", "0.0.0.0"), help="Host address"
+    )
+    parser.add_argument("--port", type=int, default=os.getenv("PORT", 7860), help="Port number")
+    parser.add_argument("--reload", action="store_true", default=True, help="Reload code on change")
+    config = parser.parse_args()
+    try:
+        import uvicorn
+        uvicorn.run("bot_runner:app", host=config.host, port=config.port, reload=config.reload)
+    except KeyboardInterrupt:
+        print("Pipecat runner shutting down...")

bot_runner_helpers.py ADDED Viewed

	@@ -0,0 +1,211 @@

+# bot_runner_helpers.py
+from typing import Any, Dict, Optional
+from bot_constants import (
+    DEFAULT_CALLTRANSFER_MODE,
+    DEFAULT_DIALIN_EXAMPLE,
+    DEFAULT_SPEAK_SUMMARY,
+    DEFAULT_STORE_SUMMARY,
+    DEFAULT_TEST_IN_PREBUILT,
+)
+from call_connection_manager import CallConfigManager
+# ----------------- Configuration Helpers ----------------- #
+def determine_room_capabilities(config_body: Optional[Dict[str, Any]] = None) -> Dict[str, bool]:
+    """Determine room capabilities based on the configuration.
+    This function examines the configuration to determine which capabilities
+    the Daily room should have enabled.
+    Args:
+        config_body: Configuration dictionary that determines room capabilities
+    Returns:
+        Dictionary of capability flags
+    """
+    capabilities = {
+        "enable_dialin": False,
+        "enable_dialout": False,
+        # Add more capabilities here in the future as needed
+    }
+    if not config_body:
+        return capabilities
+    # Check for dialin capability
+    capabilities["enable_dialin"] = "dialin_settings" in config_body
+    # Check for dialout capability - needed for outbound calls or transfers
+    has_dialout_settings = "dialout_settings" in config_body
+    # Check if there's a transfer to an operator configured
+    has_call_transfer = "call_transfer" in config_body
+    # Enable dialout if any condition requires it
+    capabilities["enable_dialout"] = has_dialout_settings or has_call_transfer
+    return capabilities
+def ensure_dialout_settings_array(body: Dict[str, Any]) -> Dict[str, Any]:
+    """Ensures dialout_settings is an array of objects.
+    Args:
+        body: The configuration dictionary
+    Returns:
+        Updated configuration with dialout_settings as an array
+    """
+    if "dialout_settings" in body:
+        # Convert to array if it's not already one
+        if not isinstance(body["dialout_settings"], list):
+            body["dialout_settings"] = [body["dialout_settings"]]
+    return body
+def ensure_prompt_config(body: Dict[str, Any]) -> Dict[str, Any]:
+    """Ensures the body has appropriate prompts settings, but doesn't add defaults.
+    Only makes sure the prompt section exists, allowing the bot script to handle defaults.
+    Args:
+        body: The configuration dictionary
+    Returns:
+        Updated configuration with prompt settings section
+    """
+    if "prompts" not in body:
+        body["prompts"] = []
+    return body
+def create_call_transfer_settings(body: Dict[str, Any]) -> Dict[str, Any]:
+    """Create call transfer settings based on configuration and customer mapping.
+    Args:
+        body: The configuration dictionary
+    Returns:
+        Call transfer settings dictionary
+    """
+    # Default transfer settings
+    transfer_settings = {
+        "mode": DEFAULT_CALLTRANSFER_MODE,
+        "speakSummary": DEFAULT_SPEAK_SUMMARY,
+        "storeSummary": DEFAULT_STORE_SUMMARY,
+        "testInPrebuilt": DEFAULT_TEST_IN_PREBUILT,
+    }
+    # If call_transfer already exists, merge the defaults with the existing settings
+    # This ensures all required fields exist while preserving user-specified values
+    if "call_transfer" in body:
+        existing_settings = body["call_transfer"]
+        # Update defaults with existing settings (existing values will override defaults)
+        for key, value in existing_settings.items():
+            transfer_settings[key] = value
+    else:
+        # No existing call_transfer - check if we have dialin settings for customer lookup
+        if "dialin_settings" in body:
+            # Create a temporary routing manager just for customer lookup
+            call_config_manager = CallConfigManager(body)
+            # Get caller info
+            caller_info = call_config_manager.get_caller_info()
+            from_number = caller_info.get("caller_number")
+            if from_number:
+                # Get customer name from phone number
+                customer_name = call_config_manager.get_customer_name(from_number)
+                # If we know the customer name, add it to the config for the bot to use
+                if customer_name:
+                    transfer_settings["customerName"] = customer_name
+    return transfer_settings
+def create_simple_dialin_settings(body: Dict[str, Any]) -> Dict[str, Any]:
+    """Create simple dialin settings based on configuration.
+    Args:
+        body: The configuration dictionary
+    Returns:
+        Simple dialin settings dictionary
+    """
+    # Default simple dialin settings
+    simple_dialin_settings = {
+        "testInPrebuilt": DEFAULT_TEST_IN_PREBUILT,
+    }
+    # If simple_dialin already exists, merge the defaults with the existing settings
+    if "simple_dialin" in body:
+        existing_settings = body["simple_dialin"]
+        # Update defaults with existing settings (existing values will override defaults)
+        for key, value in existing_settings.items():
+            simple_dialin_settings[key] = value
+    return simple_dialin_settings
+def create_simple_dialout_settings(body: Dict[str, Any]) -> Dict[str, Any]:
+    """Create simple dialout settings based on configuration.
+    Args:
+        body: The configuration dictionary
+    Returns:
+        Simple dialout settings dictionary
+    """
+    # Default simple dialout settings
+    simple_dialout_settings = {
+        "testInPrebuilt": DEFAULT_TEST_IN_PREBUILT,
+    }
+    # If simple_dialout already exists, merge the defaults with the existing settings
+    if "simple_dialout" in body:
+        existing_settings = body["simple_dialout"]
+        # Update defaults with existing settings (existing values will override defaults)
+        for key, value in existing_settings.items():
+            simple_dialout_settings[key] = value
+    return simple_dialout_settings
+async def process_dialin_request(data: Dict[str, Any]) -> Dict[str, Any]:
+    """Process incoming dial-in request data to create a properly formatted body.
+    Converts camelCase fields received from webhook to snake_case format
+    for internal consistency across the codebase.
+    Args:
+        data: Raw dialin data from webhook
+    Returns:
+        Properly formatted configuration with snake_case keys
+    """
+    # Create base body with dialin settings
+    body = {
+        "dialin_settings": {
+            "to": data.get("To", ""),
+            "from": data.get("From", ""),
+            "call_id": data.get("callId", data.get("CallSid", "")),  # Convert to snake_case
+            "call_domain": data.get("callDomain", ""),  # Convert to snake_case
+        }
+    }
+    # Use the global default to determine which example to run for dialin webhooks
+    example = DEFAULT_DIALIN_EXAMPLE
+    # Configure the bot based on the example
+    if example == "call_transfer":
+        # Create call transfer settings
+        body["call_transfer"] = create_call_transfer_settings(body)
+    elif example == "simple_dialin":
+        # Create simple dialin settings
+        body["simple_dialin"] = create_simple_dialin_settings(body)
+    return body

call_connection_manager.py ADDED Viewed

	@@ -0,0 +1,608 @@

+#
+# Copyright (c) 2024–2025, Daily
+#
+# SPDX-License-Identifier: BSD 2-Clause License
+#
+"""call_connection_manager.py.
+Manages customer/operator relationships and call routing for voice bots.
+Provides mapping between customers and operators, and functions for retrieving
+contact information. Also includes call state management.
+"""
+import json
+import os
+from typing import Any, Dict, List, Optional
+from loguru import logger
+class CallFlowState:
+    """State for tracking call flow operations and state transitions."""
+    def __init__(self):
+        # Operator-related state
+        self.dialed_operator = False
+        self.operator_connected = False
+        self.current_operator_index = 0
+        self.operator_dialout_settings = []
+        self.summary_finished = False
+        # Voicemail detection state
+        self.voicemail_detected = False
+        self.human_detected = False
+        self.voicemail_message_left = False
+        # Call termination state
+        self.call_terminated = False
+        self.participant_left_early = False
+    # Operator-related methods
+    def set_operator_dialed(self):
+        """Mark that an operator has been dialed."""
+        self.dialed_operator = True
+    def set_operator_connected(self):
+        """Mark that an operator has connected to the call."""
+        self.operator_connected = True
+        # Summary is not finished when operator first connects
+        self.summary_finished = False
+    def set_operator_disconnected(self):
+        """Handle operator disconnection."""
+        self.operator_connected = False
+        self.summary_finished = False
+    def set_summary_finished(self):
+        """Mark the summary as finished."""
+        self.summary_finished = True
+    def set_operator_dialout_settings(self, settings):
+        """Set the list of operator dialout settings to try."""
+        self.operator_dialout_settings = settings
+        self.current_operator_index = 0
+    def get_current_dialout_setting(self):
+        """Get the current operator dialout setting to try."""
+        if not self.operator_dialout_settings or self.current_operator_index >= len(
+            self.operator_dialout_settings
+        ):
+            return None
+        return self.operator_dialout_settings[self.current_operator_index]
+    def move_to_next_operator(self):
+        """Move to the next operator in the list."""
+        self.current_operator_index += 1
+        return self.get_current_dialout_setting()
+    # Voicemail detection methods
+    def set_voicemail_detected(self):
+        """Mark that a voicemail system has been detected."""
+        self.voicemail_detected = True
+        self.human_detected = False
+    def set_human_detected(self):
+        """Mark that a human has been detected (not voicemail)."""
+        self.human_detected = True
+        self.voicemail_detected = False
+    def set_voicemail_message_left(self):
+        """Mark that a voicemail message has been left."""
+        self.voicemail_message_left = True
+    # Call termination methods
+    def set_call_terminated(self):
+        """Mark that the call has been terminated by the bot."""
+        self.call_terminated = True
+    def set_participant_left_early(self):
+        """Mark that a participant left the call early."""
+        self.participant_left_early = True
+class SessionManager:
+    """Centralized management of session IDs and state for all call participants."""
+    def __init__(self):
+        # Track session IDs of different participant types
+        self.session_ids = {
+            "operator": None,
+            "customer": None,
+            "bot": None,
+            # Add other participant types as needed
+        }
+        # References for easy access in processors that need mutable containers
+        self.session_id_refs = {
+            "operator": [None],
+            "customer": [None],
+            "bot": [None],
+            # Add other participant types as needed
+        }
+        # State object for call flow
+        self.call_flow_state = CallFlowState()
+    def set_session_id(self, participant_type, session_id):
+        """Set the session ID for a specific participant type.
+        Args:
+            participant_type: Type of participant (e.g., "operator", "customer", "bot")
+            session_id: The session ID to set
+        """
+        if participant_type in self.session_ids:
+            self.session_ids[participant_type] = session_id
+            # Also update the corresponding reference if it exists
+            if participant_type in self.session_id_refs:
+                self.session_id_refs[participant_type][0] = session_id
+    def get_session_id(self, participant_type):
+        """Get the session ID for a specific participant type.
+        Args:
+            participant_type: Type of participant (e.g., "operator", "customer", "bot")
+        Returns:
+            The session ID or None if not set
+        """
+        return self.session_ids.get(participant_type)
+    def get_session_id_ref(self, participant_type):
+        """Get the mutable reference for a specific participant type.
+        Args:
+            participant_type: Type of participant (e.g., "operator", "customer", "bot")
+        Returns:
+            A mutable list container holding the session ID or None if not available
+        """
+        return self.session_id_refs.get(participant_type)
+    def is_participant_type(self, session_id, participant_type):
+        """Check if a session ID belongs to a specific participant type.
+        Args:
+            session_id: The session ID to check
+            participant_type: Type of participant (e.g., "operator", "customer", "bot")
+        Returns:
+            True if the session ID matches the participant type, False otherwise
+        """
+        return self.session_ids.get(participant_type) == session_id
+    def reset_participant(self, participant_type):
+        """Reset the state for a specific participant type.
+        Args:
+            participant_type: Type of participant (e.g., "operator", "customer", "bot")
+        """
+        if participant_type in self.session_ids:
+            self.session_ids[participant_type] = None
+            if participant_type in self.session_id_refs:
+                self.session_id_refs[participant_type][0] = None
+            # Additional reset actions for specific participant types
+            if participant_type == "operator":
+                self.call_flow_state.set_operator_disconnected()
+class CallConfigManager:
+    """Manages customer/operator relationships and call routing."""
+    def __init__(self, body_data: Dict[str, Any] = None):
+        """Initialize with optional body data.
+        Args:
+            body_data: Optional dictionary containing request body data
+        """
+        self.body = body_data or {}
+        # Get environment variables with fallbacks
+        self.dial_in_from_number = os.getenv("DIAL_IN_FROM_NUMBER", "+10000000001")
+        self.dial_out_to_number = os.getenv("DIAL_OUT_TO_NUMBER", "+10000000002")
+        self.operator_number = os.getenv("OPERATOR_NUMBER", "+10000000003")
+        # Initialize maps with dynamic values
+        self._initialize_maps()
+        self._build_reverse_lookup_maps()
+    def _initialize_maps(self):
+        """Initialize the customer and operator maps with environment variables."""
+        # Maps customer names to their contact information
+        self.CUSTOMER_MAP = {
+            "Dominic": {
+                "phoneNumber": self.dial_in_from_number,  # I have two phone numbers, one for dialing in and one for dialing out. I give myself a separate name for each.
+            },
+            "Stewart": {
+                "phoneNumber": self.dial_out_to_number,
+            },
+            "James": {
+                "phoneNumber": "+10000000000",
+                "callerId": "james-caller-id-uuid",
+                "sipUri": "sip:[email protected]",
+            },
+            "Sarah": {
+                "sipUri": "sip:[email protected]",
+            },
+            "Michael": {
+                "phoneNumber": "+16505557890",
+                "callerId": "michael-caller-id-uuid",
+            },
+        }
+        # Maps customer names to their assigned operator names
+        self.CUSTOMER_TO_OPERATOR_MAP = {
+            "Dominic": ["Yunyoung", "Maria"],  # Try Yunyoung first, then Maria
+            "Stewart": "Yunyoung",
+            "James": "Yunyoung",
+            "Sarah": "Jennifer",
+            "Michael": "Paul",
+            # Default mapping to ensure all customers have an operator
+            "Default": "Yunyoung",
+        }
+        # Maps operator names to their contact details
+        self.OPERATOR_CONTACT_MAP = {
+            "Paul": {
+                "phoneNumber": "+12345678904",
+                "callerId": "paul-caller-id-uuid",
+            },
+            "Yunyoung": {
+                "phoneNumber": self.operator_number,  # Dials out to my other phone number.
+            },
+            "Maria": {
+                "sipUri": "sip:[email protected]",
+            },
+            "Jennifer": {"phoneNumber": "+14155559876", "callerId": "jennifer-caller-id-uuid"},
+            "Default": {
+                "phoneNumber": self.operator_number,  # Use the operator number as default
+            },
+        }
+    def _build_reverse_lookup_maps(self):
+        """Build reverse lookup maps for phone numbers and SIP URIs to customer names."""
+        self._PHONE_TO_CUSTOMER_MAP = {}
+        self._SIP_TO_CUSTOMER_MAP = {}
+        for customer_name, contact_info in self.CUSTOMER_MAP.items():
+            if "phoneNumber" in contact_info:
+                self._PHONE_TO_CUSTOMER_MAP[contact_info["phoneNumber"]] = customer_name
+            if "sipUri" in contact_info:
+                self._SIP_TO_CUSTOMER_MAP[contact_info["sipUri"]] = customer_name
+    @classmethod
+    def from_json_string(cls, json_string: str):
+        """Create a CallRoutingManager from a JSON string.
+        Args:
+            json_string: JSON string containing body data
+        Returns:
+            CallRoutingManager instance with parsed data
+        Raises:
+            json.JSONDecodeError: If JSON string is invalid
+        """
+        body_data = json.loads(json_string)
+        return cls(body_data)
+    def find_customer_by_contact(self, contact_info: str) -> Optional[str]:
+        """Find customer name from a contact identifier (phone number or SIP URI).
+        Args:
+            contact_info: The contact identifier (phone number or SIP URI)
+        Returns:
+            The customer name or None if not found
+        """
+        # Check if it's a phone number
+        if contact_info in self._PHONE_TO_CUSTOMER_MAP:
+            return self._PHONE_TO_CUSTOMER_MAP[contact_info]
+        # Check if it's a SIP URI
+        if contact_info in self._SIP_TO_CUSTOMER_MAP:
+            return self._SIP_TO_CUSTOMER_MAP[contact_info]
+        return None
+    def get_customer_name(self, phone_number: str) -> Optional[str]:
+        """Get customer name from their phone number.
+        Args:
+            phone_number: The customer's phone number
+        Returns:
+            The customer name or None if not found
+        """
+        # Note: In production, this would likely query a database
+        return self.find_customer_by_contact(phone_number)
+    def get_operators_for_customer(self, customer_name: Optional[str]) -> List[str]:
+        """Get the operator name(s) assigned to a customer.
+        Args:
+            customer_name: The customer's name
+        Returns:
+            List of operator names (single item or multiple)
+        """
+        # Note: In production, this would likely query a database
+        if not customer_name or customer_name not in self.CUSTOMER_TO_OPERATOR_MAP:
+            return ["Default"]
+        operators = self.CUSTOMER_TO_OPERATOR_MAP[customer_name]
+        # Convert single string to list for consistency
+        if isinstance(operators, str):
+            return [operators]
+        return operators
+    def get_operator_dialout_settings(self, operator_name: str) -> Dict[str, str]:
+        """Get an operator's dialout settings from their name.
+        Args:
+            operator_name: The operator's name
+        Returns:
+            Dictionary with dialout settings for the operator
+        """
+        # Note: In production, this would likely query a database
+        return self.OPERATOR_CONTACT_MAP.get(operator_name, self.OPERATOR_CONTACT_MAP["Default"])
+    def get_dialout_settings_for_caller(
+        self, from_number: Optional[str] = None
+    ) -> List[Dict[str, str]]:
+        """Determine the appropriate operator dialout settings based on caller's number.
+        This method uses the caller's number to look up the customer name,
+        then finds the assigned operators for that customer, and returns
+        an array of operator dialout settings to try in sequence.
+        Args:
+            from_number: The caller's phone number (from dialin_settings)
+        Returns:
+            List of operator dialout settings to try
+        """
+        if not from_number:
+            # If we don't have dialin settings, use the Default operator
+            return [self.get_operator_dialout_settings("Default")]
+        # Get customer name from phone number
+        customer_name = self.get_customer_name(from_number)
+        # Get operator names assigned to this customer
+        operator_names = self.get_operators_for_customer(customer_name)
+        # Get dialout settings for each operator
+        return [self.get_operator_dialout_settings(name) for name in operator_names]
+    def get_caller_info(self) -> Dict[str, Optional[str]]:
+        """Get caller and dialed numbers from dialin settings in the body.
+        Returns:
+            Dictionary containing caller_number and dialed_number
+        """
+        raw_dialin_settings = self.body.get("dialin_settings")
+        if not raw_dialin_settings:
+            return {"caller_number": None, "dialed_number": None}
+        # Handle different case variations
+        dialed_number = raw_dialin_settings.get("To") or raw_dialin_settings.get("to")
+        caller_number = raw_dialin_settings.get("From") or raw_dialin_settings.get("from")
+        return {"caller_number": caller_number, "dialed_number": dialed_number}
+    def get_caller_number(self) -> Optional[str]:
+        """Get the caller's phone number from dialin settings in the body.
+        Returns:
+            The caller's phone number or None if not available
+        """
+        return self.get_caller_info()["caller_number"]
+    async def start_dialout(self, transport, dialout_settings=None):
+        """Helper function to start dialout using the provided settings or from body.
+        Args:
+            transport: The transport instance to use for dialout
+            dialout_settings: Optional override for dialout settings
+        Returns:
+            None
+        """
+        # Use provided settings or get from body
+        settings = dialout_settings or self.get_dialout_settings()
+        if not settings:
+            logger.warning("No dialout settings available")
+            return
+        for setting in settings:
+            if "phoneNumber" in setting:
+                logger.info(f"Dialing number: {setting['phoneNumber']}")
+                if "callerId" in setting:
+                    logger.info(f"with callerId: {setting['callerId']}")
+                    await transport.start_dialout(
+                        {"phoneNumber": setting["phoneNumber"], "callerId": setting["callerId"]}
+                    )
+                else:
+                    logger.info("with no callerId")
+                    await transport.start_dialout({"phoneNumber": setting["phoneNumber"]})
+            elif "sipUri" in setting:
+                logger.info(f"Dialing sipUri: {setting['sipUri']}")
+                await transport.start_dialout({"sipUri": setting["sipUri"]})
+            else:
+                logger.warning(f"Unknown dialout setting format: {setting}")
+    def get_dialout_settings(self) -> Optional[List[Dict[str, Any]]]:
+        """Extract dialout settings from the body.
+        Returns:
+            List of dialout setting objects or None if not present
+        """
+        # Check if we have dialout settings
+        if "dialout_settings" in self.body:
+            dialout_settings = self.body["dialout_settings"]
+            # Convert to list if it's an object (for backward compatibility)
+            if isinstance(dialout_settings, dict):
+                return [dialout_settings]
+            elif isinstance(dialout_settings, list):
+                return dialout_settings
+        return None
+    def get_dialin_settings(self) -> Optional[Dict[str, Any]]:
+        """Extract dialin settings from the body.
+        Handles both camelCase and snake_case variations of fields for backward compatibility,
+        but normalizes to snake_case for internal usage.
+        Returns:
+            Dictionary containing dialin settings or None if not present
+        """
+        raw_dialin_settings = self.body.get("dialin_settings")
+        if not raw_dialin_settings:
+            return None
+        # Normalize dialin settings to handle different case variations
+        # Prioritize snake_case (call_id, call_domain) but fall back to camelCase (callId, callDomain)
+        dialin_settings = {
+            "call_id": raw_dialin_settings.get("call_id") or raw_dialin_settings.get("callId"),
+            "call_domain": raw_dialin_settings.get("call_domain")
+            or raw_dialin_settings.get("callDomain"),
+            "to": raw_dialin_settings.get("to") or raw_dialin_settings.get("To"),
+            "from": raw_dialin_settings.get("from") or raw_dialin_settings.get("From"),
+        }
+        return dialin_settings
+    # Bot prompt helper functions - no defaults provided, just return what's in the body
+    def get_prompt(self, prompt_name: str) -> Optional[str]:
+        """Retrieve the prompt text for a given prompt name.
+        Args:
+            prompt_name: The name of the prompt to retrieve.
+        Returns:
+            The prompt string corresponding to the provided name, or None if not configured.
+        """
+        prompts = self.body.get("prompts", [])
+        for prompt in prompts:
+            if prompt.get("name") == prompt_name:
+                return prompt.get("text")
+        return None
+    def get_transfer_mode(self) -> Optional[str]:
+        """Get transfer mode from the body.
+        Returns:
+            Transfer mode string or None if not configured
+        """
+        if "call_transfer" in self.body:
+            return self.body["call_transfer"].get("mode")
+        return None
+    def get_speak_summary(self) -> Optional[bool]:
+        """Get speak summary from the body.
+        Returns:
+            Boolean indicating if summary should be spoken or None if not configured
+        """
+        if "call_transfer" in self.body:
+            return self.body["call_transfer"].get("speakSummary")
+        return None
+    def get_store_summary(self) -> Optional[bool]:
+        """Get store summary from the body.
+        Returns:
+            Boolean indicating if summary should be stored or None if not configured
+        """
+        if "call_transfer" in self.body:
+            return self.body["call_transfer"].get("storeSummary")
+        return None
+    def is_test_mode(self) -> bool:
+        """Check if running in test mode.
+        Returns:
+            Boolean indicating if test mode is enabled
+        """
+        if "voicemail_detection" in self.body:
+            return bool(self.body["voicemail_detection"].get("testInPrebuilt"))
+        if "call_transfer" in self.body:
+            return bool(self.body["call_transfer"].get("testInPrebuilt"))
+        if "simple_dialin" in self.body:
+            return bool(self.body["simple_dialin"].get("testInPrebuilt"))
+        if "simple_dialout" in self.body:
+            return bool(self.body["simple_dialout"].get("testInPrebuilt"))
+        return False
+    def is_voicemail_detection_enabled(self) -> bool:
+        """Check if voicemail detection is enabled in the body.
+        Returns:
+            Boolean indicating if voicemail detection is enabled
+        """
+        return bool(self.body.get("voicemail_detection"))
+    def customize_prompt(self, prompt: str, customer_name: Optional[str] = None) -> str:
+        """Insert customer name into prompt template if available.
+        Args:
+            prompt: The prompt template containing optional {customer_name} placeholders
+            customer_name: Optional customer name to insert
+        Returns:
+            Customized prompt with customer name inserted
+        """
+        if customer_name and prompt:
+            return prompt.replace("{customer_name}", customer_name)
+        return prompt
+    def create_system_message(self, content: str) -> Dict[str, str]:
+        """Create a properly formatted system message.
+        Args:
+            content: The message content
+        Returns:
+            Dictionary with role and content for the system message
+        """
+        return {"role": "system", "content": content}
+    def create_user_message(self, content: str) -> Dict[str, str]:
+        """Create a properly formatted user message.
+        Args:
+            content: The message content
+        Returns:
+            Dictionary with role and content for the user message
+        """
+        return {"role": "user", "content": content}
+    def get_customer_info_suffix(
+        self, customer_name: Optional[str] = None, preposition: str = "for"
+    ) -> str:
+        """Create a consistent customer info suffix.
+        Args:
+            customer_name: Optional customer name
+            preposition: Preposition to use before the name (e.g., "for", "to", "")
+        Returns:
+            String with formatted customer info suffix
+        """
+        if not customer_name:
+            return ""
+        # Add a space before the preposition if it's not empty
+        space_prefix = " " if preposition else ""
+        # For non-empty prepositions, add a space after it
+        space_suffix = " " if preposition else ""
+        return f"{space_prefix}{preposition}{space_suffix}{customer_name}"

call_transfer.py ADDED Viewed

	@@ -0,0 +1,465 @@

+#
+# Copyright (c) 2024–2025, Daily
+#
+# SPDX-License-Identifier: BSD 2-Clause License
+#
+import argparse
+import asyncio
+import os
+import sys
+from call_connection_manager import CallConfigManager, SessionManager
+from dotenv import load_dotenv
+from loguru import logger
+from pipecat.adapters.schemas.function_schema import FunctionSchema
+from pipecat.adapters.schemas.tools_schema import ToolsSchema
+from pipecat.audio.vad.silero import SileroVADAnalyzer
+from pipecat.frames.frames import (
+    BotStoppedSpeakingFrame,
+    EndTaskFrame,
+    Frame,
+    LLMMessagesFrame,
+    TranscriptionFrame,
+)
+from pipecat.pipeline.pipeline import Pipeline
+from pipecat.pipeline.runner import PipelineRunner
+from pipecat.pipeline.task import PipelineParams, PipelineTask
+from pipecat.processors.aggregators.openai_llm_context import OpenAILLMContext
+from pipecat.processors.filters.function_filter import FunctionFilter
+from pipecat.processors.frame_processor import FrameDirection, FrameProcessor
+from pipecat.services.cartesia.tts import CartesiaTTSService
+from pipecat.services.llm_service import FunctionCallParams, LLMService
+from pipecat.services.openai.llm import OpenAILLMService
+from pipecat.transports.services.daily import DailyDialinSettings, DailyParams, DailyTransport
+load_dotenv(override=True)
+logger.remove(0)
+logger.add(sys.stderr, level="DEBUG")
+daily_api_key = os.getenv("DAILY_API_KEY", "")
+daily_api_url = os.getenv("DAILY_API_URL", "https://api.daily.co/v1")
+class TranscriptionModifierProcessor(FrameProcessor):
+    """Processor that modifies transcription frames before they reach the context aggregator."""
+    def __init__(self, operator_session_id_ref):
+        """Initialize with a reference to the operator_session_id variable.
+        Args:
+            operator_session_id_ref: A reference or container holding the operator's session ID
+        """
+        super().__init__()
+        self.operator_session_id_ref = operator_session_id_ref
+    async def process_frame(self, frame: Frame, direction: FrameDirection):
+        await super().process_frame(frame, direction)
+        # Only process frames that are moving downstream
+        if direction == FrameDirection.DOWNSTREAM:
+            # Check if the frame is a transcription frame
+            if isinstance(frame, TranscriptionFrame):
+                # Check if this frame is from the operator
+                if (
+                    self.operator_session_id_ref[0] is not None
+                    and hasattr(frame, "user_id")
+                    and frame.user_id == self.operator_session_id_ref[0]
+                ):
+                    # Modify the text to include operator prefix
+                    frame.text = f"[OPERATOR]: {frame.text}"
+                    logger.debug(f"++++ Modified Operator Transcription: {frame.text}")
+        # Push the (potentially modified) frame downstream
+        await self.push_frame(frame, direction)
+class SummaryFinished(FrameProcessor):
+    """Frame processor that monitors when summary has been finished."""
+    def __init__(self, dial_operator_state):
+        super().__init__()
+        # Store reference to the shared state object
+        self.dial_operator_state = dial_operator_state
+    async def process_frame(self, frame: Frame, direction: FrameDirection):
+        await super().process_frame(frame, direction)
+        # Check if operator is connected and this is the end of bot speaking
+        if self.dial_operator_state.operator_connected and isinstance(
+            frame, BotStoppedSpeakingFrame
+        ):
+            logger.debug("Summary finished, bot will stop speaking")
+            self.dial_operator_state.set_summary_finished()
+        await self.push_frame(frame, direction)
+async def main(
+    room_url: str,
+    token: str,
+    body: dict,
+):
+    # ------------ CONFIGURATION AND SETUP ------------
+    # Create a routing manager using the provided body
+    call_config_manager = CallConfigManager.from_json_string(body) if body else CallConfigManager()
+    # Get caller information
+    caller_info = call_config_manager.get_caller_info()
+    caller_number = caller_info["caller_number"]
+    dialed_number = caller_info["dialed_number"]
+    # Get customer name based on caller number
+    customer_name = call_config_manager.get_customer_name(caller_number) if caller_number else None
+    # Get appropriate operator settings based on the caller
+    operator_dialout_settings = call_config_manager.get_dialout_settings_for_caller(caller_number)
+    logger.info(f"Caller number: {caller_number}")
+    logger.info(f"Dialed number: {dialed_number}")
+    logger.info(f"Customer name: {customer_name}")
+    logger.info(f"Operator dialout settings: {operator_dialout_settings}")
+    # Check if in test mode
+    test_mode = call_config_manager.is_test_mode()
+    # Get dialin settings if present
+    dialin_settings = call_config_manager.get_dialin_settings()
+    # ------------ TRANSPORT SETUP ------------
+    # Set up transport parameters
+    if test_mode:
+        logger.info("Running in test mode")
+        transport_params = DailyParams(
+            api_url=daily_api_url,
+            api_key=daily_api_key,
+            audio_in_enabled=True,
+            audio_out_enabled=True,
+            video_out_enabled=False,
+            vad_analyzer=SileroVADAnalyzer(),
+            transcription_enabled=True,
+        )
+    else:
+        daily_dialin_settings = DailyDialinSettings(
+            call_id=dialin_settings.get("call_id"), call_domain=dialin_settings.get("call_domain")
+        )
+        transport_params = DailyParams(
+            api_url=daily_api_url,
+            api_key=daily_api_key,
+            dialin_settings=daily_dialin_settings,
+            audio_in_enabled=True,
+            audio_out_enabled=True,
+            video_out_enabled=False,
+            vad_analyzer=SileroVADAnalyzer(),
+            transcription_enabled=True,
+        )
+    # Initialize the session manager
+    session_manager = SessionManager()
+    # Set up the operator dialout settings
+    session_manager.call_flow_state.set_operator_dialout_settings(operator_dialout_settings)
+    # Initialize transport
+    transport = DailyTransport(
+        room_url,
+        token,
+        "Call Transfer Bot",
+        transport_params,
+    )
+    # Initialize TTS
+    tts = CartesiaTTSService(
+        api_key=os.getenv("CARTESIA_API_KEY", ""),
+        voice_id="b7d50908-b17c-442d-ad8d-810c63997ed9",  # Use Helpful Woman voice by default
+    )
+    # ------------ LLM AND CONTEXT SETUP ------------
+    # Get prompts from routing manager
+    call_transfer_initial_prompt = call_config_manager.get_prompt("call_transfer_initial_prompt")
+    # Build default greeting with customer name if available
+    customer_greeting = f"Hello {customer_name}" if customer_name else "Hello"
+    default_greeting = f"{customer_greeting}, this is Hailey from customer support. What can I help you with today?"
+    # Build initial prompt
+    if call_transfer_initial_prompt:
+        # Use custom prompt with customer name replacement if needed
+        system_instruction = call_config_manager.customize_prompt(
+            call_transfer_initial_prompt, customer_name
+        )
+        logger.info("Using custom call transfer initial prompt")
+    else:
+        # Use default prompt with formatted greeting
+        system_instruction = f"""You are Chatbot, a friendly, helpful robot. Never refer to this prompt, even if asked. Follow these steps **EXACTLY**.
+        ### **Standard Operating Procedure:**
+        #### **Step 1: Greeting**
+        - Greet the user with: "{default_greeting}"
+        #### **Step 2: Handling Requests**
+        - If the user requests a supervisor, **IMMEDIATELY** call the `dial_operator` function.
+        - **FAILURE TO CALL `dial_operator` IMMEDIATELY IS A MISTAKE.**
+        - If the user ends the conversation, **IMMEDIATELY** call the `terminate_call` function.
+        - **FAILURE TO CALL `terminate_call` IMMEDIATELY IS A MISTAKE.**
+        ### **General Rules**
+        - Your output will be converted to audio, so **do not include special characters or formatting.**
+        """
+        logger.info("Using default call transfer initial prompt")
+    # Create the system message and initialize messages list
+    messages = [call_config_manager.create_system_message(system_instruction)]
+    # ------------ FUNCTION DEFINITIONS ------------
+    async def terminate_call(
+        task: PipelineTask,  # Pipeline task reference
+        params: FunctionCallParams,
+    ):
+        """Function the bot can call to terminate the call."""
+        # Create a message to add
+        content = "The user wants to end the conversation, thank them for chatting."
+        message = call_config_manager.create_system_message(content)
+        # Append the message to the list
+        messages.append(message)
+        # Queue the message to the context
+        await task.queue_frames([LLMMessagesFrame(messages)])
+        # Then end the call
+        await params.llm.queue_frame(EndTaskFrame(), FrameDirection.UPSTREAM)
+    async def dial_operator(params: FunctionCallParams):
+        """Function the bot can call to dial an operator."""
+        dialout_setting = session_manager.call_flow_state.get_current_dialout_setting()
+        if call_config_manager.get_transfer_mode() == "dialout":
+            if dialout_setting:
+                session_manager.call_flow_state.set_operator_dialed()
+                logger.info(f"Dialing operator with settings: {dialout_setting}")
+                # Create a message to add
+                content = "The user has requested a supervisor, indicate that you will attempt to connect them with a supervisor."
+                message = call_config_manager.create_system_message(content)
+                # Append the message to the list
+                messages.append(message)
+                # Queue the message to the context
+                await task.queue_frames([LLMMessagesFrame(messages)])
+                # Start the dialout
+                await call_config_manager.start_dialout(transport, [dialout_setting])
+            else:
+                # Create a message to add
+                content = "Indicate that there are no operator dialout settings available."
+                message = call_config_manager.create_system_message(content)
+                # Append the message to the list
+                messages.append(message)
+                # Queue the message to the context
+                await task.queue_frames([LLMMessagesFrame(messages)])
+                logger.info("No operator dialout settings available")
+        else:
+            # Create a message to add
+            content = "Indicate that the current mode is not supported."
+            message = call_config_manager.create_system_message(content)
+            # Append the message to the list
+            messages.append(message)
+            # Queue the message to the context
+            await task.queue_frames([LLMMessagesFrame(messages)])
+            logger.info("Other mode not supported")
+    # Define function schemas for tools
+    terminate_call_function = FunctionSchema(
+        name="terminate_call",
+        description="Call this function to terminate the call.",
+        properties={},
+        required=[],
+    )
+    dial_operator_function = FunctionSchema(
+        name="dial_operator",
+        description="Call this function when the user asks to speak with a human",
+        properties={},
+        required=[],
+    )
+    # Create tools schema
+    tools = ToolsSchema(standard_tools=[terminate_call_function, dial_operator_function])
+    # Initialize LLM
+    llm = OpenAILLMService(api_key=os.getenv("OPENAI_API_KEY"))
+    # Register functions with the LLM
+    llm.register_function("terminate_call", lambda params: terminate_call(task, params))
+    llm.register_function("dial_operator", dial_operator)
+    # Initialize LLM context and aggregator
+    context = OpenAILLMContext(messages, tools)
+    context_aggregator = llm.create_context_aggregator(context)
+    # ------------ PIPELINE SETUP ------------
+    # Use the session manager's references
+    summary_finished = SummaryFinished(session_manager.call_flow_state)
+    transcription_modifier = TranscriptionModifierProcessor(
+        session_manager.get_session_id_ref("operator")
+    )
+    # Define function to determine if bot should speak
+    async def should_speak(self) -> bool:
+        result = (
+            not session_manager.call_flow_state.operator_connected
+            or not session_manager.call_flow_state.summary_finished
+        )
+        return result
+    # Build pipeline
+    pipeline = Pipeline(
+        [
+            transport.input(),  # Transport user input
+            transcription_modifier,  # Prepends operator transcription with [OPERATOR]
+            context_aggregator.user(),  # User responses
+            FunctionFilter(should_speak),
+            llm,
+            tts,
+            summary_finished,
+            transport.output(),  # Transport bot output
+            context_aggregator.assistant(),  # Assistant spoken responses
+        ]
+    )
+    # Create pipeline task
+    task = PipelineTask(
+        pipeline,
+        params=PipelineParams(allow_interruptions=True),
+    )
+    # ------------ EVENT HANDLERS ------------
+    @transport.event_handler("on_first_participant_joined")
+    async def on_first_participant_joined(transport, participant):
+        await transport.capture_participant_transcription(participant["id"])
+        # For the dialin case, we want the bot to answer the phone and greet the user
+        await task.queue_frames([context_aggregator.user().get_context_frame()])
+    @transport.event_handler("on_dialout_answered")
+    async def on_dialout_answered(transport, data):
+        logger.debug(f"++++ Dial-out answered: {data}")
+        await transport.capture_participant_transcription(data["sessionId"])
+        # Skip if operator already connected
+        if (
+            not session_manager.call_flow_state
+            or session_manager.call_flow_state.operator_connected
+        ):
+            logger.debug(f"Operator already connected: {data}")
+            return
+        logger.debug(f"Operator connected with session ID: {data['sessionId']}")
+        # Set operator session ID in the session manager
+        session_manager.set_session_id("operator", data["sessionId"])
+        # Update state
+        session_manager.call_flow_state.set_operator_connected()
+        # Determine message content based on configuration
+        if call_config_manager.get_speak_summary():
+            logger.debug("Bot will speak summary")
+            call_transfer_prompt = call_config_manager.get_prompt("call_transfer_prompt")
+            if call_transfer_prompt:
+                # Use custom prompt
+                logger.info("Using custom call transfer prompt")
+                content = call_config_manager.customize_prompt(call_transfer_prompt, customer_name)
+            else:
+                # Use default summary prompt
+                logger.info("Using default call transfer prompt")
+                customer_info = call_config_manager.get_customer_info_suffix(customer_name)
+                content = f"""An operator is joining the call{customer_info}.
+                    Give a brief summary of the customer's issues so far."""
+        else:
+            # Simple join notification without summary
+            logger.debug("Bot will not speak summary")
+            customer_info = call_config_manager.get_customer_info_suffix(customer_name)
+            content = f"""Indicate that an operator has joined the call{customer_info}."""
+        # Create and queue system message
+        message = call_config_manager.create_system_message(content)
+        messages.append(message)
+        await task.queue_frames([LLMMessagesFrame(messages)])
+    @transport.event_handler("on_dialout_stopped")
+    async def on_dialout_stopped(transport, data):
+        if session_manager.get_session_id("operator") and data[
+            "sessionId"
+        ] == session_manager.get_session_id("operator"):
+            logger.debug("Dialout to operator stopped")
+    @transport.event_handler("on_participant_left")
+    async def on_participant_left(transport, participant, reason):
+        logger.debug(f"Participant left: {participant}, reason: {reason}")
+        # Check if the operator is the one who left
+        if not (
+            session_manager.get_session_id("operator")
+            and participant["id"] == session_manager.get_session_id("operator")
+        ):
+            await task.cancel()
+            return
+        logger.debug("Operator left the call")
+        # Reset operator state
+        session_manager.reset_participant("operator")
+        # Determine message content
+        call_transfer_finished_prompt = call_config_manager.get_prompt(
+            "call_transfer_finished_prompt"
+        )
+        if call_transfer_finished_prompt:
+            # Use custom prompt for operator departure
+            logger.info("Using custom call transfer finished prompt")
+            content = call_config_manager.customize_prompt(
+                call_transfer_finished_prompt, customer_name
+            )
+        else:
+            # Use default prompt for operator departure
+            logger.info("Using default call transfer finished prompt")
+            customer_info = call_config_manager.get_customer_info_suffix(
+                customer_name, preposition=""
+            )
+            content = f"""The operator has left the call.
+                Resume your role as the primary support agent and use information from the operator's conversation to help the customer{customer_info}.
+                Let the customer know the operator has left and ask if they need further assistance."""
+        # Create and queue system message
+        message = call_config_manager.create_system_message(content)
+        messages.append(message)
+        await task.queue_frames([LLMMessagesFrame(messages)])
+    # ------------ RUN PIPELINE ------------
+    runner = PipelineRunner()
+    await runner.run(task)
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="Pipecat Call Transfer Bot")
+    parser.add_argument("-u", "--url", type=str, help="Room URL")
+    parser.add_argument("-t", "--token", type=str, help="Room Token")
+    parser.add_argument("-b", "--body", type=str, help="JSON configuration string")
+    args = parser.parse_args()
+    # Log the arguments for debugging
+    logger.info(f"Room URL: {args.url}")
+    logger.info(f"Token: {args.token}")
+    logger.info(f"Body provided: {bool(args.body)}")
+    asyncio.run(main(args.url, args.token, args.body))

image.png ADDED Viewed

simple_dialin.py ADDED Viewed

	@@ -0,0 +1,192 @@

+#
+# Copyright (c) 2024–2025, Daily
+#
+# SPDX-License-Identifier: BSD 2-Clause License
+#
+import argparse
+import asyncio
+import os
+import sys
+from call_connection_manager import CallConfigManager, SessionManager
+from dotenv import load_dotenv
+from loguru import logger
+from pipecat.adapters.schemas.function_schema import FunctionSchema
+from pipecat.adapters.schemas.tools_schema import ToolsSchema
+from pipecat.audio.vad.silero import SileroVADAnalyzer
+from pipecat.frames.frames import EndTaskFrame
+from pipecat.pipeline.pipeline import Pipeline
+from pipecat.pipeline.runner import PipelineRunner
+from pipecat.pipeline.task import PipelineParams, PipelineTask
+from pipecat.processors.aggregators.openai_llm_context import OpenAILLMContext
+from pipecat.processors.frame_processor import FrameDirection
+from pipecat.services.cartesia.tts import CartesiaTTSService
+from pipecat.services.llm_service import FunctionCallParams
+from pipecat.services.openai.llm import OpenAILLMService
+from pipecat.transports.services.daily import DailyDialinSettings, DailyParams, DailyTransport
+load_dotenv(override=True)
+logger.remove(0)
+logger.add(sys.stderr, level="DEBUG")
+daily_api_key = os.getenv("DAILY_API_KEY", "")
+daily_api_url = os.getenv("DAILY_API_URL", "https://api.daily.co/v1")
+async def main(
+    room_url: str,
+    token: str,
+    body: dict,
+):
+    # ------------ CONFIGURATION AND SETUP ------------
+    # Create a config manager using the provided body
+    call_config_manager = CallConfigManager.from_json_string(body) if body else CallConfigManager()
+    # Get important configuration values
+    test_mode = call_config_manager.is_test_mode()
+    # Get dialin settings if present
+    dialin_settings = call_config_manager.get_dialin_settings()
+    # Initialize the session manager
+    session_manager = SessionManager()
+    # ------------ TRANSPORT SETUP ------------
+    # Set up transport parameters
+    if test_mode:
+        logger.info("Running in test mode")
+        transport_params = DailyParams(
+            api_url=daily_api_url,
+            api_key=daily_api_key,
+            audio_in_enabled=True,
+            audio_out_enabled=True,
+            video_out_enabled=False,
+            vad_analyzer=SileroVADAnalyzer(),
+            transcription_enabled=True,
+        )
+    else:
+        daily_dialin_settings = DailyDialinSettings(
+            call_id=dialin_settings.get("call_id"), call_domain=dialin_settings.get("call_domain")
+        )
+        transport_params = DailyParams(
+            api_url=daily_api_url,
+            api_key=daily_api_key,
+            dialin_settings=daily_dialin_settings,
+            audio_in_enabled=True,
+            audio_out_enabled=True,
+            video_out_enabled=False,
+            vad_analyzer=SileroVADAnalyzer(),
+            transcription_enabled=True,
+        )
+    # Initialize transport with Daily
+    transport = DailyTransport(
+        room_url,
+        token,
+        "Simple Dial-in Bot",
+        transport_params,
+    )
+    # Initialize TTS
+    tts = CartesiaTTSService(
+        api_key=os.getenv("CARTESIA_API_KEY", ""),
+        voice_id="b7d50908-b17c-442d-ad8d-810c63997ed9",  # Use Helpful Woman voice by default
+    )
+    # ------------ FUNCTION DEFINITIONS ------------
+    async def terminate_call(params: FunctionCallParams):
+        """Function the bot can call to terminate the call upon completion of a voicemail message."""
+        if session_manager:
+            # Mark that the call was terminated by the bot
+            session_manager.call_flow_state.set_call_terminated()
+        # Then end the call
+        await params.llm.queue_frame(EndTaskFrame(), FrameDirection.UPSTREAM)
+    # Define function schemas for tools
+    terminate_call_function = FunctionSchema(
+        name="terminate_call",
+        description="Call this function to terminate the call.",
+        properties={},
+        required=[],
+    )
+    # Create tools schema
+    tools = ToolsSchema(standard_tools=[terminate_call_function])
+    # ------------ LLM AND CONTEXT SETUP ------------
+    # Set up the system instruction for the LLM
+    system_instruction = """You are Chatbot, a friendly, helpful robot. Your goal is to demonstrate your capabilities in a succinct way. Your output will be converted to audio so don't include special characters in your answers. Respond to what the user said in a creative and helpful way, but keep your responses brief. Start by introducing yourself. If the user ends the conversation, **IMMEDIATELY** call the `terminate_call` function. """
+    # Initialize LLM
+    llm = OpenAILLMService(api_key=os.getenv("OPENAI_API_KEY"))
+    # Register functions with the LLM
+    llm.register_function("terminate_call", terminate_call)
+    # Create system message and initialize messages list
+    messages = [call_config_manager.create_system_message(system_instruction)]
+    # Initialize LLM context and aggregator
+    context = OpenAILLMContext(messages, tools)
+    context_aggregator = llm.create_context_aggregator(context)
+    # ------------ PIPELINE SETUP ------------
+    # Build pipeline
+    pipeline = Pipeline(
+        [
+            transport.input(),  # Transport user input
+            context_aggregator.user(),  # User responses
+            llm,  # LLM
+            tts,  # TTS
+            transport.output(),  # Transport bot output
+            context_aggregator.assistant(),  # Assistant spoken responses
+        ]
+    )
+    # Create pipeline task
+    task = PipelineTask(pipeline, params=PipelineParams(allow_interruptions=True))
+    # ------------ EVENT HANDLERS ------------
+    @transport.event_handler("on_first_participant_joined")
+    async def on_first_participant_joined(transport, participant):
+        logger.debug(f"First participant joined: {participant['id']}")
+        await transport.capture_participant_transcription(participant["id"])
+        await task.queue_frames([context_aggregator.user().get_context_frame()])
+    @transport.event_handler("on_participant_left")
+    async def on_participant_left(transport, participant, reason):
+        logger.debug(f"Participant left: {participant}, reason: {reason}")
+        await task.cancel()
+    # ------------ RUN PIPELINE ------------
+    if test_mode:
+        logger.debug("Running in test mode (can be tested in Daily Prebuilt)")
+    runner = PipelineRunner()
+    await runner.run(task)
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="Simple Dial-in Bot")
+    parser.add_argument("-u", "--url", type=str, help="Room URL")
+    parser.add_argument("-t", "--token", type=str, help="Room Token")
+    parser.add_argument("-b", "--body", type=str, help="JSON configuration string")
+    args = parser.parse_args()
+    # Log the arguments for debugging
+    logger.info(f"Room URL: {args.url}")
+    logger.info(f"Token: {args.token}")
+    logger.info(f"Body provided: {bool(args.body)}")
+    asyncio.run(main(args.url, args.token, args.body))

simple_dialout.py ADDED Viewed

	@@ -0,0 +1,184 @@

+#
+# Copyright (c) 2024–2025, Daily
+#
+# SPDX-License-Identifier: BSD 2-Clause License
+#
+import argparse
+import asyncio
+import os
+import sys
+from call_connection_manager import CallConfigManager
+from dotenv import load_dotenv
+from loguru import logger
+from pipecat.adapters.schemas.function_schema import FunctionSchema
+from pipecat.adapters.schemas.tools_schema import ToolsSchema
+from pipecat.audio.vad.silero import SileroVADAnalyzer
+from pipecat.frames.frames import EndTaskFrame
+from pipecat.pipeline.pipeline import Pipeline
+from pipecat.pipeline.runner import PipelineRunner
+from pipecat.pipeline.task import PipelineParams, PipelineTask
+from pipecat.processors.aggregators.openai_llm_context import OpenAILLMContext
+from pipecat.processors.frame_processor import FrameDirection
+from pipecat.services.cartesia.tts import CartesiaTTSService
+from pipecat.services.llm_service import FunctionCallParams
+from pipecat.services.openai.llm import OpenAILLMService
+from pipecat.transports.services.daily import DailyParams, DailyTransport
+load_dotenv(override=True)
+logger.remove(0)
+logger.add(sys.stderr, level="DEBUG")
+daily_api_key = os.getenv("DAILY_API_KEY", "")
+daily_api_url = os.getenv("DAILY_API_URL", "https://api.daily.co/v1")
+async def main(
+    room_url: str,
+    token: str,
+    body: dict,
+):
+    # ------------ CONFIGURATION AND SETUP ------------
+    # Create a config manager using the provided body
+    call_config_manager = CallConfigManager.from_json_string(body) if body else CallConfigManager()
+    # Get important configuration values
+    dialout_settings = call_config_manager.get_dialout_settings()
+    test_mode = call_config_manager.is_test_mode()
+    # ------------ TRANSPORT SETUP ------------
+    transport_params = DailyParams(
+        api_url=daily_api_url,
+        api_key=daily_api_key,
+        audio_in_enabled=True,
+        audio_out_enabled=True,
+        video_out_enabled=False,
+        vad_analyzer=SileroVADAnalyzer(),
+        transcription_enabled=True,
+    )
+    # Initialize transport with Daily
+    transport = DailyTransport(
+        room_url,
+        token,
+        "Simple Dial-out Bot",
+        transport_params,
+    )
+    # Initialize TTS
+    tts = CartesiaTTSService(
+        api_key=os.getenv("CARTESIA_API_KEY", ""),
+        voice_id="b7d50908-b17c-442d-ad8d-810c63997ed9",  # Use Helpful Woman voice by default
+    )
+    # ------------ FUNCTION DEFINITIONS ------------
+    async def terminate_call(params: FunctionCallParams):
+        """Function the bot can call to terminate the call upon completion of a voicemail message."""
+        await params.llm.queue_frame(EndTaskFrame(), FrameDirection.UPSTREAM)
+    # Define function schemas for tools
+    terminate_call_function = FunctionSchema(
+        name="terminate_call",
+        description="Call this function to terminate the call.",
+        properties={},
+        required=[],
+    )
+    # Create tools schema
+    tools = ToolsSchema(standard_tools=[terminate_call_function])
+    # ------------ LLM AND CONTEXT SETUP ------------
+    # Set up the system instruction for the LLM
+    system_instruction = """You are Chatbot, a friendly, helpful robot. Your goal is to demonstrate your capabilities in a succinct way. Your output will be converted to audio so don't include special characters in your answers. Respond to what the user said in a creative and helpful way, but keep your responses brief. Start by introducing yourself. If the user ends the conversation, **IMMEDIATELY** call the `terminate_call` function. """
+    # Initialize LLM
+    llm = OpenAILLMService(api_key=os.getenv("OPENAI_API_KEY"))
+    # Register functions with the LLM
+    llm.register_function("terminate_call", terminate_call)
+    # Create system message and initialize messages list
+    messages = [call_config_manager.create_system_message(system_instruction)]
+    # Initialize LLM context and aggregator
+    context = OpenAILLMContext(messages, tools)
+    context_aggregator = llm.create_context_aggregator(context)
+    # ------------ PIPELINE SETUP ------------
+    # Build pipeline
+    pipeline = Pipeline(
+        [
+            transport.input(),  # Transport user input
+            context_aggregator.user(),  # User responses
+            llm,  # LLM
+            tts,  # TTS
+            transport.output(),  # Transport bot output
+            context_aggregator.assistant(),  # Assistant spoken responses
+        ]
+    )
+    # Create pipeline task
+    task = PipelineTask(pipeline, params=PipelineParams(allow_interruptions=True))
+    # ------------ EVENT HANDLERS ------------
+    @transport.event_handler("on_joined")
+    async def on_joined(transport, data):
+        # Start dialout if needed
+        if not test_mode and dialout_settings:
+            logger.debug("Dialout settings detected; starting dialout")
+            await call_config_manager.start_dialout(transport, dialout_settings)
+    @transport.event_handler("on_dialout_connected")
+    async def on_dialout_connected(transport, data):
+        logger.debug(f"Dial-out connected: {data}")
+    @transport.event_handler("on_dialout_answered")
+    async def on_dialout_answered(transport, data):
+        logger.debug(f"Dial-out answered: {data}")
+        # Automatically start capturing transcription for the participant
+        await transport.capture_participant_transcription(data["sessionId"])
+        # The bot will wait to hear the user before the bot speaks
+    @transport.event_handler("on_first_participant_joined")
+    async def on_first_participant_joined(transport, participant):
+        if test_mode:
+            logger.debug(f"First participant joined: {participant['id']}")
+            await transport.capture_participant_transcription(participant["id"])
+            # The bot will wait to hear the user before the bot speaks
+    @transport.event_handler("on_participant_left")
+    async def on_participant_left(transport, participant, reason):
+        logger.debug(f"Participant left: {participant}, reason: {reason}")
+        await task.cancel()
+    # ------------ RUN PIPELINE ------------
+    if test_mode:
+        logger.debug("Running in test mode (can be tested in Daily Prebuilt)")
+    runner = PipelineRunner()
+    await runner.run(task)
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="Simple Dial-out Bot")
+    parser.add_argument("-u", "--url", type=str, help="Room URL")
+    parser.add_argument("-t", "--token", type=str, help="Room Token")
+    parser.add_argument("-b", "--body", type=str, help="JSON configuration string")
+    args = parser.parse_args()
+    # Log the arguments for debugging
+    logger.info(f"Room URL: {args.url}")
+    logger.info(f"Token: {args.token}")
+    logger.info(f"Body provided: {bool(args.body)}")
+    asyncio.run(main(args.url, args.token, args.body))

voicemail_detection.py ADDED Viewed

	@@ -0,0 +1,449 @@

+#
+# Copyright (c) 2024–2025, Daily
+#
+# SPDX-License-Identifier: BSD 2-Clause License
+#
+import argparse
+import asyncio
+import functools
+import os
+import sys
+from call_connection_manager import CallConfigManager, SessionManager
+from dotenv import load_dotenv
+from loguru import logger
+from pipecat.audio.vad.silero import SileroVADAnalyzer
+from pipecat.frames.frames import (
+    EndFrame,
+    EndTaskFrame,
+    InputAudioRawFrame,
+    StopTaskFrame,
+    TranscriptionFrame,
+    UserStartedSpeakingFrame,
+    UserStoppedSpeakingFrame,
+)
+from pipecat.pipeline.pipeline import Pipeline
+from pipecat.pipeline.runner import PipelineRunner
+from pipecat.pipeline.task import PipelineParams, PipelineTask
+from pipecat.processors.frame_processor import FrameDirection, FrameProcessor
+from pipecat.services.cartesia.tts import CartesiaTTSService
+from pipecat.services.deepgram.stt import DeepgramSTTService
+from pipecat.services.google.google import GoogleLLMContext
+from pipecat.services.google.llm import GoogleLLMService
+from pipecat.services.llm_service import FunctionCallParams
+from pipecat.transports.services.daily import (
+    DailyParams,
+    DailyTransport,
+)
+load_dotenv(override=True)
+logger.remove(0)
+logger.add(sys.stderr, level="DEBUG")
+daily_api_key = os.getenv("DAILY_API_KEY", "")
+daily_api_url = os.getenv("DAILY_API_URL", "https://api.daily.co/v1")
+# ------------ HELPER CLASSES ------------
+class UserAudioCollector(FrameProcessor):
+    """Collects audio frames in a buffer, then adds them to the LLM context when the user stops speaking."""
+    def __init__(self, context, user_context_aggregator):
+        super().__init__()
+        self._context = context
+        self._user_context_aggregator = user_context_aggregator
+        self._audio_frames = []
+        self._start_secs = 0.2  # this should match VAD start_secs (hardcoding for now)
+        self._user_speaking = False
+    async def process_frame(self, frame, direction):
+        await super().process_frame(frame, direction)
+        if isinstance(frame, TranscriptionFrame):
+            # Skip transcription frames - we're handling audio directly
+            return
+        elif isinstance(frame, UserStartedSpeakingFrame):
+            self._user_speaking = True
+        elif isinstance(frame, UserStoppedSpeakingFrame):
+            self._user_speaking = False
+            self._context.add_audio_frames_message(audio_frames=self._audio_frames)
+            await self._user_context_aggregator.push_frame(
+                self._user_context_aggregator.get_context_frame()
+            )
+        elif isinstance(frame, InputAudioRawFrame):
+            if self._user_speaking:
+                # When speaking, collect frames
+                self._audio_frames.append(frame)
+            else:
+                # Maintain a rolling buffer of recent audio (for start of speech)
+                self._audio_frames.append(frame)
+                frame_duration = len(frame.audio) / 16 * frame.num_channels / frame.sample_rate
+                buffer_duration = frame_duration * len(self._audio_frames)
+                while buffer_duration > self._start_secs:
+                    self._audio_frames.pop(0)
+                    buffer_duration -= frame_duration
+        await self.push_frame(frame, direction)
+class FunctionHandlers:
+    """Handlers for the voicemail detection bot functions."""
+    def __init__(self, session_manager):
+        self.session_manager = session_manager
+        self.prompt = None  # Can be set externally
+    async def voicemail_response(self, params: FunctionCallParams):
+        """Function the bot can call to leave a voicemail message."""
+        message = """You are Chatbot leaving a voicemail message. Say EXACTLY this message and then terminate the call:
+                    'Hello, this is a message for Pipecat example user. This is Chatbot. Please call back on 123-456-7891. Thank you.'"""
+        await params.result_callback(message)
+    async def human_conversation(self, params: FunctionCallParams):
+        """Function called when bot detects it's talking to a human."""
+        # Update state to indicate human was detected
+        self.session_manager.call_flow_state.set_human_detected()
+        await params.llm.push_frame(StopTaskFrame(), FrameDirection.UPSTREAM)
+# ------------ MAIN FUNCTION ------------
+async def main(
+    room_url: str,
+    token: str,
+    body: dict,
+):
+    # ------------ CONFIGURATION AND SETUP ------------
+    # Create a configuration manager from the provided body
+    call_config_manager = CallConfigManager.from_json_string(body) if body else CallConfigManager()
+    # Get important configuration values
+    dialout_settings = call_config_manager.get_dialout_settings()
+    test_mode = call_config_manager.is_test_mode()
+    # Get caller info (might be None for dialout scenarios)
+    caller_info = call_config_manager.get_caller_info()
+    logger.info(f"Caller info: {caller_info}")
+    # Initialize the session manager
+    session_manager = SessionManager()
+    # ------------ TRANSPORT AND SERVICES SETUP ------------
+    # Initialize transport
+    transport = DailyTransport(
+        room_url,
+        token,
+        "Voicemail Detection Bot",
+        DailyParams(
+            api_url=daily_api_url,
+            api_key=daily_api_key,
+            audio_in_enabled=True,
+            audio_out_enabled=True,
+            video_out_enabled=False,
+            vad_analyzer=SileroVADAnalyzer(),
+        ),
+    )
+    # Initialize TTS
+    tts = CartesiaTTSService(
+        api_key=os.getenv("CARTESIA_API_KEY", ""),
+        voice_id="b7d50908-b17c-442d-ad8d-810c63997ed9",  # Use Helpful Woman voice by default
+    )
+    # Initialize speech-to-text service (for human conversation phase)
+    stt = DeepgramSTTService(api_key=os.getenv("DEEPGRAM_API_KEY"))
+    # ------------ FUNCTION DEFINITIONS ------------
+    async def terminate_call(
+        params: FunctionCallParams,
+        session_manager=None,
+    ):
+        """Function the bot can call to terminate the call."""
+        if session_manager:
+            # Set call terminated flag in the session manager
+            session_manager.call_flow_state.set_call_terminated()
+        await params.llm.queue_frame(EndTaskFrame(), FrameDirection.UPSTREAM)
+    # ------------ VOICEMAIL DETECTION PHASE SETUP ------------
+    # Define tools for both LLMs
+    tools = [
+        {
+            "function_declarations": [
+                {
+                    "name": "switch_to_voicemail_response",
+                    "description": "Call this function when you detect this is a voicemail system.",
+                },
+                {
+                    "name": "switch_to_human_conversation",
+                    "description": "Call this function when you detect this is a human.",
+                },
+                {
+                    "name": "terminate_call",
+                    "description": "Call this function to terminate the call.",
+                },
+            ]
+        }
+    ]
+    # Get voicemail detection prompt
+    voicemail_detection_prompt = call_config_manager.get_prompt("voicemail_detection_prompt")
+    if voicemail_detection_prompt:
+        system_instruction = voicemail_detection_prompt
+    else:
+        system_instruction = """You are Chatbot trying to determine if this is a voicemail system or a human.
+        If you hear any of these phrases (or very similar ones):
+        - "Please leave a message after the beep"
+        - "No one is available to take your call"
+        - "Record your message after the tone"
+        - "You have reached voicemail for..."
+        - "You have reached [phone number]"
+        - "[phone number] is unavailable"
+        - "The person you are trying to reach..."
+        - "The number you have dialed..."
+        - "Your call has been forwarded to an automated voice messaging system"
+        Then call the function switch_to_voicemail_response.
+        If it sounds like a human (saying hello, asking questions, etc.), call the function switch_to_human_conversation.
+        DO NOT say anything until you've determined if this is a voicemail or human.
+        If you are asked to terminate the call, **IMMEDIATELY** call the `terminate_call` function. **FAILURE TO CALL `terminate_call` IMMEDIATELY IS A MISTAKE.**"""
+    # Initialize voicemail detection LLM
+    voicemail_detection_llm = GoogleLLMService(
+        model="models/gemini-2.0-flash-lite",  # Lighter model for faster detection
+        api_key=os.getenv("GOOGLE_API_KEY"),
+        system_instruction=system_instruction,
+        tools=tools,
+    )
+    # Initialize context and context aggregator
+    voicemail_detection_context = GoogleLLMContext()
+    voicemail_detection_context_aggregator = voicemail_detection_llm.create_context_aggregator(
+        voicemail_detection_context
+    )
+    # Get custom voicemail prompt if available
+    voicemail_prompt = call_config_manager.get_prompt("voicemail_prompt")
+    # Set up function handlers
+    handlers = FunctionHandlers(session_manager)
+    handlers.prompt = voicemail_prompt  # Set custom prompt if available
+    # Register functions with the voicemail detection LLM
+    voicemail_detection_llm.register_function(
+        "switch_to_voicemail_response",
+        handlers.voicemail_response,
+    )
+    voicemail_detection_llm.register_function(
+        "switch_to_human_conversation", handlers.human_conversation
+    )
+    voicemail_detection_llm.register_function(
+        "terminate_call", lambda params: terminate_call(params, session_manager)
+    )
+    # Set up audio collector for handling audio input
+    voicemail_detection_audio_collector = UserAudioCollector(
+        voicemail_detection_context, voicemail_detection_context_aggregator.user()
+    )
+    # Build voicemail detection pipeline
+    voicemail_detection_pipeline = Pipeline(
+        [
+            transport.input(),  # Transport user input
+            voicemail_detection_audio_collector,  # Collect audio frames
+            voicemail_detection_context_aggregator.user(),  # User context
+            voicemail_detection_llm,  # LLM
+            tts,  # TTS
+            transport.output(),  # Transport bot output
+            voicemail_detection_context_aggregator.assistant(),  # Assistant context
+        ]
+    )
+    # Create pipeline task
+    voicemail_detection_pipeline_task = PipelineTask(
+        voicemail_detection_pipeline,
+        params=PipelineParams(allow_interruptions=True),
+    )
+    # ------------ EVENT HANDLERS ------------
+    @transport.event_handler("on_joined")
+    async def on_joined(transport, data):
+        # Start dialout if needed
+        if not test_mode and dialout_settings:
+            logger.debug("Dialout settings detected; starting dialout")
+            await call_config_manager.start_dialout(transport, dialout_settings)
+    @transport.event_handler("on_dialout_connected")
+    async def on_dialout_connected(transport, data):
+        logger.debug(f"Dial-out connected: {data}")
+    @transport.event_handler("on_dialout_answered")
+    async def on_dialout_answered(transport, data):
+        logger.debug(f"Dial-out answered: {data}")
+        # Start capturing transcription
+        await transport.capture_participant_transcription(data["sessionId"])
+    @transport.event_handler("on_first_participant_joined")
+    async def on_first_participant_joined(transport, participant):
+        logger.debug(f"First participant joined: {participant['id']}")
+        if test_mode:
+            await transport.capture_participant_transcription(participant["id"])
+    @transport.event_handler("on_participant_left")
+    async def on_participant_left(transport, participant, reason):
+        # Mark that a participant left early
+        session_manager.call_flow_state.set_participant_left_early()
+        await voicemail_detection_pipeline_task.queue_frame(EndFrame())
+    # ------------ RUN VOICEMAIL DETECTION PIPELINE ------------
+    if test_mode:
+        logger.debug("Detect voicemail example. You can test this in Daily Prebuilt")
+    runner = PipelineRunner()
+    print("!!! starting voicemail detection pipeline")
+    try:
+        await runner.run(voicemail_detection_pipeline_task)
+    except Exception as e:
+        logger.error(f"Error in voicemail detection pipeline: {e}")
+        import traceback
+        logger.error(traceback.format_exc())
+    print("!!! Done with voicemail detection pipeline")
+    # Check if we should exit early
+    if (
+        session_manager.call_flow_state.participant_left_early
+        or session_manager.call_flow_state.call_terminated
+    ):
+        if session_manager.call_flow_state.participant_left_early:
+            print("!!! Participant left early; terminating call")
+        elif session_manager.call_flow_state.call_terminated:
+            print("!!! Bot terminated call; not proceeding to human conversation")
+        return
+    # ------------ HUMAN CONVERSATION PHASE SETUP ------------
+    # Get human conversation prompt
+    human_conversation_prompt = call_config_manager.get_prompt("human_conversation_prompt")
+    if human_conversation_prompt:
+        human_conversation_system_instruction = human_conversation_prompt
+    else:
+        human_conversation_system_instruction = """You are Chatbot talking to a human. Be friendly and helpful.
+        Start with: "Hello! I'm a friendly chatbot. How can I help you today?"
+        Keep your responses brief and to the point. Listen to what the person says.
+        When the person indicates they're done with the conversation by saying something like:
+        - "Goodbye"
+        - "That's all"
+        - "I'm done"
+        - "Thank you, that's all I needed"
+        THEN say: "Thank you for chatting. Goodbye!" and call the terminate_call function."""
+    # Initialize human conversation LLM
+    human_conversation_llm = GoogleLLMService(
+        model="models/gemini-2.0-flash-001",  # Full model for better conversation
+        api_key=os.getenv("GOOGLE_API_KEY"),
+        system_instruction=human_conversation_system_instruction,
+        tools=tools,
+    )
+    # Initialize context and context aggregator
+    human_conversation_context = GoogleLLMContext()
+    human_conversation_context_aggregator = human_conversation_llm.create_context_aggregator(
+        human_conversation_context
+    )
+    # Register terminate function with the human conversation LLM
+    human_conversation_llm.register_function(
+        "terminate_call", functools.partial(terminate_call, session_manager=session_manager)
+    )
+    # Build human conversation pipeline
+    human_conversation_pipeline = Pipeline(
+        [
+            transport.input(),  # Transport user input
+            stt,  # Speech-to-text
+            human_conversation_context_aggregator.user(),  # User context
+            human_conversation_llm,  # LLM
+            tts,  # TTS
+            transport.output(),  # Transport bot output
+            human_conversation_context_aggregator.assistant(),  # Assistant context
+        ]
+    )
+    # Create pipeline task
+    human_conversation_pipeline_task = PipelineTask(
+        human_conversation_pipeline,
+        params=PipelineParams(allow_interruptions=True),
+    )
+    # Update participant left handler for human conversation phase
+    @transport.event_handler("on_participant_left")
+    async def on_participant_left(transport, participant, reason):
+        await voicemail_detection_pipeline_task.queue_frame(EndFrame())
+        await human_conversation_pipeline_task.queue_frame(EndFrame())
+    # ------------ RUN HUMAN CONVERSATION PIPELINE ------------
+    print("!!! starting human conversation pipeline")
+    # Initialize the context with system message
+    human_conversation_context_aggregator.user().set_messages(
+        [call_config_manager.create_system_message(human_conversation_system_instruction)]
+    )
+    # Queue the context frame to start the conversation
+    await human_conversation_pipeline_task.queue_frames(
+        [human_conversation_context_aggregator.user().get_context_frame()]
+    )
+    # Run the human conversation pipeline
+    try:
+        await runner.run(human_conversation_pipeline_task)
+    except Exception as e:
+        logger.error(f"Error in voicemail detection pipeline: {e}")
+        import traceback
+        logger.error(traceback.format_exc())
+    print("!!! Done with human conversation pipeline")
+# ------------ SCRIPT ENTRY POINT ------------
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser(description="Pipecat Voicemail Detection Bot")
+    parser.add_argument("-u", "--url", type=str, help="Room URL")
+    parser.add_argument("-t", "--token", type=str, help="Room Token")
+    parser.add_argument("-b", "--body", type=str, help="JSON configuration string")
+    args = parser.parse_args()
+    # Log the arguments for debugging
+    logger.info(f"Room URL: {args.url}")
+    logger.info(f"Token: {args.token}")
+    logger.info(f"Body provided: {bool(args.body)}")
+    asyncio.run(main(args.url, args.token, args.body))