Spaces:

Deadmon
/

pipecat

Runtime error

App Files Community

Deadmon committed on May 10

Commit

f336a0c

verified ·

1 Parent(s): 3e8fe6b

Update main.py

Browse files

Files changed (1) hide show

main.py +10 -18

main.py CHANGED Viewed

@@ -3,27 +3,24 @@ import os
 import sys
 import time
 import logging
 from pipecat.frames.frames import (
     TextFrame, UserStartedSpeakingFrame, UserStoppedSpeakingFrame,
-    TTSStartedFrame, BotStoppedSpeakingFrame
 )
 from pipecat.pipeline.pipeline import Pipeline
 from pipecat.pipeline.runner import PipelineRunner
 from pipecat.pipeline.task import PipelineParams
 from pipecat.processors.frame_processor import FrameProcessor, FrameDirection
-from pipecat.services.elevenlabs.tts import ElevenLabsTTSService  # updated import
-from pipecat.services.deepgram.stt import DeepgramSTTService      # updated import
 from pipecat.transports.services.daily import DailyParams, DailyTransport
-from pipecat.vad.silero import SileroVADAnalyzer
 from azure_openai import AzureOpenAILLMService
 from elevenlabs import ElevenLabs
-# Configure logging
 logging.basicConfig(level=logging.INFO, format="%(asctime)s - %(name)s - %(levelname)s - %(message)s")
 logger = logging.getLogger(__name__)
-# Configuration constants
 SILENCE_TIMEOUT_SECONDS = float(os.environ.get("SILENCE_TIMEOUT_SECONDS", 10))
 MAX_SILENCE_PROMPTS = int(os.environ.get("MAX_SILENCE_PROMPTS", 3))
 SILENCE_PROMPT_TEXT = "Are you still there?"
@@ -62,12 +59,12 @@ class SilenceAndCallLogicProcessor(FrameProcessor):
         self.last_activity_ts = time.time()
         self.silence_prompts_count = 0
-    async def process_frame(self, frame, direction: FrameDirection):
         if isinstance(frame, (UserStartedSpeakingFrame, TextFrame)) and direction == FrameDirection.UPSTREAM:
             self._reset_activity_timer()
         if isinstance(frame, TTSStartedFrame) and direction == FrameDirection.DOWNSTREAM:
             self._bot_is_speaking = True
-        elif isinstance(frame, BotStoppedSpeakingFrame) and direction == FrameDirection.DOWNSTREAM:
             self._bot_is_speaking = False
             self.last_activity_ts = time.time()
         await self.push_frame(frame, direction)
@@ -153,10 +150,12 @@ class PhoneChatbotApp:
             return False
     async def run(self):
-        required_keys = ["deepgram", "elevenlabs", "dailyco", "azure_openai"]
         missing_keys = [key for key in required_keys if not os.environ.get(key)]
         if missing_keys:
-            logger.error(f"Missing Hugging Face Secrets: {', '.join(missing_keys)}")
             sys.exit(1)
         voice_id = os.environ.get("ELEVENLABS_VOICE_ID", "cgSgspJ2msm6clMCkdW9")
@@ -203,10 +202,3 @@ class PhoneChatbotApp:
                 await self.pipeline.stop_when_done()
             if self.silence_processor:
                 await self.silence_processor.stop()
-async def main():
-    app = PhoneChatbotApp()
-    await app.run()
-if __name__ == "__main__":
-    asyncio.run(main())

 import sys
 import time
 import logging
 from pipecat.frames.frames import (
     TextFrame, UserStartedSpeakingFrame, UserStoppedSpeakingFrame,
+    TTSStartedFrame, TTSEndFrame
 )
 from pipecat.pipeline.pipeline import Pipeline
 from pipecat.pipeline.runner import PipelineRunner
 from pipecat.pipeline.task import PipelineParams
 from pipecat.processors.frame_processor import FrameProcessor, FrameDirection
+from pipecat.services.elevenlabs.tts import ElevenLabsTTSService
+from pipecat.services.deepgram.stt import DeepgramSTTService
 from pipecat.transports.services.daily import DailyParams, DailyTransport
+from pipecat.audio.vad.silero import SileroVADAnalyzer
 from azure_openai import AzureOpenAILLMService
 from elevenlabs import ElevenLabs
 logging.basicConfig(level=logging.INFO, format="%(asctime)s - %(name)s - %(levelname)s - %(message)s")
 logger = logging.getLogger(__name__)
 SILENCE_TIMEOUT_SECONDS = float(os.environ.get("SILENCE_TIMEOUT_SECONDS", 10))
 MAX_SILENCE_PROMPTS = int(os.environ.get("MAX_SILENCE_PROMPTS", 3))
 SILENCE_PROMPT_TEXT = "Are you still there?"
         self.last_activity_ts = time.time()
         self.silence_prompts_count = 0
+    async def process_frame(self, frame, direction):
         if isinstance(frame, (UserStartedSpeakingFrame, TextFrame)) and direction == FrameDirection.UPSTREAM:
             self._reset_activity_timer()
         if isinstance(frame, TTSStartedFrame) and direction == FrameDirection.DOWNSTREAM:
             self._bot_is_speaking = True
+        elif isinstance(frame, TTSEndFrame) and direction == FrameDirection.DOWNSTREAM:
             self._bot_is_speaking = False
             self.last_activity_ts = time.time()
         await self.push_frame(frame, direction)
             return False
     async def run(self):
+        required_keys = [
+            "deepgram", "elevenlabs", "dailyco", "azure_openai"
+        ]
         missing_keys = [key for key in required_keys if not os.environ.get(key)]
         if missing_keys:
+            logger.error(f"Missing environment variables: {', '.join(missing_keys)}")
             sys.exit(1)
         voice_id = os.environ.get("ELEVENLABS_VOICE_ID", "cgSgspJ2msm6clMCkdW9")
                 await self.pipeline.stop_when_done()
             if self.silence_processor:
                 await self.silence_processor.stop()