Spaces:

Yakova
/

Embedding

Running

App Files Files Community

Mbonea committed on Sep 27, 2024

Commit

00a1436

1 Parent(s): 412a100

pi test

Browse files

Files changed (5) hide show

App/TTS/TTSRoutes.py +1 -2
App/TTS/utils/Pi copy.py +193 -0
App/TTS/utils/Pi.py +501 -171
App/app.py +3 -1
Dockerfile +2 -2

App/TTS/TTSRoutes.py CHANGED Viewed

@@ -13,7 +13,7 @@ from .Schemas import (
 )
 from .utils.Podcastle import PodcastleAPI
 from .utils.HeyGen import HeygenAPI
-from .utils.Pi import PiAIClient
 from .utils.Descript import DescriptTTS
 import os
 import asyncio
@@ -34,7 +34,6 @@ data = {
 descript_tts = DescriptTTS()
 heyGentts = HeygenAPI(**data)
-pi = PiAIClient()
 @tts_router.post("/generate_tts")

 )
 from .utils.Podcastle import PodcastleAPI
 from .utils.HeyGen import HeygenAPI
+from App.app import pi
 from .utils.Descript import DescriptTTS
 import os
 import asyncio
 descript_tts = DescriptTTS()
 heyGentts = HeygenAPI(**data)
 @tts_router.post("/generate_tts")

App/TTS/utils/Pi copy.py ADDED Viewed

	@@ -0,0 +1,193 @@

+import aiohttp
+import asyncio
+import enum
+import requests
+import os
+from functools import cache
+import tempfile
+import uuid
+class VoiceType(enum.Enum):
+    voice1 = "voice1"
+    voice2 = "voice2"
+    voice3 = "voice3"
+    voice4 = "voice4"
+    voice5 = "voice5"
+    voice5_update = "voice5-update"
+    voice6 = "voice6"
+    voice7 = "voice7"
+    voice8 = "voice8"
+    voice9 = "voice9"
+    voice10 = "voice10"
+    voice11 = "voice11"
+    voice12 = "voice12"
+    qdpi = "qdpi"
+class PiAIClient:
+    def __init__(self):
+        self.dir = "/tmp/Audio"
+        self.base_url = "https://pi.ai/api/chat"
+        self.referer = "https://pi.ai/talk"
+        self.origin = "https://pi.ai"
+        self.user_agent = (
+            "Mozilla/5.0 (X11; Linux x86_64; rv:109.0) Gecko/20100101 Firefox/113.0"
+        )
+        self.cookie = None
+        self.headers = {
+            "User-Agent": self.user_agent,
+            "Accept": "text/event-stream",
+            "Referer": self.referer,
+            "X-Api-Version": "3",
+            "Content-Type": "application/json",
+            "Origin": self.origin,
+            "Connection": "keep-alive",
+            "Sec-Fetch-Dest": "empty",
+            "Sec-Fetch-Mode": "no-cors",
+            "Sec-Fetch-Site": "same-origin",
+            "DNT": "1",
+            "Sec-GPC": "1",
+            "TE": "trailers",
+            "Cookie": "__cf_bm=XagWXCS3SJekiP5O.A8K9wgtGuEieLNW7AFXj10hzqk-1717865973-1.0.1.1-4Xp_xUVYB5G.Zkpfgcm30PCVGnj3g6URzZsfCS28BQIdt8dZm76rnNbQiX9vNG_OsYdbUiDiX2pa.E3ajhcOXA; path=/; expires=Sat, 08-Jun-24 17:29:33 GMT; domain=.pi.ai; HttpOnly; Secure; SameSite=None",
+            "Pragma": "no-cache",
+            "Cache-Control": "no-cache",
+        }
+    async def get_cookie(self) -> str:
+        headers = self.headers.copy()
+        async with aiohttp.ClientSession() as session:
+            async with session.post(
+                f"{self.base_url}/start", headers=headers, json={}
+            ) as response:
+                self.cookie = response.headers["Set-Cookie"]
+                return self.cookie
+    async def make_request(
+        self, endpoint: str, headers: dict, json: dict = None, method: str = "POST"
+    ):
+        async with aiohttp.ClientSession() as session:
+            if method == "POST":
+                async with session.post(
+                    endpoint, headers=headers, json=json
+                ) as response:
+                    return await response.text()
+            elif method == "GET":
+                async with session.get(endpoint, headers=headers) as response:
+                    return response
+    async def get_response(self, input_text) -> tuple[list[str], list[str]]:
+        if self.cookie is None:
+            self.cookie = await self.get_cookie()
+        headers = self.headers.copy()
+        headers["Cookie"] = self.cookie
+        data = {"text": input_text}
+        response_text = await self.make_request(self.base_url, headers, json=data)
+        response_lines = response_text.split("\n")
+        response_texts = []
+        response_sids = []
+        print(response_lines)
+        for line in response_lines:
+            if line.startswith('data: {"text":"'):
+                start = len('data: {"text":')
+                end = line.rindex("}")
+                text_dict = line[start + 1 : end - 1].strip()
+                response_texts.append(text_dict)
+            elif line.startswith('data: {"sid":'):
+                start = len('data: {"sid":')
+                end = line.rindex("}")
+                sid_dict = line[start : end - 1].strip()
+                sid_dict = sid_dict.split(",")[0][1:-1]
+                response_sids.append(sid_dict)
+        return response_texts, response_sids
+    async def speak_response(
+        self, message_sid: str, voice: VoiceType = VoiceType.voice4.value
+    ) -> None:
+        if self.cookie is None:
+            self.cookie = await self.get_cookie()
+        headers = self.headers.copy()
+        headers.update(
+            {
+                "Host": "pi.ai",
+                "Accept": "audio/webm,audio/ogg,audio/wav,audio/*;q=0.9,application/ogg;q=0.7,video/*;q=0.6,*/*;q=0.5",
+                "Accept-Language": "en-US,en;q=0.9",
+                "Range": "bytes=0-",
+                "Sec-Fetch-Dest": "audio",
+                "Sec-Fetch-Mode": "no-cors",
+                "Sec-Fetch-Site": "same-origin",
+                "Sec-CH-UA": '"Chromium";v="124", "Google Chrome";v="124", "Not-A.Brand";v="99"',
+                "Sec-CH-UA-Mobile": "?0",
+                "Sec-CH-UA-Platform": '"Windows"',
+            }
+        )
+        headers = {
+            "User-Agent": "Mozilla/5.0 (X11; Linux x86_64; rv:109.0) Gecko/20100101 Firefox/113.0",
+            "Accept": "audio/webm,audio/ogg,audio/wav,audio/*;q=0.9,application/ogg;q=0.7,video/*;q=0.6,*/*;q=0.5",
+            "Accept-Language": "en-US,en;q=0.5",
+            "Range": "bytes=0-",
+            "Connection": "keep-alive",
+            "Referer": "https://pi.ai/talk",
+            # "Cookie": cookie,
+            "Sec-Fetch-Dest": "audio",
+            "Sec-Fetch-Mode": "no-cors",
+            "Sec-Fetch-Site": "same-origin",
+            "DNT": "1",
+            "Sec-GPC": "1",
+            "Accept-Encoding": "identity",
+            "TE": "trailers",
+        }
+        headers["Cookie"] = self.cookie
+        print(headers)
+        endpoint = (
+            f"{self.base_url}/voice?mode=eager&voice={voice}&messageSid={message_sid}"
+        )
+        async with aiohttp.ClientSession() as session:
+            async with session.get(endpoint, headers=headers) as response:
+                print(response.status)
+                file_name = str(uuid.uuid4()) + ".mp3"
+                file_path = os.path.join(self.dir, file_name)
+                os.makedirs(self.dir, exist_ok=True)
+                if response.status == 200:
+                    with open(file_path, "wb") as file:
+                        async for chunk in response.content.iter_chunked(128):
+                            file.write(chunk)
+                    return {
+                        "url": f"https://yakova-embedding.hf.space/audio/{file_name}"
+                    }
+                    # Run command vlc to play the audio file
+                    # os.system("vlc speak.wav --intf dummy --play-and-exit")
+                else:
+                    temp = await response.text()
+                    print(temp)
+                    self.cookie = None
+                    return "Error: Unable to retrieve audio."
+    async def say(self, text, voice=VoiceType.qdpi.value):
+        _, response_sids = await self.get_response(text)
+        if response_sids:
+            return await self.speak_response(response_sids[0], voice=voice)
+# async def main():
+#     client = PiAIClient()
+#     response_texts, response_sids = await client.get_response(
+#         "Write a ryme to introduce yourself."
+#     )
+#     print(response_texts, response_sids)
+#     import time
+#     if response_sids:
+#         return await client.speak_response(response_sids[1])
+# # Run the main function
+# if __name__ == "__main__":
+#     asyncio.run(main())

App/TTS/utils/Pi.py CHANGED Viewed

@@ -1,193 +1,523 @@
-import aiohttp
 import asyncio
-import enum
-import requests
 import os
-from functools import cache
-import tempfile
-import uuid
 class VoiceType(enum.Enum):
-    voice1 = "voice1"
-    voice2 = "voice2"
-    voice3 = "voice3"
-    voice4 = "voice4"
-    voice5 = "voice5"
-    voice5_update = "voice5-update"
-    voice6 = "voice6"
-    voice7 = "voice7"
-    voice8 = "voice8"
-    voice9 = "voice9"
-    voice10 = "voice10"
-    voice11 = "voice11"
-    voice12 = "voice12"
-    qdpi = "qdpi"
 class PiAIClient:
-    def __init__(self):
-        self.dir = "/tmp/Audio"
-        self.base_url = "https://pi.ai/api/chat"
-        self.referer = "https://pi.ai/talk"
-        self.origin = "https://pi.ai"
-        self.user_agent = (
-            "Mozilla/5.0 (X11; Linux x86_64; rv:109.0) Gecko/20100101 Firefox/113.0"
-        )
-        self.cookie = None
-        self.headers = {
-            "User-Agent": self.user_agent,
-            "Accept": "text/event-stream",
-            "Referer": self.referer,
-            "X-Api-Version": "3",
-            "Content-Type": "application/json",
-            "Origin": self.origin,
-            "Connection": "keep-alive",
-            "Sec-Fetch-Dest": "empty",
-            "Sec-Fetch-Mode": "no-cors",
-            "Sec-Fetch-Site": "same-origin",
-            "DNT": "1",
-            "Sec-GPC": "1",
-            "TE": "trailers",
-            "Cookie": "__cf_bm=XagWXCS3SJekiP5O.A8K9wgtGuEieLNW7AFXj10hzqk-1717865973-1.0.1.1-4Xp_xUVYB5G.Zkpfgcm30PCVGnj3g6URzZsfCS28BQIdt8dZm76rnNbQiX9vNG_OsYdbUiDiX2pa.E3ajhcOXA; path=/; expires=Sat, 08-Jun-24 17:29:33 GMT; domain=.pi.ai; HttpOnly; Secure; SameSite=None",
-            "Pragma": "no-cache",
-            "Cache-Control": "no-cache",
-        }
-    async def get_cookie(self) -> str:
-        headers = self.headers.copy()
-        async with aiohttp.ClientSession() as session:
-            async with session.post(
-                f"{self.base_url}/start", headers=headers, json={}
-            ) as response:
-                self.cookie = response.headers["Set-Cookie"]
-                return self.cookie
-    async def make_request(
-        self, endpoint: str, headers: dict, json: dict = None, method: str = "POST"
-    ):
-        async with aiohttp.ClientSession() as session:
-            if method == "POST":
-                async with session.post(
-                    endpoint, headers=headers, json=json
-                ) as response:
-                    return await response.text()
-            elif method == "GET":
-                async with session.get(endpoint, headers=headers) as response:
-                    return response
-    async def get_response(self, input_text) -> tuple[list[str], list[str]]:
-        if self.cookie is None:
-            self.cookie = await self.get_cookie()
-        headers = self.headers.copy()
-        headers["Cookie"] = self.cookie
-        data = {"text": input_text}
-        response_text = await self.make_request(self.base_url, headers, json=data)
-        response_lines = response_text.split("\n")
-        response_texts = []
-        response_sids = []
-        print(response_lines)
-        for line in response_lines:
-            if line.startswith('data: {"text":"'):
-                start = len('data: {"text":')
-                end = line.rindex("}")
-                text_dict = line[start + 1 : end - 1].strip()
-                response_texts.append(text_dict)
-            elif line.startswith('data: {"sid":'):
-                start = len('data: {"sid":')
-                end = line.rindex("}")
-                sid_dict = line[start : end - 1].strip()
-                sid_dict = sid_dict.split(",")[0][1:-1]
-                response_sids.append(sid_dict)
-        return response_texts, response_sids
-    async def speak_response(
-        self, message_sid: str, voice: VoiceType = VoiceType.voice4.value
-    ) -> None:
-        if self.cookie is None:
-            self.cookie = await self.get_cookie()
-        headers = self.headers.copy()
-        headers.update(
             {
-                "Host": "pi.ai",
-                "Accept": "audio/webm,audio/ogg,audio/wav,audio/*;q=0.9,application/ogg;q=0.7,video/*;q=0.6,*/*;q=0.5",
-                "Accept-Language": "en-US,en;q=0.9",
-                "Range": "bytes=0-",
-                "Sec-Fetch-Dest": "audio",
-                "Sec-Fetch-Mode": "no-cors",
-                "Sec-Fetch-Site": "same-origin",
-                "Sec-CH-UA": '"Chromium";v="124", "Google Chrome";v="124", "Not-A.Brand";v="99"',
-                "Sec-CH-UA-Mobile": "?0",
-                "Sec-CH-UA-Platform": '"Windows"',
-            }
-        )
-        headers = {
-            "User-Agent": "Mozilla/5.0 (X11; Linux x86_64; rv:109.0) Gecko/20100101 Firefox/113.0",
-            "Accept": "audio/webm,audio/ogg,audio/wav,audio/*;q=0.9,application/ogg;q=0.7,video/*;q=0.6,*/*;q=0.5",
-            "Accept-Language": "en-US,en;q=0.5",
-            "Range": "bytes=0-",
-            "Connection": "keep-alive",
-            "Referer": "https://pi.ai/talk",
-            # "Cookie": cookie,
-            "Sec-Fetch-Dest": "audio",
-            "Sec-Fetch-Mode": "no-cors",
-            "Sec-Fetch-Site": "same-origin",
-            "DNT": "1",
-            "Sec-GPC": "1",
-            "Accept-Encoding": "identity",
-            "TE": "trailers",
-        }
-        headers["Cookie"] = self.cookie
-        print(headers)
-        endpoint = (
-            f"{self.base_url}/voice?mode=eager&voice={voice}&messageSid={message_sid}"
         )
-        async with aiohttp.ClientSession() as session:
-            async with session.get(endpoint, headers=headers) as response:
-                print(response.status)
-                file_name = str(uuid.uuid4()) + ".mp3"
-                file_path = os.path.join(self.dir, file_name)
-                os.makedirs(self.dir, exist_ok=True)
-                if response.status == 200:
-                    with open(file_path, "wb") as file:
-                        async for chunk in response.content.iter_chunked(128):
-                            file.write(chunk)
-                    return {
-                        "url": f"https://yakova-embedding.hf.space/audio/{file_name}"
-                    }
-                    # Run command vlc to play the audio file
-                    # os.system("vlc speak.wav --intf dummy --play-and-exit")
                 else:
-                    temp = await response.text()
-                    print(temp)
-                    self.cookie = None
-                    return "Error: Unable to retrieve audio."
-    async def say(self, text, voice=VoiceType.qdpi.value):
-        _, response_sids = await self.get_response(text)
-        if response_sids:
-            return await self.speak_response(response_sids[0], voice=voice)
 # async def main():
-#     client = PiAIClient()
-#     response_texts, response_sids = await client.get_response(
-#         "Write a ryme to introduce yourself."
-#     )
-#     print(response_texts, response_sids)
-#     import time
-#     if response_sids:
-#         return await client.speak_response(response_sids[1])
-# # Run the main function
 # if __name__ == "__main__":
 #     asyncio.run(main())

 import asyncio
 import os
+from playwright.async_api import async_playwright, Page, Request, Response, Download
+import re
+import logging
+from urllib.parse import urlparse
+from datetime import datetime, timedelta
+import enum
+# Configure logging
+logging.basicConfig(
+    level=logging.INFO,
+    format="%(asctime)s [%(levelname)s] %(message)s",
+    handlers=[logging.StreamHandler()],
+)
+logger = logging.getLogger(__name__)
 class VoiceType(enum.Enum):
+    NEUTRAL = "voice1"
+    HAPPY = "voice2"
+    SAD = "voice3"
+    ANGRY = "voice4"
+    EXCITED = "voice5"
+    CALM = "voice6"
+    # Add more voices as supported by Pi.ai
 class PiAIClient:
+    def __init__(self, headless: bool = False, download_dir: str = "/tmp/Audio"):
+        self.headless = headless
+        self.download_dir = "/tmp/Audio"
+        self.playwright = None
+        self.browser = None
+        self.context = None
+        self.page = None
+        # Define actions with their selectors and corresponding handler methods
+        self.actions = [
             {
+                "selector": 'textarea[placeholder="Talk with Pi"]',
+                "handler": self.send_chat_message,
+                "description": "Chat input detected, sending message.",
+                "break_after": True,  # Indicates to break the loop after sending the message
+            },
+            {
+                "selector": 'button:has-text("I’ll do it later")',
+                "handler": self.click_element,
+                "description": "'I’ll do it later' button found, clicking it.",
+            },
+            {
+                "selector": 'button:has-text("Next")',
+                "handler": self.click_element,
+                "description": "'Next' button found, clicking it.",
+            },
+            {
+                "selector": 'textarea[placeholder="Your first name"]',
+                "handler": self.fill_name,
+                "description": "Name input detected, filling it.",
+            },
+        ]
+        # Regular expression to extract 'sid' values from the response
+        self.sid_regex = re.compile(r'"sid":"([\w\-]+)"')
+        # Set to keep track of processed sids to avoid duplicates
+        self.processed_sids = set()
+        # Directory to store downloaded audios
+        self.download_dir = download_dir
+        self.ensure_download_directory()
+        # Semaphore to limit concurrent downloads (optional)
+        self.semaphore = asyncio.Semaphore(5)  # Adjust the number as needed
+        # Rate limiting attributes
+        self.rate_limit_until = None  # Timestamp until which the bot should wait
+        self.rate_limit_lock = asyncio.Lock()  # To prevent race conditions
+        # Mapping from sid to (Future, VoiceType)
+        self.sid_futures = asyncio.Queue()
+    def ensure_download_directory(self):
+        """Ensure that the downloads directory exists."""
+        if not os.path.exists(self.download_dir):
+            os.makedirs(self.download_dir)
+            logger.info(
+                f"Created directory '{self.download_dir}' for storing downloads."
+            )
+        else:
+            logger.info(f"Directory '{self.download_dir}' already exists.")
+    async def setup(self):
+        """Initialize Playwright, launch the browser with a persistent context, and create a new page."""
+        self.playwright = await async_playwright().start()
+        # Specify the path for the user data directory
+        user_data_dir = os.path.join(os.getcwd(), "user_data")
+        if not os.path.exists(user_data_dir):
+            os.makedirs(user_data_dir)
+            logger.info(f"Created user data directory at '{user_data_dir}'.")
+        else:
+            logger.info(f"Using existing user data directory at '{user_data_dir}'.")
+        # Launch a persistent context
+        self.context = await self.playwright.chromium.launch_persistent_context(
+            user_agent=(
+                "Mozilla/5.0 (Windows NT 10.0; Win64; x64) "
+                "AppleWebKit/537.36 (KHTML, like Gecko) "
+                "Chrome/114.0.0.0 Safari/537.36"
+            ),
+            user_data_dir=user_data_dir,  # Persistent storage directory
+            headless=self.headless,
+            args=["--no-sandbox"],  # Optional: Add any Chromium args if needed
         )
+        # Create a new page within the persistent context
+        self.page = await self.context.new_page()
+        # Set up request and response interception
+        self.page.on("request", self.handle_request)
+        self.page.on("response", self.handle_response)
+        self.navigate("https://pi.ai/talk")
+        # Start the monitoring task
+        asyncio.create_task(self.monitor_page_and_act())
+    async def navigate(self, url: str):
+        """Navigate to the specified URL and wait for the page to load."""
+        await self.page.goto(url)
+        await self.page.wait_for_load_state("networkidle")
+        logger.info(f"Navigated to {url}")
+    async def monitor_page_and_act(self):
+        """Continuously monitor the page and perform actions based on the detected elements."""
+        counter = 0
+        while True:
+            try:
+                # Check for rate limiting before performing any actions
+                if self.is_rate_limited():
+                    wait_seconds = (
+                        self.rate_limit_until - datetime.utcnow()
+                    ).total_seconds()
+                    wait_seconds = max(wait_seconds, 0)
+                    logger.warning(
+                        f"Rate limited. Waiting for {wait_seconds:.2f} seconds before retrying."
+                    )
+                    await asyncio.sleep(wait_seconds)
+                    continue  # After waiting, re-enter the loop
+                action_performed = False
+                for action in self.actions:
+                    if await self.page.is_visible(action["selector"]):
+                        logger.info(action["description"])
+                        await action["handler"](action["selector"])
+                        action_performed = True
+                        if action.get("break_after"):
+                            action_performed = (
+                                False  # Continue monitoring after sending the message
+                            )
+                            break  # Exit the for-loop to allow handling other tasks
+                if not action_performed:
+                    logger.info(
+                        "No matching state detected. Navigating to /talk or /discover route."
+                    )
+                    if counter % 5 == 0:
+                        await self.navigate_to_route("/discover")
+                        logger.info("Navigated to /discover route.")
+                        counter = 0
+                    else:
+                        await self.navigate_to_route("/talk")
+                        logger.info("Navigated to /talk route.")
+                        counter += 1
+                # Wait for a short period before the next check
+                await asyncio.sleep(2)
+            except Exception as e:
+                logger.error(f"Error during monitoring: {e}")
+                await asyncio.sleep(
+                    2
+                )  # Prevent tight loop in case of continuous errors
+    def is_rate_limited(self):
+        """Check if the bot is currently rate-limited."""
+        if self.rate_limit_until and datetime.utcnow() < self.rate_limit_until:
+            return True
+        return False
+    async def navigate_to_route(self, route):
+        """Navigate to the specified route."""
+        try:
+            current_url = self.page.url
+            # Check if already on the specified route to prevent unnecessary navigation
+            if not current_url.endswith(route):
+                new_url = self.construct_route_url(current_url, route)
+                await self.navigate(new_url)
+            else:
+                logger.info(f"Already on the {route} route.")
+        except Exception as e:
+            logger.error(f"Error navigating to {route} route: {e}")
+    def construct_route_url(self, current_url, route):
+        """Construct the new URL for the specified route."""
+        # Modify this function to fit your URL structure
+        parsed_url = urlparse(current_url)
+        # Replace the path with the desired route
+        new_url = parsed_url._replace(path=route).geturl()
+        logger.info(f"Constructed new URL: {new_url}")
+        return new_url
+    async def click_element(self, selector: str):
+        """Wait for an element to be visible and click it."""
+        try:
+            await self.page.wait_for_selector(selector, timeout=3000)
+            await self.page.click(selector)
+            logger.info(f"Clicked element: {selector}")
+        except Exception as e:
+            logger.error(f"Error clicking element {selector}: {e}")
+    async def fill_name(self, selector: str):
+        """Fill in the name input field and submit."""
+        try:
+            name = "Cassandra"
+            await self.page.fill(selector, name)
+            await self.page.click('button[aria-label="Submit text"]')
+            logger.info(f"Name '{name}' submitted")
+        except Exception as e:
+            logger.error(f"Error submitting name: {e}")
+            await self.handle_send_failure()
+    async def send_chat_message(self, selector: str):
+        """Send a chat message in the chat input field."""
+        try:
+            await self.page.fill(selector, self.user_input)
+            await self.page.click('button[aria-label="Submit text"]')
+            logger.info("Chat message submitted")
+        except Exception as e:
+            logger.error(f"Could not send chat message: {e}")
+            await self.handle_send_failure()
+    async def handle_send_failure(self):
+        """Handle failure in sending messages by navigating to /talk or /discover."""
+        try:
+            # Attempt to navigate to /talk
+            await self.navigate_to_route("/talk")
+            logger.info("Navigated to /talk route after failing to send message.")
+        except Exception:
+            try:
+                # If navigating to /talk fails, navigate to /discover
+                await self.navigate_to_route("/discover")
+                logger.info(
+                    "Navigated to /discover route after failing to send message."
+                )
+            except Exception as e2:
+                logger.error(f"Failed to navigate after send_message failure: {e2}")
+    async def handle_request(self, request: Request):
+        """Handle and log network requests."""
+        # Log all requests at DEBUG level
+        logger.debug(f"Request: {request.method} {request.url}")
+    async def handle_response(self, response: Response):
+        """Handle and log network responses, extracting 'sid's."""
+        url = response.url
+        if "/api/chat" in url and response.request.method == "POST":
+            logger.info(f"Handling response for: {url}")
+            try:
+                response_status = response.status
+                response_text = await asyncio.wait_for(response.text(), timeout=5)
+                logger.info(f"Response received from {url}: {response_text}")
+                if response_status == 429:
+                    # Handle rate limiting based on status code
+                    logger.warning("Received 429 Too Many Requests.")
+                    retry_after = response.headers.get("Retry-After")
+                    if retry_after:
+                        wait_seconds = int(retry_after)
+                    else:
+                        wait_seconds = (
+                            60  # Default wait time if Retry-After not provided
+                        )
+                    await self.trigger_rate_limit(wait_seconds)
+                    return
+                # Attempt to parse the response as JSON
+                if "error" in response_text and "Too Many Requests" in response_text:
+                    logger.warning("Received error response: Too Many Requests.")
+                    await self.trigger_rate_limit(60)  # Default wait time
+                    return
+                # Extract 'sid's using regex
+                sids = self.sid_regex.findall(response_text)
+                if sids:
+                    logger.info(f"Extracted 'sid's: {sids}")
+                    for sid in sids:
+                        if sid not in self.processed_sids:
+                            self.processed_sids.add(sid)
+                            logger.info(f"Processing sid: {sid}")
+                            # If there are pending say requests, assign this sid to the first one
+                            if not self.sid_futures.empty():
+                                future, voice = await self.sid_futures.get()
+                                asyncio.create_task(
+                                    self.process_sid(sid, voice, future)
+                                )
+                            else:
+                                # No pending say requests, process with default voice or skip
+                                asyncio.create_task(
+                                    self.process_sid(sid, VoiceType.NEUTRAL.value, None)
+                                )
+                            break
                 else:
+                    logger.info("No 'sid's found in the response.")
+            except asyncio.TimeoutError:
+                logger.warning(
+                    "Timed out waiting for the response body (possibly streaming)."
+                )
+            except Exception as e:
+                logger.error(f"Error processing response: {e}")
+        elif "/api/chat/voice" in url:
+            # Handle audio responses directly if needed
+            pass  # Currently handled in process_sid
+    async def trigger_rate_limit(self, wait_seconds: int):
+        """Trigger rate limiting by setting the rate_limit_until timestamp."""
+        async with self.rate_limit_lock:
+            if (
+                not self.rate_limit_until
+                or datetime.utcnow() + timedelta(seconds=wait_seconds)
+                > self.rate_limit_until
+            ):
+                self.rate_limit_until = datetime.utcnow() + timedelta(
+                    seconds=wait_seconds
+                )
+                logger.warning(
+                    f"Rate limited. Will resume after {self.rate_limit_until} UTC."
+                )
+            else:
+                self.rate_limit_until += timedelta(seconds=wait_seconds)
+                logger.warning("Already rate limited. Extending the wait time.")
+    async def process_sid(self, sid: str, voice: str, future: asyncio.Future):
+        """Download the TTS audio using the sid and specified voice."""
+        async with self.semaphore:
+            try:
+                logger.info(f"Processing sid: {sid} with voice: {voice}")
+                url = f"https://pi.ai/api/chat/voice?mode=eager&voice={voice}&messageSid={sid}"
+                logger.info(f"Initiating download from URL: {url}")
+                # Open a new page (tab)
+                new_page = await self.context.new_page()
+                # Set up download handler
+                new_page.on("download", self.handle_download)
+                # Navigate to the URL
+                await new_page.goto(url)
+                logger.info(f"Opened URL: {url}")
+                # Create and click the anchor tag via JavaScript
+                await new_page.evaluate(
+                    f"""
+                    (function() {{
+                        var link = document.createElement('a');
+                        link.href = "{url}";
+                        link.download = "{sid}.mp3";
+                        document.body.appendChild(link);
+                        link.click();
+                        document.body.removeChild(link);
+                    }})();
+                    """
+                )
+                logger.info(f"Triggered download for sid: {sid}")
+                filename = f"{sid}_{voice.lower()}.mp3"
+                file_path = os.path.join(self.download_dir, filename)
+                # Start the download
+                # Wait for the download to start
+                await asyncio.sleep(2)
+                # Close the new page
+                await new_page.close()
+                # If a future was provided, set its result
+                if future:
+                    future.set_result(file_path)
+            except Exception as e:
+                logger.error(f"Error processing sid {sid}: {e}")
+                if future and not future.done():
+                    future.set_exception(e)
+    async def handle_download(self, download: Download):
+        """Handle the download event and save the file."""
+        try:
+            # Define the path to save the download
+            filename = download.suggested_filename or "audio.mp3"
+            download_path = os.path.join(self.download_dir, filename)
+            # Save the downloaded file
+            await download.save_as(download_path)
+            logger.info(f"Downloaded audio to {download_path}")
+        except Exception as e:
+            logger.error(f"Error downloading audio: {e}")
+    async def close(self):
+        """Close the browser and Playwright."""
+        if self.context:
+            await self.context.close()
+        if self.playwright:
+            await self.playwright.stop()
+        logger.info("Browser closed")
+    async def say(self, message: str, voice: str) -> str:
+        """
+        Send a message and retrieve the path to the downloaded TTS audio.
+        :param message: The message to send.
+        :param voice: The emotional voice type to use.
+        :return: The file path of the downloaded audio.
+        """
+        # Create a Future to wait for the audio download
+        future = asyncio.get_event_loop().create_future()
+        # Put the future and voice into the queue
+        await self.sid_futures.put((future, voice))
+        # Send the message
+        self.user_input = message
+        await self.send_message(message)
+        # Wait for the Future to be set with the audio path
+        try:
+            audio_path = await asyncio.wait_for(
+                future, timeout=60
+            )  # Adjust timeout as needed
+            return audio_path
+        except asyncio.TimeoutError:
+            logger.error("Timeout while waiting for audio download.")
+            return ""
+    async def send_message(
+        self, message: str, retry_count: int = 3, retry_delay: int = 60
+    ):
+        """
+        Send a message through the chat interface with retry logic.
+        :param message: The message to send.
+        :param retry_count: Number of times to retry on failure.
+        :param retry_delay: Seconds to wait before retrying.
+        """
+        attempt = 0
+        while attempt < retry_count:
+            try:
+                # Check if currently rate limited
+                if self.is_rate_limited():
+                    wait_seconds = (
+                        self.rate_limit_until - datetime.utcnow()
+                    ).total_seconds()
+                    wait_seconds = max(wait_seconds, 0)
+                    logger.warning(
+                        f"Currently rate limited. Waiting for {wait_seconds:.2f} seconds before retrying."
+                    )
+                    await asyncio.sleep(wait_seconds)
+                self.user_input = message  # Update the user_input attribute
+                await self.page.fill(
+                    'textarea[placeholder="Talk with Pi"]', self.user_input
+                )
+                await self.page.click('button[aria-label="Submit text"]')
+                logger.info("Chat message submitted")
+                return  # Success, exit the method
+            except Exception as e:
+                logger.error(f"Could not send chat message: {e}")
+                attempt += 1
+                if attempt < retry_count:
+                    logger.info(
+                        f"Retrying to send message in {retry_delay} seconds... (Attempt {attempt}/{retry_count})"
+                    )
+                    await asyncio.sleep(retry_delay)
+                else:
+                    logger.error(
+                        "Max retry attempts reached. Failed to send the message."
+                    )
+                    await self.handle_send_failure()
+        # If all retries fail, handle the failure
+        await self.handle_send_failure()
+import asyncio
 # async def main():
+#     # Initialize the PiBot
+#     bot = PiAIClient(headless=True)
+#     try:
+#         await bot.setup()
+#         # await bot.navigate("https://pi.ai/talk")
+#         # Example usage of the say method
+#         audio_path_neutral = await bot.say("Hello baby.", voice=VoiceType.NEUTRAL.value)
+#         print(f"Neutral Audio Path: {audio_path_neutral}")
+#         await asyncio.sleep(5)
+#         audio_path_happy = await bot.say(
+#             "I'm so happy to see you!", voice=VoiceType.HAPPY.value
+#         )
+#         print(f"Happy Audio Path: {audio_path_happy}")
+#         await asyncio.sleep(5)
+#         audio_path_sad = await bot.say(
+#             "I'm feeling a bit down today.", voice=VoiceType.SAD.value
+#         )
+#         print(f"Sad Audio Path: {audio_path_sad}")
+#         # You can add more messages with different emotions as needed
+#     finally:
+#         await bot.close()
 # if __name__ == "__main__":
 #     asyncio.run(main())

App/app.py CHANGED Viewed

@@ -4,7 +4,7 @@ from fastapi.middleware.gzip import GZipMiddleware
 from .TTS.TTSRoutes import tts_router
 from .Embedding.EmbeddingRoutes import embeddigs_router
 from fastapi.middleware.cors import CORSMiddleware
@@ -33,11 +33,13 @@ app.add_middleware(
     allow_headers=["*"],
 )
 app.add_middleware(GZipMiddleware, minimum_size=1000)
 @app.on_event("startup")
 async def startup():
     FastAPICache.init(InMemoryBackend())
 @app.get("/")

 from .TTS.TTSRoutes import tts_router
 from .Embedding.EmbeddingRoutes import embeddigs_router
+from .TTS.utils.Pi import PiAIClient
 from fastapi.middleware.cors import CORSMiddleware
     allow_headers=["*"],
 )
 app.add_middleware(GZipMiddleware, minimum_size=1000)
+pi = PiAIClient(headless=True)
 @app.on_event("startup")
 async def startup():
     FastAPICache.init(InMemoryBackend())
+    await pi.setup()
 @app.get("/")

Dockerfile CHANGED Viewed

@@ -28,7 +28,7 @@ RUN apt-get update && \
 #copy requirements
 COPY requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt
 # Copy the application code
@@ -37,6 +37,6 @@ USER admin
 COPY --chown=admin . /srv
 # Command to run the application
-CMD uvicorn App.app:app --host 0.0.0.0 --port 7860 --workers 1
 # Expose the server port
 EXPOSE 7860

 #copy requirements
 COPY requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt
+RUN playwright install-deps
 # Copy the application code
 COPY --chown=admin . /srv
 # Command to run the application
+CMD playwright install && uvicorn App.app:app --host 0.0.0.0 --port 7860 --workers 1
 # Expose the server port
 EXPOSE 7860