Spaces:

Yakova
/

Embedding

Running

App Files Files Community

Mbonea committed on Nov 10, 2023

Commit

c1e15bc

1 Parent(s): 8b7f508

minor changes

Browse files

Files changed (6) hide show

App/Embedding/EmbeddingRoutes.py +7 -2
App/Embedding/Schemas.py +4 -0
App/Embedding/utils/Initialize.py +4 -0
App/Embedding/utils/__init__.py +1 -4
App/TTS/utils/Picsart.py +33 -0
App/TTS/utils/Podcastle.py +22 -58

App/Embedding/EmbeddingRoutes.py CHANGED Viewed

@@ -1,7 +1,7 @@
 from fastapi import APIRouter, BackgroundTasks
-from .utils.Initialize import TextSearch, IdSearch
-from .Schemas import SearchRequest, AddDocumentRequest
 import redis, os, json
 REDIS = os.environ.get("REDIS")
@@ -17,6 +17,11 @@ async def create_embeddings(req: AddDocumentRequest):
     pass
 @embeddigs_router.post("/search_id")
 async def search_id(
     req: SearchRequest,

 from fastapi import APIRouter, BackgroundTasks
+from .utils.Initialize import TextSearch, IdSearch, LookUpIds
+from .Schemas import SearchRequest, AddDocumentRequest, TrendingRequest
 import redis, os, json
 REDIS = os.environ.get("REDIS")
     pass
+@embeddigs_router.get("/Trending")
+async def getTrending(req: TrendingRequest):
+    LookUpIds(req.imdb_ids)
 @embeddigs_router.post("/search_id")
 async def search_id(
     req: SearchRequest,

App/Embedding/Schemas.py CHANGED Viewed

@@ -10,5 +10,9 @@ class SearchRequest(BaseModel):
     query: str
 class GetTranscriptions(BaseModel):
     userId: int

     query: str
+class TrendingRequest(BaseModel):
+    imdb_ids: list[str]
 class GetTranscriptions(BaseModel):
     userId: int

App/Embedding/utils/Initialize.py CHANGED Viewed

@@ -71,6 +71,10 @@ def IdSearch(query: str, background_task: BackgroundTasks):
     return TextSearch(text, filter={"key": {"$ne": query}})
 def TextSearch(query: str, filter=None):
     docs = docsearch.similarity_search(query, k=10, filter=filter)
     keys = [doc.metadata["key"] for doc in docs]

     return TextSearch(text, filter={"key": {"$ne": query}})
+def LookUpIds(imdb_ids: list[str]):
+    return FetchDocuments(imdb_ids)
 def TextSearch(query: str, filter=None):
     docs = docsearch.similarity_search(query, k=10, filter=filter)
     keys = [doc.metadata["key"] for doc in docs]

App/Embedding/utils/__init__.py CHANGED Viewed

@@ -1,10 +1,7 @@
 from elasticsearch import Elasticsearch
 import os
-elastic_host = os.environ.get(
-    "ELASTIC_HOST",
-    "https://u46hxt12c:[email protected]:443",
-)
 # initialize elasticSearch
 es = Elasticsearch([elastic_host])

 from elasticsearch import Elasticsearch
 import os
+elastic_host = os.environ.get("ELASTIC_HOST")
 # initialize elasticSearch
 es = Elasticsearch([elastic_host])

App/TTS/utils/Picsart.py ADDED Viewed

	@@ -0,0 +1,33 @@

+import asyncio
+from playwright.async_api import async_playwright
+async def extract_bootstrap_data():
+    async with async_playwright() as p:
+        browser = await p.chromium.launch()
+        page = await browser.new_page()
+        # Navigate to the Pixabay Sound Effects page
+        await page.goto('https://pixabay.com/sound-effects/search/door%20creaking/')
+        # Wait for the content to load (you can adjust the timeout as needed)
+        # await page.wait_for_selector('.js-media-list-wrapper')
+        # await page.wait_for_selector('.js-media-item')
+        # Get the content of the 5th script tag
+        # script_content = await page.evaluate('''() => {
+        #     const scripty=document.querySelectorAll('script')[0];
+        #     return scripty.content
+        # }''')
+        # print(script_content)
+        # await page.evaluate(f'''{script_content}(''')
+        page_content = await page.content()
+        # Print the content of the 5th script tag
+        # print(page_content)
+        # Close the browser
+        await browser.close()
+# Run the extraction function
+if __name__ == '__main__':
+    asyncio.run(extract_bootstrap_data())

App/TTS/utils/Podcastle.py CHANGED Viewed

@@ -1,19 +1,20 @@
 import aiohttp
 import asyncio
-from App.TTS.Schemas import TTSGenerateRequest,StatusRequest
 from pydantic import BaseModel
 class PodcastleAPI:
     def __init__(self, username, password):
         self.base_url = "https://podcastle.ai/api"
         self.username = username
         self.password = password
         self.headers = {
-            'authority': 'podcastle.ai',
-            'accept': '*/*',
-            'accept-language': 'en-US,en;q=0.9',
-            'cache-control': 'no-cache',
-            'content-type': 'application/json',
             # Add your other headers here
         }
         self.session = None  # Initialize the session in the constructor
@@ -28,17 +29,14 @@ class PodcastleAPI:
     async def signin(self):
         url = f"{self.base_url}/auth/signin"
-        payload = {
-            "username": self.username,
-            "password": self.password
-        }
         if not self.session:
             await self.create_session()
         async with self.session.post(url, json=payload) as response:
             response_data = await response.json()
-            self.access_token = response_data['auth']['accessToken']
             return response_data
     async def make_request(self, tts_request: TTSGenerateRequest):
@@ -49,17 +47,21 @@ class PodcastleAPI:
             await self.signin()
         headers_with_auth = self.headers.copy()
-        headers_with_auth['authorization'] = f"Bearer {self.access_token}"
         url = f"{self.base_url}/speech/text-to-speech"
-        async with self.session.post(url, json=tts_request.dict(), headers=headers_with_auth) as response:
             if response.status == 401:
                 # If a 401 error is encountered, sign in again to update the access token
                 await self.signin()
                 # Retry the request with the updated access token
-                headers_with_auth['authorization'] = f"Bearer {self.access_token}"
-                async with self.session.post(url, json=tts_request.dict(), headers=headers_with_auth) as retry_response:
                     response_text = await retry_response.json()
                     return response_text
             else:
@@ -74,7 +76,7 @@ class PodcastleAPI:
             await self.signin()
         headers_with_auth = self.headers.copy()
-        headers_with_auth['authorization'] = f"Bearer {self.access_token}"
         url = f"{self.base_url}/speech/text-to-speech/{tts_status.requestId}"
@@ -83,17 +85,16 @@ class PodcastleAPI:
                 # If a 401 error is encountered, sign in again to update the access token
                 await self.signin()
                 # Retry the request with the updated access token
-                headers_with_auth['authorization'] = f"Bearer {self.access_token}"
-                async with self.session.get(url, headers=headers_with_auth) as retry_response:
                     response_text = await retry_response.json()
                     return response_text
             else:
                 response_text = await response.json()
                 return response_text
     async def __aenter__(self):
         if not self.session:
             await self.create_session()
@@ -101,40 +102,3 @@ class PodcastleAPI:
     async def __aexit__(self, exc_type, exc_value, traceback):
         await self.close_session()
-# Example usage:
-if __name__ == "__main__":
-    class Speak(BaseModel):
-        paragraphId: str
-        text: str
-        speaker: str
-    class TTSGenerateRequest(BaseModel):
-        paragraphs: [Speak]
-        requestId: str
-        workspaceId: str
-    async def main():
-        username = "[email protected]"
-        password = "k7bNvgmJUda3yEG"
-        # Create a TTSGenerateRequest object
-        tts_request = TTSGenerateRequest(
-            paragraphs=[
-                Speak(
-                    paragraphId="6f05p",
-                    text="<speak>Hey Daniel. Are you ok?. Manchester United almost lost yesterday  </speak>",
-                    speaker="c60166365edf46589657770d"
-                )
-            ],
-            requestId="7d6018ae-9617-4d22-879f-5e67283fa140",
-            workspaceId="f84fd58e-2899-4531-9f51-77c155c1e294"
-        )
-        async with PodcastleAPI(username, password) as podcastle_api:
-            # Make the TTS request using the TTSGenerateRequest object
-            response_text = await podcastle_api.make_request(tts_request)
-            print(response_text)
-    loop = asyncio.get_event_loop()
-    loop.run_until_complete(main())

 import aiohttp
 import asyncio
+from App.TTS.Schemas import TTSGenerateRequest, StatusRequest
 from pydantic import BaseModel
 class PodcastleAPI:
     def __init__(self, username, password):
         self.base_url = "https://podcastle.ai/api"
         self.username = username
         self.password = password
         self.headers = {
+            "authority": "podcastle.ai",
+            "accept": "*/*",
+            "accept-language": "en-US,en;q=0.9",
+            "cache-control": "no-cache",
+            "content-type": "application/json",
             # Add your other headers here
         }
         self.session = None  # Initialize the session in the constructor
     async def signin(self):
         url = f"{self.base_url}/auth/signin"
+        payload = {"username": self.username, "password": self.password}
         if not self.session:
             await self.create_session()
         async with self.session.post(url, json=payload) as response:
             response_data = await response.json()
+            self.access_token = response_data["auth"]["accessToken"]
             return response_data
     async def make_request(self, tts_request: TTSGenerateRequest):
             await self.signin()
         headers_with_auth = self.headers.copy()
+        headers_with_auth["authorization"] = f"Bearer {self.access_token}"
         url = f"{self.base_url}/speech/text-to-speech"
+        async with self.session.post(
+            url, json=tts_request.dict(), headers=headers_with_auth
+        ) as response:
             if response.status == 401:
                 # If a 401 error is encountered, sign in again to update the access token
                 await self.signin()
                 # Retry the request with the updated access token
+                headers_with_auth["authorization"] = f"Bearer {self.access_token}"
+                async with self.session.post(
+                    url, json=tts_request.dict(), headers=headers_with_auth
+                ) as retry_response:
                     response_text = await retry_response.json()
                     return response_text
             else:
             await self.signin()
         headers_with_auth = self.headers.copy()
+        headers_with_auth["authorization"] = f"Bearer {self.access_token}"
         url = f"{self.base_url}/speech/text-to-speech/{tts_status.requestId}"
                 # If a 401 error is encountered, sign in again to update the access token
                 await self.signin()
                 # Retry the request with the updated access token
+                headers_with_auth["authorization"] = f"Bearer {self.access_token}"
+                async with self.session.get(
+                    url, headers=headers_with_auth
+                ) as retry_response:
                     response_text = await retry_response.json()
                     return response_text
             else:
                 response_text = await response.json()
                 return response_text
     async def __aenter__(self):
         if not self.session:
             await self.create_session()
     async def __aexit__(self, exc_type, exc_value, traceback):
         await self.close_session()