Final_Assignment_Template

Sleeping

App Files Files Community

lovepreetsingh1996 committed on May 2

Commit

3cf70e0

1 Parent(s): 4946de1

fix: remove wikipedia

Browse files

Files changed (1) hide show

app.py +34 -31

app.py CHANGED Viewed

@@ -36,24 +36,28 @@ class BasicAgent:
         print("BasicAgent initialized.")
     def __call__(self, question: str) -> str:
         print(f"Agent received question (first 50 chars): {question[:50]}...")
-        def get_youtube_transcript(youtube_link: str) -> str:
             """Fetches transcript of the given youtube_link and returns matching answers based on query.
                 Args:
                 youtube_link (str): youtube video link for which we need to answer questions on.
             """
-            loader = YoutubeTranscriptReader()
-            documents = loader.load_data(
-                ytlinks=[youtube_link]
-            )
-            text = documents[0].text_resource.text
-            return "Here's the transcript from the video, examine and formulate answer based on what is said in the transcript: \n" + text
         youtube_transcript_answer_tool = FunctionTool.from_defaults(
-            get_youtube_transcript,
-            name="get_youtube_transcript",
-            description="Fetches transcript of the given youtube video and returns matching answers based on query. To be called when video link is given.",
         )
         def duck_duck_go_search_tool(query: str) -> str:
@@ -82,33 +86,32 @@ class BasicAgent:
                 description="Searches the web and refines the result into a high-quality answer. Use when other tools don't seem suitable"
             )
-        def wikipedia_search(query: str) -> str:
-            try:
-                text = WikipediaToolSpec().search_data(query)
-                documents = [Document(text)]
-                splitter = SentenceSplitter(chunk_size=256)
-                nodes = splitter.get_nodes_from_documents(documents)
-                retriever = BM25Retriever(nodes=nodes, similarity_top_k=10)
-                synthesizer = get_response_synthesizer(response_mode="refine", llm=self.llm)
-                query_engine = RetrieverQueryEngine(retriever=retriever, response_synthesizer=synthesizer)
-                response = query_engine.query(query)
-                return response.response
-            except Exception as e:
-                return f"An error occurred: {e}"
-        wikipedia_search_tool = FunctionTool.from_defaults(
-                wikipedia_search,
-                name="wikipedia_search",
-                description="Searches wikipedia and converts results into a high quality answer."
-            )
-        agent = AgentWorkflow.from_tools_or_functions([duckduckgo_search_tool, youtube_transcript_answer_tool, wikipedia_search_tool], llm=self.llm)
         async def run_agent():
             return await agent.run(question)
@@ -173,7 +176,7 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
     answers_payload = []
     print(f"Running agent on {len(questions_data)} questions...")
     for item in questions_data:
-        time.sleep(45)
         task_id = item.get("task_id")
         question_text = item.get("question")
         if not task_id or question_text is None:

         print("BasicAgent initialized.")
     def __call__(self, question: str) -> str:
         print(f"Agent received question (first 50 chars): {question[:50]}...")
+        def get_answers_from_youtube_transcript(youtube_link: str) -> str:
             """Fetches transcript of the given youtube_link and returns matching answers based on query.
                 Args:
                 youtube_link (str): youtube video link for which we need to answer questions on.
+                query (str): question to answer from video transcript.
             """
+            try:
+                loader = YoutubeTranscriptReader()
+                documents = loader.load_data(
+                    ytlinks=[youtube_link]
+                )
+                text = documents[0].text_resource.text
+                return "Here's the transcript from the video, examine and formulate answer based on what is said in the transcript: \n" + text
+            except Exception as e:
+                print("error", e)
         youtube_transcript_answer_tool = FunctionTool.from_defaults(
+            get_answers_from_youtube_transcript,
+            name="get_answers_from_youtube_transcript",
+            description="Fetches transcript of the given youtube_link and returns matching answers based on query. To be called when video link is given.",
         )
         def duck_duck_go_search_tool(query: str) -> str:
                 description="Searches the web and refines the result into a high-quality answer. Use when other tools don't seem suitable"
             )
+        # def wikipedia_search(query: str) -> str:
+        #     try:
+        #         text = WikipediaToolSpec().search_data(query)
+        #         documents = [Document(text=text)]
+        #         splitter = SentenceSplitter(chunk_size=256)
+        #         nodes = splitter.get_nodes_from_documents(documents)
+        #         retriever = BM25Retriever(nodes=nodes, similarity_top_k=1)
+        #         synthesizer = get_response_synthesizer(response_mode="refine", llm=llm)
+        #         query_engine = RetrieverQueryEngine(retriever=retriever, response_synthesizer=synthesizer)
+        #         response = query_engine.query(query)
+        #         return response.response
+        #     except Exception as e:
+        #         return f"An error occurred: {e}"
+        # wikipedia_search_tool = FunctionTool.from_defaults(
+        #         wikipedia_search,
+        #         name="wikipedia_search",
+        #         description="Searches wikipedia and converts results into a high quality answer."
+        #     )
+        agent = AgentWorkflow.from_tools_or_functions([duckduckgo_search_tool, youtube_transcript_answer_tool], llm=self.llm)
         async def run_agent():
             return await agent.run(question)
     answers_payload = []
     print(f"Running agent on {len(questions_data)} questions...")
     for item in questions_data:
+        time.sleep(60)
         task_id = item.get("task_id")
         question_text = item.get("question")
         if not task_id or question_text is None: