Final_Assignment_Agent

Paused

App Files Files Community

Martin Bär committed on Apr 27

Commit

09a402e

1 Parent(s): ba66f78

Only activate langfuse conditionally

Browse files

Files changed (2) hide show

.gitignore +1 -1
basic_agent.py +18 -8

.gitignore CHANGED Viewed

@@ -1,4 +1,4 @@
 __pycache__
 .venv
-tool_tests.ipynb
 .env

 __pycache__
 .venv
+*.ipynb
 .env

basic_agent.py CHANGED Viewed

@@ -8,14 +8,20 @@ from llama_index.core.tools.tool_spec.load_and_search import LoadAndSearchToolSp
 from llama_index.readers.web import SimpleWebPageReader
 from llama_index.core.tools.ondemand_loader_tool import OnDemandLoaderTool
 from langfuse.llama_index import LlamaIndexInstrumentor
-# Langfuse
-instrumentor = LlamaIndexInstrumentor()
-instrumentor.start()
 class BasicAgent:
-    def __init__(self):
-        llm = HuggingFaceInferenceAPI(model_name="Qwen/Qwen2.5-Coder-32B-Instruct")
         # Initialize tools
         tool_spec = DuckDuckGoSearchToolSpec()
@@ -31,6 +37,8 @@ class BasicAgent:
         # Convert into a LoadAndSearchToolSpec because the wikipedia search tool returns
         # entire Wikipedia pages and this can pollute the context window of the LLM
         wiki_search_tool_las = LoadAndSearchToolSpec.from_defaults(wiki_search_tool).to_tool_list()
         webpage_tool = OnDemandLoaderTool.from_defaults(
@@ -41,7 +49,7 @@ class BasicAgent:
         # Create Alfred with all the tools
         self.agent = AgentWorkflow.from_tools_or_functions(
-            wiki_search_tool_las + [search_tool], # webpage_tool does not work properly
             llm=llm,
             verbose=True,
             system_prompt=("You are a helpful agent that can search Wikipedia and the Internet for answers. "
@@ -52,5 +60,7 @@ class BasicAgent:
     async def __call__(self, question: str) -> str:
         response = await self.agent.run(user_msg=question) # ctx=self.ctx)
-        instrumentor.flush()
         return response.response.content

 from llama_index.readers.web import SimpleWebPageReader
 from llama_index.core.tools.ondemand_loader_tool import OnDemandLoaderTool
 from langfuse.llama_index import LlamaIndexInstrumentor
+from llama_index.llms.ollama import Ollama
 class BasicAgent:
+    def __init__(self, ollama=False, langfuse=True):
+        if not ollama:
+            llm = HuggingFaceInferenceAPI(model_name="Qwen/Qwen2.5-Coder-32B-Instruct")
+        else:
+            llm = Ollama(model="mistral:latest", request_timeout=120.0)
+        # Langfuse
+        self.langfuse = langfuse
+        if self.langfuse:
+            self.instrumentor = LlamaIndexInstrumentor()
+            self.instrumentor.start()
         # Initialize tools
         tool_spec = DuckDuckGoSearchToolSpec()
         # Convert into a LoadAndSearchToolSpec because the wikipedia search tool returns
         # entire Wikipedia pages and this can pollute the context window of the LLM
+        # TODO this does not work so well. We need to make the retriever return the top 5 chunks or sth.
         wiki_search_tool_las = LoadAndSearchToolSpec.from_defaults(wiki_search_tool).to_tool_list()
         webpage_tool = OnDemandLoaderTool.from_defaults(
         # Create Alfred with all the tools
         self.agent = AgentWorkflow.from_tools_or_functions(
+            wiki_search_tool_las + [search_tool], # webpage_tool does not work properly - cookies etc
             llm=llm,
             verbose=True,
             system_prompt=("You are a helpful agent that can search Wikipedia and the Internet for answers. "
     async def __call__(self, question: str) -> str:
         response = await self.agent.run(user_msg=question) # ctx=self.ctx)
+        if self.langfuse:
+            self.instrumentor.flush()
         return response.response.content