# GAIA_Agent/agents/reasoning_agent.py
# Author: Delanoe Pirard
# Related asset: cookies.txt
# Commit: 68bd1d5
import os
import logging
from llama_index.core.agent.workflow import ReActAgent
from llama_index.core.tools import FunctionTool
from llama_index.llms.google_genai import GoogleGenAI
from llama_index.llms.openai import OpenAI
# Setup logging
logger = logging.getLogger(__name__)
# Helper function to load prompt from file
def load_prompt_from_file(filename: str, default_prompt: str) -> str:
    """Load a prompt from a text file located relative to this script.

    Args:
        filename: Path of the prompt file, relative to this script's directory.
        default_prompt: Fallback prompt returned when the file is missing or unreadable.

    Returns:
        The file contents, or ``default_prompt`` on any failure.
    """
    # Resolve relative to this module so the prompt ships alongside the agent code.
    # Computed outside the try block so `prompt_path` is always bound in the
    # exception handlers (originally it could be unbound if path resolution failed).
    script_dir = os.path.dirname(__file__)
    prompt_path = os.path.join(script_dir, filename)
    try:
        with open(prompt_path, "r", encoding="utf-8") as f:
            prompt = f.read()
        logger.info(f"Successfully loaded prompt from {prompt_path}")
        return prompt
    except FileNotFoundError:
        # Fixed: log messages previously printed the literal "(unknown)" instead
        # of the actual filename.
        logger.warning(f"Prompt file {filename} not found at {prompt_path}. Using default.")
        return default_prompt
    except Exception as e:
        logger.error(f"Error loading prompt file {filename}: {e}", exc_info=True)
        return default_prompt
# --- Tool Function ---
def reasoning_tool_fn(context: str) -> str:
    """
    Perform chain-of-thought reasoning over the provided context using a dedicated LLM.

    Args:
        context (str): The conversation/workflow history and current problem statement.

    Returns:
        str: A structured reasoning trace and conclusion, or an error message.
    """
    logger.info(f"Executing reasoning tool with context length: {len(context)}")

    # Configuration for the reasoning LLM (OpenAI in the original).
    reasoning_llm_model = os.getenv("REASONING_LLM_MODEL", "gpt-4o-mini")  # Use gpt-4o-mini as default
    openai_api_key = os.getenv("OPENAI_API_KEY")
    if not openai_api_key:
        # Fixed: the messages previously referred to ALPAFLOW_OPENAI_API_KEY, but the
        # environment variable actually read above is OPENAI_API_KEY.
        logger.error("OPENAI_API_KEY not found for reasoning tool LLM.")
        return "Error: OPENAI_API_KEY must be set to use the reasoning tool."

    # Prompt instructing the reasoning LLM to produce a structured trace.
    reasoning_prompt = f"""You are an expert reasoning engine. Analyze the following workflow context and problem statement:
--- CONTEXT START ---
{context}
--- CONTEXT END ---
Perform the following steps:
1. **Comprehension**: Identify the core question/problem and key constraints from the context.
2. **Decomposition**: Break the problem into logical sub-steps.
3. **Chain-of-Thought**: Reason through each sub-step, stating assumptions and deriving implications.
4. **Verification**: Check conclusions against constraints.
5. **Synthesis**: Integrate results into a cohesive answer/recommendation.
6. **Clarity**: Use precise language.
Respond with your numbered reasoning steps followed by a concise final conclusion or recommendation.
"""
    try:
        # NOTE(review): reasoning_effort is only accepted by reasoning-class models
        # (o-series); the default gpt-4o-mini may reject it — confirm against the
        # model actually deployed via REASONING_LLM_MODEL.
        llm = OpenAI(
            model=reasoning_llm_model,
            api_key=openai_api_key,
            reasoning_effort="high",
            temperature=0.055,
            max_tokens=16384,
        )
        logger.info(f"Using reasoning LLM: {reasoning_llm_model}")
        response = llm.complete(reasoning_prompt)
        logger.info("Reasoning tool execution successful.")
        return response.text
    except Exception as e:
        logger.error(f"Error during reasoning tool LLM call: {e}", exc_info=True)
        return f"Error during reasoning: {e}"
def answer_question(question: str) -> str:
    """
    Answer any question by following this strict format:

    1. Include your chain of thought (your reasoning steps).
    2. End your reply with the exact template:
       FINAL ANSWER: [YOUR FINAL ANSWER]

    YOUR FINAL ANSWER must be:
    - A number, or
    - As few words as possible, or
    - A comma-separated list of numbers and/or strings.

    Formatting rules:
    * If asked for a number, do not use commas or units (e.g., $, %), unless explicitly requested.
    * If asked for a string, do not include articles or abbreviations (e.g., city names), and write digits in plain text.
    * If asked for a comma-separated list, apply the above rules to each element.

    This tool should be invoked immediately after completing the final planning sub-step.
    """
    logger.info(f"Answering question: {question[:100]}")

    gemini_api_key = os.getenv("GEMINI_API_KEY")
    if not gemini_api_key:
        logger.error("GEMINI_API_KEY not set for answer_question tool.")
        return "Error: GEMINI_API_KEY not set."

    model_name = os.getenv("ANSWER_TOOL_LLM_MODEL", "gemini-2.5-pro-preview-03-25")

    # Build the assistant prompt enforcing the required answer format.
    assistant_prompt = (
        "You are a general AI assistant. I will ask you a question. "
        "Report your thoughts, and finish your answer with the following template: "
        "FINAL ANSWER: [YOUR FINAL ANSWER]. "
        "YOUR FINAL ANSWER should be a number OR as few words as possible "
        "OR a comma separated list of numbers and/or strings. "
        "If you are asked for a number, don't use commas for thousands or any units like $ or % unless specified. "
        "If you are asked for a string, omit articles and abbreviations, and write digits in plain text. "
        "If you are asked for a comma separated list, apply these rules to each element.\n\n"
        f"Question: {question}\n"
        "Answer:"
    )
    try:
        # Fixed: the model name was hard-coded here, silently ignoring the
        # ANSWER_TOOL_LLM_MODEL override; now the configured model_name is used
        # and matches what the log line reports.
        llm = GoogleGenAI(api_key=gemini_api_key, model=model_name, temperature=0.05)
        logger.info(f"Using answer LLM: {model_name}")
        response = llm.complete(assistant_prompt)
        logger.info("Answer generated successfully.")
        return response.text
    except Exception as e:
        logger.error(f"LLM call failed during answer generation: {e}", exc_info=True)
        return f"Error during answer generation: {e}"
# --- Tool Definition ---
# Wrap the plain functions as llama_index FunctionTools so agents can invoke them.
reasoning_tool = FunctionTool.from_defaults(
    fn=reasoning_tool_fn,
    name="reasoning_tool",
    description=(
        "Applies detailed chain-of-thought reasoning to the provided workflow context using a dedicated LLM. "
        "Input: context (str). Output: Reasoning steps and conclusion (str) or error message."
    ),
)
# NOTE(review): this rebinds the module-level name `answer_question`, shadowing the
# function defined above. It still works because `fn=` captured the function object
# before the rebinding, but a distinct name (e.g. answer_question_tool) would be
# clearer — renaming is deferred since it would change the module's public interface.
answer_question = FunctionTool.from_defaults(
    fn=answer_question,
    name="answer_question",
    description=(
        "Use this tool to answer any question, reporting your reasoning steps and ending with 'FINAL ANSWER: ...'. "
        "Invoke this tool immediately after the final sub-step of planning is complete."
    ),
)
# --- Agent Initialization ---
def initialize_reasoning_agent() -> ReActAgent:
    """Initialize and return the ReasoningAgent.

    Reads REASONING_AGENT_LLM_MODEL (optional, defaults to a Gemini preview model)
    and GEMINI_API_KEY (required) from the environment.

    Returns:
        ReActAgent: The configured reasoning agent.

    Raises:
        ValueError: If GEMINI_API_KEY is not set.
    """
    logger.info("Initializing ReasoningAgent...")

    # Configuration for the agent's main LLM (Google GenAI).
    agent_llm_model = os.getenv("REASONING_AGENT_LLM_MODEL", "gemini-2.5-pro-preview-03-25")
    gemini_api_key = os.getenv("GEMINI_API_KEY")
    if not gemini_api_key:
        logger.error("GEMINI_API_KEY not found for ReasoningAgent.")
        raise ValueError("GEMINI_API_KEY must be set for ReasoningAgent")

    try:
        # Fixed: the model name was hard-coded here, silently ignoring the
        # REASONING_AGENT_LLM_MODEL override; now the configured value is used
        # and matches what the log line reports.
        llm = GoogleGenAI(api_key=gemini_api_key, model=agent_llm_model, temperature=0.05)
        logger.info(f"Using agent LLM: {agent_llm_model}")

        # Load system prompt, falling back to a placeholder default.
        default_system_prompt = (
            "You are ReasoningAgent... [Default prompt content - replace with actual]"  # Placeholder
        )
        system_prompt = load_prompt_from_file("../prompts/reasoning_agent_prompt.txt", default_system_prompt)
        if system_prompt == default_system_prompt:
            logger.warning("Using default/fallback system prompt for ReasoningAgent.")

        agent = ReActAgent(
            name="reasoning_agent",
            description=(
                "An autonomous reasoning specialist that applies `reasoning_tool` to perform "
                "in-depth chain-of-thought analysis on incoming queries or contexts, "
                "then seamlessly delegates the synthesized insights to `planner_agent` "
                "or `long_context_management_agent` for subsequent task orchestration."
            ),
            tools=[reasoning_tool],
            llm=llm,
            system_prompt=system_prompt,
            can_handoff_to=[
                "code_agent",
                "research_agent",
                "math_agent",
                "role_agent",
                "image_analyzer_agent",
                "text_analyzer_agent",
                "planner_agent",
                "long_context_management_agent",
                "advanced_validation_agent",
                "video_analyzer_agent",
            ],
        )
        return agent
    except Exception as e:
        logger.error(f"Error during ReasoningAgent initialization: {e}", exc_info=True)
        raise
# Example usage (for testing if run directly)
if __name__ == "__main__":
    logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(name)s - %(levelname)s - %(message)s')
    logger.info("Running reasoning_agent.py directly for testing...")

    # Fixed: the key list previously required ALPAFLOW_OPENAI_API_KEY, but
    # reasoning_tool_fn actually reads OPENAI_API_KEY — check the variable that
    # the code path really uses.
    required_keys = ["GEMINI_API_KEY", "OPENAI_API_KEY"]
    missing_keys = [key for key in required_keys if not os.getenv(key)]
    if missing_keys:
        print(f"Error: Required environment variable(s) not set: {', '.join(missing_keys)}. Cannot run test.")
    else:
        try:
            # Exercise the reasoning tool directly with a small canned context.
            print("\nTesting reasoning_tool_fn...")
            test_context = "User asked: What is the capital of France? ResearchAgent found: Paris. VerifierAgent confirmed: High confidence."
            reasoning_output = reasoning_tool_fn(test_context)
            print(f"Reasoning Tool Output:\n{reasoning_output}")

            # Initialize the agent (optional)
            # test_agent = initialize_reasoning_agent()
            # print("\nReasoning Agent initialized successfully for testing.")
            # Example chat (would require context passing mechanism)
            # result = test_agent.chat("Synthesize the findings about the capital of France.")
            # print(f"Agent chat result: {result}")
        except Exception as e:
            print(f"Error during testing: {e}")