# HF_Agents_Final_Project/tests/test_chess_formatting.py
# Author: Yago Bolivar
# Commit 9bdf620 — feat: add tests for chess position analysis and prompt formatting scenarios
import yaml
import os
import pytest
from unittest.mock import MagicMock
# Create mock classes for testing
class MockModel:
    """Minimal stand-in for an LLM backend used by the test agent.

    Calling an instance delegates to ``generate_text``, mirroring the
    callable-model interface the agent under test expects.
    """

    def __init__(self):
        pass

    def __call__(self, prompt, **kwargs):
        # Delegation means subclasses only need to override generate_text.
        return self.generate_text(prompt, **kwargs)

    def generate_text(self, prompt, **kwargs):
        # Intentionally a no-op; concrete test models override this.
        pass
class CodeAgent:
    """Lightweight simulation of a code-writing agent for prompt tests.

    Drives the supplied model for up to ``max_steps`` turns, unwrapping
    OpenAI-style chat-completion payloads, and stops early once a response
    mentions ``final_answer``.
    """

    def __init__(self, model=None, tools=None, max_steps=None, verbosity_level=None,
                 name=None, description=None, prompt_templates=None):
        self.model = model
        self.tools = tools
        self.max_steps = max_steps
        self.verbosity_level = verbosity_level
        self.name = name
        self.description = description
        self.prompt_templates = prompt_templates
        self.step_counter = 0

    def run(self, query):
        """Simulate running the agent for testing purposes."""
        answer = None
        step = 0
        while step < self.max_steps:
            answer = self.model.generate_text("", step=step)
            # Unwrap an OpenAI-style chat-completion payload to plain text.
            if isinstance(answer, dict) and "choices" in answer:
                answer = answer["choices"][0]["message"]["content"]
            # Stop as soon as the model signals it has produced a final answer.
            if "final_answer" in answer:
                break
            step += 1
        return answer

    def __call__(self, query):
        return self.run(query)
# Load the updated prompts.yaml, resolving its path relative to this script.
# Default to an empty mapping so the name is always bound, even on failure.
prompt_templates = {}
try:
    script_dir = os.path.dirname(os.path.abspath(__file__))
    project_root = os.path.dirname(script_dir)  # up one level: tests/ -> project root
    prompts_path = os.path.join(project_root, "prompts.yaml")
    print(f"Looking for prompts.yaml at: {prompts_path}")
    with open(prompts_path, 'r') as stream:
        prompt_templates = yaml.safe_load(stream)
    print("Successfully loaded prompts.yaml")
except FileNotFoundError:
    print(f"Warning: prompts.yaml not found at {prompts_path}. Tests may fail.")
    prompt_templates = {}
except yaml.YAMLError as e:
    print(f"Error parsing prompts.yaml: {e}")
    prompt_templates = {}
# Create a specialized model for testing chess position scenario
class ChessPositionTestModel(MockModel):
    """Scripted model that replays a fixed multi-step chess-analysis dialogue.

    Each ``generate_text`` call returns the canned response for the requested
    step (``kwargs['step']``, default 0), wrapped in an OpenAI-style
    chat-completion payload. Steps past the script return "Test complete".

    The redundant ``__init__`` (which only called ``super().__init__()``) has
    been removed; the scripted responses are hoisted to a class-level constant
    so they are built once rather than on every call.
    """

    # Canned responses indexed by step number. The text is the exact script
    # the formatting tests expect — do not reflow it.
    _RESPONSES = [
        # Step 0: Initial response asking for the chess image
        """Thought: I need to see the chess image to analyze the position.
```py
print("I need the chess image to analyze the position. Please provide the image.")
```<end_code>""",
        # Step 1: After receiving the image
        """Thought: Now I can see the chess position. I'll analyze it.
```py
from src.image_processing_tool import ImageProcessor
image_processor = ImageProcessor()
analysis = image_processor.analyze_chess_position(image_path="chess_image.png")
print(f"Chess position analysis: {analysis}")
```<end_code>""",
        # Step 2: Error handling when image analysis fails
        """Thought: There was an error analyzing the chess position. I'll try a different approach.
```py
print("The image analysis failed. Let me try a different method.")
# Alternative approach
```<end_code>""",
        # Step 3: Final answer
        """Thought: I've analyzed the chess position and determined the best move.
```py
final_answer("e4 to e5")
```<end_code>""",
    ]

    def generate_text(self, prompt, **kwargs):
        """Return the scripted completion for the given step.

        Args:
            prompt: Ignored; the script depends only on the step number.
            **kwargs: ``step`` selects the scripted response (default 0).

        Returns:
            dict: An OpenAI-style ``{"choices": [...]}`` payload.
        """
        step = kwargs.get("step", 0)
        if step < len(self._RESPONSES):
            content = self._RESPONSES[step]
        else:
            content = "Test complete"
        return {"choices": [{"message": {"content": content}}]}
# Simulating a chess position analysis
def test_chess_position_scenario():
    """End-to-end check that the agent drives the scripted chess dialogue.

    Builds dummy tools and a scripted model, runs the agent for up to four
    steps, and asserts the scripted final answer is reached.

    Fixes over the previous version: the test returned a value (which pytest
    flags with PytestReturnNotNoneWarning) and asserted nothing, so it could
    never fail; agent-creation errors were printed and swallowed instead of
    failing the test.
    """
    print("\nTesting chess position analysis scenario\n")

    # Minimal versions of the project tools, exposing only the attributes
    # the agent interface expects.
    class DummyImageProcessorTool:
        def __init__(self):
            self.name = "image_processor"
            self.description = "Analyze images including chess positions"
            self.inputs = {"image_path": "string"}
            self.output_type = "string"

        def analyze_chess_position(self, image_path):
            return "Position analyzed: white king on e1, black king on e8"

    class DummyFinalAnswerTool:
        def __init__(self):
            self.name = "final_answer"
            self.description = "Use this to provide the final answer"
            self.inputs = {"answer": "string"}
            self.output_type = "string"

        def __call__(self, answer):
            return f"Final answer submitted: {answer}"

    model = ChessPositionTestModel()
    tools = [DummyImageProcessorTool(), DummyFinalAnswerTool()]
    try:
        agent = CodeAgent(
            model=model,
            tools=tools,
            max_steps=4,  # Allow for 4 steps to see all responses
            verbosity_level=2,  # Increased verbosity to see more details
            name="ChessTestAgent",
            description="Testing chess position analysis formatting",
            prompt_templates=prompt_templates,
        )
    except Exception as e:
        # A construction failure is a test failure, not something to skip past.
        pytest.fail(f"Error creating agent: {e}")

    print("Starting chess position analysis test...")
    result = agent("Analyze this chess position and determine the best move for white.")
    print(f"Final result: {result}")
    print("-" * 50)
    # The scripted model emits final_answer("e4 to e5") on its last step,
    # so the agent must stop on a response containing "final_answer".
    assert result is not None, "Agent produced no response"
    assert "final_answer" in result, f"Agent never reached the final answer: {result!r}"
def test_prompt_structure():
    """Test that the prompt structure includes proper formatting instructions.

    Verifies the loaded system prompt contains the required formatting
    section headers, code-block markers, and a well-formed example.

    Bug fixed: when no blank line followed the example section,
    ``str.find`` returned -1 and the slice ``[start:-1]`` silently dropped
    the final character instead of taking the rest of the string.
    """
    print("\nTesting prompt structure for formatting instructions\n")
    # Check if prompts.yaml was loaded successfully
    if not prompt_templates:
        pytest.skip("No prompt templates available to test")
    # Get the system prompt from the templates
    system_prompt = prompt_templates.get("system_prompt", {}).get("main", "")
    # Check that the system prompt contains the necessary elements
    formatting_elements = [
        "IMPORTANT FORMATTING RULES for ALL responses:",  # Section header
        "EVERY response MUST follow the format",  # Format requirement
        "```py",  # Code block start
        "```<end_code>",  # Code block end
        "MUST include a code block",  # Code block requirement
        "Example of correct formatting:",  # Example section
    ]
    for element in formatting_elements:
        assert element in system_prompt, f"Missing required formatting element: {element}"
    # Check that the example shows proper formatting
    example_start = system_prompt.find("Example of correct formatting:")
    if example_start == -1:
        pytest.fail("No formatting example found in system prompt")
    # The example runs to the next blank line, or to the end of the prompt
    # when no blank line follows.
    example_end = system_prompt.find("\n\n", example_start)
    if example_end == -1:
        example_end = len(system_prompt)
    example_content = system_prompt[example_start:example_end]
    assert "Thought:" in example_content, "Example missing Thought: section"
    assert "```py" in example_content, "Example missing code block start"
    assert "```<end_code>" in example_content, "Example missing code block end"
    print("✓ Prompt structure contains all required formatting elements")
# Run the tests if executed directly (pytest discovers them by name otherwise).
if __name__ == "__main__":
    for _test in (test_prompt_structure, test_chess_position_scenario):
        _test()