import os from typing import List, Optional, Union from agentpress.tool import Tool, ToolResult, openapi_schema, xml_schema class MessageTool(Tool): """Tool for user communication and interaction. This tool provides methods for asking questions, with support for attachments and user takeover suggestions. """ def __init__(self): super().__init__() # Commented out as we are just doing this via prompt as there is no need to call it as a tool @openapi_schema({ "type": "function", "function": { "name": "ask", "description": "Ask user a question and wait for response. Use for: 1) Requesting clarification on ambiguous requirements, 2) Seeking confirmation before proceeding with high-impact changes, 3) Gathering additional information needed to complete a task, 4) Offering options and requesting user preference, 5) Validating assumptions when critical to task success. IMPORTANT: Use this tool only when user input is essential to proceed. Always provide clear context and options when applicable. Include relevant attachments when the question relates to specific files or resources.", "parameters": { "type": "object", "properties": { "text": { "type": "string", "description": "Question text to present to user - should be specific and clearly indicate what information you need. Include: 1) Clear question or request, 2) Context about why the input is needed, 3) Available options if applicable, 4) Impact of different choices, 5) Any relevant constraints or considerations." }, "attachments": { "anyOf": [ {"type": "string"}, {"items": {"type": "string"}, "type": "array"} ], "description": "(Optional) List of files or URLs to attach to the question. Include when: 1) Question relates to specific files or configurations, 2) User needs to review content before answering, 3) Options or choices are documented in files, 4) Supporting evidence or context is needed. Always use relative paths to /workspace directory." } }, "required": ["text"] } } }) @xml_schema( tag_name="ask", mappings=[ {"param_name": "text", "node_type": "content", "path": "."}, {"param_name": "attachments", "node_type": "attribute", "path": ".", "required": False} ], example=''' Ask user a question and wait for response. Use for: 1) Requesting clarification on ambiguous requirements, 2) Seeking confirmation before proceeding with high-impact changes, 3) Gathering additional information needed to complete a task, 4) Offering options and requesting user preference, 5) Validating assumptions when critical to task success. IMPORTANT: Use this tool only when user input is essential to proceed. Always provide clear context and options when applicable. Include relevant attachments when the question relates to specific files or resources. I'm planning to bake the chocolate cake for your birthday party. The recipe mentions "rich frosting" but doesn't specify what type. Could you clarify your preferences? For example: 1. Would you prefer buttercream or cream cheese frosting? 2. Do you want any specific flavor added to the frosting (vanilla, coffee, etc.)? 3. Should I add any decorative toppings like sprinkles or fruit? 4. Do you have any dietary restrictions I should be aware of? This information will help me make sure the cake meets your expectations for the celebration. ''' ) async def ask(self, text: str, attachments: Optional[Union[str, List[str]]] = None) -> ToolResult: """Ask the user a question and wait for a response. Args: text: The question to present to the user attachments: Optional file paths or URLs to attach to the question Returns: ToolResult indicating the question was successfully sent """ try: # Convert single attachment to list for consistent handling if attachments and isinstance(attachments, str): attachments = [attachments] return self.success_response({"status": "Awaiting user response..."}) except Exception as e: return self.fail_response(f"Error asking user: {str(e)}") @openapi_schema({ "type": "function", "function": { "name": "web_browser_takeover", "description": "Request user takeover of browser interaction. Use this tool when: 1) The page requires complex human interaction that automated tools cannot handle, 2) Authentication or verification steps require human input, 3) The page has anti-bot measures that prevent automated access, 4) Complex form filling or navigation is needed, 5) The page requires human verification (CAPTCHA, etc.). IMPORTANT: This tool should be used as a last resort after web-search and crawl-webpage have failed, and when direct browser tools are insufficient. Always provide clear context about why takeover is needed and what actions the user should take.", "parameters": { "type": "object", "properties": { "text": { "type": "string", "description": "Instructions for the user about what actions to take in the browser. Include: 1) Clear explanation of why takeover is needed, 2) Specific steps the user should take, 3) What information to look for or extract, 4) How to indicate when they're done, 5) Any important context about the current page state." }, "attachments": { "anyOf": [ {"type": "string"}, {"items": {"type": "string"}, "type": "array"} ], "description": "(Optional) List of files or URLs to attach to the takeover request. Include when: 1) Screenshots or visual references are needed, 2) Previous search results or crawled content is relevant, 3) Supporting documentation is required. Always use relative paths to /workspace directory." } }, "required": ["text"] } } }) @xml_schema( tag_name="web-browser-takeover", mappings=[ {"param_name": "text", "node_type": "content", "path": "."}, {"param_name": "attachments", "node_type": "attribute", "path": ".", "required": False} ], example=''' I've encountered a CAPTCHA verification on the page. Please: 1. Solve the CAPTCHA puzzle 2. Let me know once you've completed it 3. I'll then continue with the automated process If you encounter any issues or need to take additional steps, please let me know. ''' ) async def web_browser_takeover(self, text: str, attachments: Optional[Union[str, List[str]]] = None) -> ToolResult: """Request user takeover of browser interaction. Args: text: Instructions for the user about what actions to take attachments: Optional file paths or URLs to attach to the request Returns: ToolResult indicating the takeover request was successfully sent """ try: # Convert single attachment to list for consistent handling if attachments and isinstance(attachments, str): attachments = [attachments] return self.success_response({"status": "Awaiting user browser takeover..."}) except Exception as e: return self.fail_response(f"Error requesting browser takeover: {str(e)}") # @openapi_schema({ # "type": "function", # "function": { # "name": "inform", # "description": "Inform the user about progress, completion of a major step, or important context. Use this tool: 1) To provide updates between major sections of work, 2) After accomplishing significant milestones, 3) When transitioning to a new phase of work, 4) To confirm actions were completed successfully, 5) To provide context about upcoming steps. IMPORTANT: Use FREQUENTLY throughout execution to provide UI context to the user. The user CANNOT respond to this tool - they can only respond to the 'ask' tool. Use this tool to keep the user informed without requiring their input.", # "parameters": { # "type": "object", # "properties": { # "text": { # "type": "string", # "description": "Information to present to the user. Include: 1) Clear statement of what has been accomplished or what is happening, 2) Relevant context or impact, 3) Brief indication of next steps if applicable." # }, # "attachments": { # "anyOf": [ # {"type": "string"}, # {"items": {"type": "string"}, "type": "array"} # ], # "description": "(Optional) List of files or URLs to attach to the information. Include when: 1) Information relates to specific files or resources, 2) Showing intermediate results or outputs, 3) Providing supporting documentation. Always use relative paths to /workspace directory." # } # }, # "required": ["text"] # } # } # }) # @xml_schema( # tag_name="inform", # mappings=[ # {"param_name": "text", "node_type": "content", "path": "."}, # {"param_name": "attachments", "node_type": "attribute", "path": ".", "required": False} # ], # example=''' # Inform the user about progress, completion of a major step, or important context. Use this tool: 1) To provide updates between major sections of work, 2) After accomplishing significant milestones, 3) When transitioning to a new phase of work, 4) To confirm actions were completed successfully, 5) To provide context about upcoming steps. IMPORTANT: Use FREQUENTLY throughout execution to provide UI context to the user. The user CANNOT respond to this tool - they can only respond to the 'ask' tool. Use this tool to keep the user informed without requiring their input." # # # # # # # # # # # I've completed the data analysis of the sales figures. Key findings include: # - Q4 sales were 28% higher than Q3 # - Product line A showed the strongest performance # - Three regions missed their targets # I'll now proceed with creating the executive summary report based on these findings. # # ''' # ) # async def inform(self, text: str, attachments: Optional[Union[str, List[str]]] = None) -> ToolResult: # """Inform the user about progress or important updates without requiring a response. # Args: # text: The information to present to the user # attachments: Optional file paths or URLs to attach # Returns: # ToolResult indicating the information was successfully sent # """ # try: # # Convert single attachment to list for consistent handling # if attachments and isinstance(attachments, str): # attachments = [attachments] # return self.success_response({"status": "Information sent"}) # except Exception as e: # return self.fail_response(f"Error informing user: {str(e)}") @openapi_schema({ "type": "function", "function": { "name": "complete", "description": "A special tool to indicate you have completed all tasks and are about to enter complete state. Use ONLY when: 1) All tasks in todo.md are marked complete [x], 2) The user's original request has been fully addressed, 3) There are no pending actions or follow-ups required, 4) You've delivered all final outputs and results to the user. IMPORTANT: This is the ONLY way to properly terminate execution. Never use this tool unless ALL tasks are complete and verified. Always ensure you've provided all necessary outputs and references before using this tool.", "parameters": { "type": "object", "properties": {}, "required": [] } } }) @xml_schema( tag_name="complete", mappings=[], example=''' ''' ) async def complete(self) -> ToolResult: """Indicate that the agent has completed all tasks and is entering complete state. Returns: ToolResult indicating successful transition to complete state """ try: return self.success_response({"status": "complete"}) except Exception as e: return self.fail_response(f"Error entering complete state: {str(e)}") if __name__ == "__main__": import asyncio async def test_message_tool(): message_tool = MessageTool() # Test question ask_result = await message_tool.ask( text="Would you like to proceed with the next phase?", attachments="summary.pdf" ) print("Question result:", ask_result) # Test inform inform_result = await message_tool.inform( text="Completed analysis of data. Processing results now.", attachments="analysis.pdf" ) print("Inform result:", inform_result) asyncio.run(test_message_tool())