Final_Assignment_Template

Sleeping

gdms committed on May 29

Commit

30944a6

1 Parent(s): 1542c35

Montagem arquitetura

Browse files

Files changed (16) hide show

.gitignore +0 -2
agent.py +55 -0
agent_util.py +43 -0
app.py +55 -0
audio_util.py +79 -0
constantes.py +30 -0
file_util.py +80 -0
image_util.py +85 -0
prompts.py +34 -0
question_files/cca530fc-4052-43b2-b130-b30968d8aa44.png +0 -0
question_files/f918266a-b3e0-4914-865d-4faa564f1aef.py +0 -35
requirements.txt +2 -1
tools.py +627 -0
video_util.py +31 -0
web_util.py +99 -0
wikipedia_util.py +133 -0

.gitignore CHANGED Viewed

@@ -1,5 +1,3 @@
-*.mp3
-*.xlsx
 video_analysis_output/
 get-pip.py
 *.m4a

 video_analysis_output/
 get-pip.py
 *.m4a

agent.py ADDED Viewed

	@@ -0,0 +1,55 @@

+from langgraph.prebuilt import create_react_agent
+from prompts import *
+from tools import *
+from langgraph_supervisor import create_supervisor
+from langchain.chat_models import init_chat_model
+import glob
+class Agent:
+    """
+        Multi-agent question answerer: a supervisor graph that can hand work to an
+        audio agent and a web research agent, and that also owns a set of direct tools.
+    """
+    def __init__(self):
+        """Create the two worker agents and compile the supervisor graph."""
+        print("Initializing Agent....")
+        print("--> Audio Agent")
+        self.audio_agent = create_react_agent(
+            model="openai:gpt-4o-mini",  # gpt-4o-mini-2024-07-18
+            tools=[extract_text_from_url_tool, extract_text_from_file_tool],
+            prompt= AUDIO_AGENT_PROMPT,
+            name="audio_agent",
+        )
+        print("--> Web Search Agent")
+        self.web_search_agent = create_react_agent(
+            model="openai:gpt-4o-mini",  # gpt-4o-mini-2024-07-18
+            tools=[search_web_tool],
+            prompt= WEB_SEARCH_AGENT_PROMPT,
+            name="web_research_agent",
+        )
+        print("--> Supervisor")
+        self.supervisor = create_supervisor(
+            model=init_chat_model("openai:gpt-4o-mini"),
+            agents=[self.web_search_agent, self.audio_agent],
+            tools=[bird_video_count_tool,chess_image_to_fen_tool,chess_fen_get_best_next_move_tool,
+                get_excel_columns_tool, calculate_excel_sum_by_columns_tool,execute_python_code_tool,
+                text_inverter_tool, check_table_commutativity_tool],
+            prompt= SUPERVISOR_PROMPT,
+            add_handoff_back_messages=True,
+            output_mode="full_history",
+        ).compile()
+        print("Agent initialized.")
+    # Declared static: the helper takes no `self`, yet __call__ invokes it through the
+    # instance. Without the decorator Python would pass the instance as an extra
+    # positional argument and the call would fail with a TypeError.
+    @staticmethod
+    def _exist_file_with_task_id(task_id: str) -> "str | None":
+        """
+            Look for a file named <task_id>.<any extension> inside AGENTS_FILES_PATH.
+            Args:
+                task_id: identifier used as the file name stem.
+            Returns:
+                The first path reported by glob, or None when nothing matches.
+        """
+        padrao = os.path.join(AGENTS_FILES_PATH, f"{task_id}.*")
+        arquivos_encontrados = glob.glob(padrao)
+        return arquivos_encontrados[0] if arquivos_encontrados else None
+    def __call__(self, question: str, task_id: str) -> str:
+        """
+            Answer a question. The current implementation is a placeholder: it logs the
+            question, looks up an attachment for the task and returns a fixed string.
+            Args:
+                question: question text (only the first 50 characters are logged).
+                task_id: identifier used to locate an attached file, if any.
+            Returns:
+                The fixed default answer.
+        """
+        print(f"Agent received question (first 50 chars): {question[:50]}...")
+        # TODO: the attachment path is looked up but not used by the placeholder answer yet.
+        task_file = self._exist_file_with_task_id(task_id)
+        fixed_answer = "This is a default answer."
+        print(f"Agent returning fixed answer: {fixed_answer}")
+        return fixed_answer

agent_util.py ADDED Viewed

	@@ -0,0 +1,43 @@

+from langchain_core.messages import convert_to_messages
+class Agent_Util:
+    """
+        Console helpers that print the updates streamed by a graph run.
+    """
+    @staticmethod
+    def pretty_print_message(message, indent=False):
+        """
+            Print a single message using its pretty_repr(html=True) rendering.
+            Args:
+                message: object exposing pretty_repr(html=...).
+                indent: when true, every rendered line is prefixed with a tab.
+        """
+        rendered = message.pretty_repr(html=True)
+        if indent:
+            rendered = "\n".join(f"\t{line}" for line in rendered.split("\n"))
+        print(rendered)
+    @staticmethod
+    def pretty_print_messages(update, last_message=False):
+        """
+            Print every node update contained in one streamed chunk.
+            Args:
+                update: either a mapping of node name to node update, or a
+                    (namespace, mapping) tuple for updates coming from a subgraph.
+                last_message: when true, only the last message of each node is printed.
+        """
+        from_subgraph = isinstance(update, tuple)
+        if from_subgraph:
+            namespace, update = update
+            # an empty namespace is a parent graph update: nothing is printed for it
+            if len(namespace) == 0:
+                return
+            subgraph_name = namespace[-1].split(":")[0]
+            print(f"Update from subgraph {subgraph_name}:")
+            print("\n")
+        label_prefix = "\t" if from_subgraph else ""
+        for node_name, node_update in update.items():
+            print(f"{label_prefix}Update from node {node_name}:")
+            print("\n")
+            node_messages = convert_to_messages(node_update["messages"])
+            if last_message:
+                node_messages = node_messages[-1:]
+            for node_message in node_messages:
+                Agent_Util.pretty_print_message(node_message, indent=from_subgraph)
+            print("\n")

app.py CHANGED Viewed

@@ -4,6 +4,61 @@ import requests
 import inspect
 import pandas as pd
 # (Keep Constants as is)
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"

 import inspect
 import pandas as pd
+import getpass
+import os
+import requests
+from typing import Tuple, List, Dict, Any, Optional, ClassVar, Literal
+import json
+import re
+import sys
+import io
+import traceback
+from contextlib import redirect_stdout, redirect_stderr
+from openai import OpenAI
+import pandas as pd
+#Multi-agent
+from langchain_tavily import TavilySearch, TavilyExtract
+from langgraph.prebuilt import create_react_agent
+from langgraph_supervisor import create_supervisor
+from langchain.chat_models import init_chat_model
+#langgraph
+from pydantic import BaseModel
+from langgraph.graph import START, StateGraph, MessagesState
+from langgraph.prebuilt import tools_condition, ToolNode
+from IPython.display import Image, display
+from langchain.tools import tool
+from langgraph.prebuilt import create_react_agent
+from langchain_core.messages import convert_to_messages
+from langsmith import utils
+#web tool
+from tavily import TavilyClient
+import markdownify
+import wikipediaapi
+from datetime import datetime, timezone
+import urllib.parse
+from bs4 import BeautifulSoup
+import time
+#audio
+import shutil
+import subprocess
+#video
+import cv2
+#imagem
+import base64
+import mimetypes
+from urllib.parse import urlparse, unquote
+import google.generativeai as genai
 # (Keep Constants as is)
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"

audio_util.py ADDED Viewed

	@@ -0,0 +1,79 @@

+import os
+import re
+import subprocess
+from openai import OpenAI
+from constantes import YOUTUBE_COOKIE_PATH
+from file_util import File_Util
+class Audio_Util:
+    """
+        Audio handling: download through yt-dlp and transcription through OpenAI Whisper.
+    """
+    @staticmethod
+    def download_audio_from_url(url: str, output_path: str, audio_file_name: str) -> str:
+        """
+            Download the audio track of a URL with yt-dlp.
+            Args:
+                url: audio/video URL
+                output_path: directory where the audio must be written
+                audio_file_name: file name (without extension) to use for the download
+            Returns:
+                Path of the first file listed in output_path after the download, or
+                False when the download fails (callers test the result for truthiness).
+        """
+        audio_path = f'{output_path}/{audio_file_name}.%(ext)s'
+        print(f"Baixando áudio de {url} para {audio_path}...")
+        try:
+            # yt-dlp is asked for the best m4a audio-only stream; no conversion is requested
+            command = [
+                'yt-dlp',
+                "--cookies", YOUTUBE_COOKIE_PATH,
+                '-f', 'bestaudio[ext=m4a]',
+                '-o', audio_path,
+                url
+            ]
+            subprocess.run(command, check=True, capture_output=True, text=True)
+            lista_arquivos = File_Util.retirar_sufixo_codec_arquivo(output_path)
+            # an empty directory means yt-dlp produced nothing usable: report failure
+            # instead of raising IndexError on lista_arquivos[0]
+            if not lista_arquivos:
+                print("Erro: nenhum arquivo de áudio foi encontrado após o download.")
+                return False
+            print("Download de áudio concluído com sucesso.")
+            return f"{output_path}/{lista_arquivos[0]}"
+        except subprocess.CalledProcessError as e:
+            print(f"Erro ao baixar o áudio: {e}")
+            print(f"Saída do erro: {e.stderr}")
+            return False
+        except FileNotFoundError:
+            print("Erro: O comando 'yt-dlp' não foi encontrado. Certifique-se de que ele está instalado e no PATH do sistema.")
+            return False
+    @staticmethod
+    def extract_text_from_audio_file(audio_path: str) -> str:
+        """
+            Transcribe an audio file with the OpenAI Whisper API.
+            The transcription is requested in SRT format and then the numeric cue
+            lines and the timestamp lines are dropped, keeping only the spoken text.
+            Args:
+                audio_path: path of the audio file to transcribe
+            Returns:
+                The transcribed text, or an empty string when anything fails.
+        """
+        client = OpenAI(api_key=os.getenv("OPENAI_API_KEY"))
+        try:
+            print(f"Iniciando transcrição (formato SRT simplificado): {audio_path}")
+            with open(audio_path, "rb") as audio_file:
+                transcription = client.audio.transcriptions.create(
+                    model="whisper-1",
+                    file=audio_file,
+                    response_format="srt"
+                )
+            # drop the cue-number lines and the "start --> end" timestamp lines
+            lines = transcription.splitlines()
+            only_text = [line.strip() for line in lines if not re.match(r"^\d+$", line) and "-->" not in line]
+            return "\n".join(only_text)
+        except Exception as e:
+            print(f"Erro ao transcrever áudio: {e}")
+            return ""

constantes.py ADDED Viewed

	@@ -0,0 +1,30 @@

+import os
+# API keys are read from the environment; each is None when the variable is unset.
+OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
+TAVILY_API_KEY = os.getenv("TAVILY_API_KEY")
+GEMINI_API_KEY = os.getenv("GEMINI_API_KEY")
+LANGCHAIN_API_KEY = os.getenv("LANGCHAIN_API_KEY")
+# Importing this module sets these two environment variables as a side effect.
+os.environ["LANGCHAIN_TRACING_V2"] = "true"
+os.environ["LANGCHAIN_PROJECT"] = "hf-final-assessment"
+# Audio working directory and file names.
+OUTPUT_AUDIO_PATH   ="./audio_analysis_output"
+AUDIO_FILENAME = "downloaded_audio"
+TRANSCRIPT_FILENAME = "transcript.txt"
+# Image working directory and file name (without extension).
+OUTPUT_IMAGE_PATH = "./image_analysis_output"
+IMAGE_FILE_NAME = "downloaded_image"
+# Video working directory and file name (without extension).
+OUTPUT_VIDEO_PATH = "./video_analysis_output"
+VIDEO_FILE_NAME = "downloaded_video"
+FRAME_INTERVAL_SECONDS = 0.5 # Interval between the frames to be extracted
+INICIO_FRAME_IMPORTANTE  = 191 # start of the relevant interval, to keep GPT inference from getting expensive
+FIM_FRAME_IMPORTANTE = 193# end of the relevant interval, to keep GPT inference from getting expensive
+# Cookie file handed to yt-dlp through its --cookies option.
+YOUTUBE_COOKIE_PATH = "./support/cookie-youtube.txt"
+# Model identifiers.
+GPT_IMAGE_MODEL = "gpt-4o"
+GEMINI_MODEL = "gemini-2.0-flash"
+# External chess endpoints. NOTE(review): the Chessvision URL uses plain http - confirm this is intended.
+CHESSVISION_TO_FEN_URL = "http://app.chessvision.ai/predict"
+CHESS_MOVE_API = "https://chess-api.com/v1"
+# Default directory searched for files attached to questions.
+AGENTS_FILES_PATH = "./files"

file_util.py ADDED Viewed

	@@ -0,0 +1,80 @@

+import os
+import re
+import shutil
+from typing import List
+from constantes import AGENTS_FILES_PATH
+class File_Util:
+    """
+        Directory and file handling helpers.
+    """
+    @staticmethod
+    def create_or_clear_output_directory(output_dir: str):
+        """
+            Create the output directory when it does not exist; otherwise empty it,
+            removing every file, link and sub-directory it contains.
+        """
+        if not os.path.exists(output_dir):
+            os.makedirs(output_dir)
+            print(f"Diretório criado: {output_dir}")
+            return
+        # The directory already exists: remove its entries one by one so that a
+        # failure on a single entry is reported without aborting the clean-up.
+        for entry_name in os.listdir(output_dir):
+            entry_path = os.path.join(output_dir, entry_name)
+            try:
+                if os.path.isfile(entry_path) or os.path.islink(entry_path):
+                    os.unlink(entry_path)
+                elif os.path.isdir(entry_path):
+                    shutil.rmtree(entry_path)
+            except Exception as e:
+                print(f"Erro ao excluir {entry_path}: {e}")
+        print(f"Diretório limpo: {output_dir}")
+    @staticmethod
+    def retirar_sufixo_codec_arquivo(directory: str) -> List[str]:
+        """
+            Downloaded audio/video files carry the codec embedded in their name
+            (a ".fNNN" part right before the extension), which makes it hard to know
+            the name of the file to process. This renames such files without that
+            part and returns the resulting name of every entry in the directory.
+        """
+        # ".f" + three digits, only when immediately followed by the final extension
+        codec_suffix = re.compile(r'\.f\d{3}(?=\.\w+$)')
+        cleaned_names = []
+        for original_name in os.listdir(directory):
+            cleaned_name = codec_suffix.sub('', original_name)
+            if cleaned_name != original_name:
+                os.rename(os.path.join(directory, original_name), os.path.join(directory, cleaned_name))
+                print(f"Renomeado: {original_name} → {cleaned_name}")
+            cleaned_names.append(cleaned_name)
+        return cleaned_names
+    @staticmethod
+    def tratar_arquivo_local(caminho_entrada: str) -> str:
+        """
+        Resolve a file reference to an existing path.
+        The path is returned unchanged when it points to an existing file; otherwise
+        its base name is looked up inside AGENTS_FILES_PATH.
+        Parameters:
+        - caminho_entrada (str): full path or bare file name.
+        Returns:
+        - str: a valid path to the file, or None when it was not found.
+        """
+        if not os.path.isfile(caminho_entrada):
+            # fall back to the default directory, using only the base name
+            fallback_path = os.path.join(AGENTS_FILES_PATH, os.path.basename(caminho_entrada))
+            return fallback_path if os.path.isfile(fallback_path) else None
+        return caminho_entrada

image_util.py ADDED Viewed

	@@ -0,0 +1,85 @@

+import base64
+import mimetypes
+import os
+from urllib.parse import unquote, urlparse
+import requests
+from file_util import File_Util
+class Image_Util:
+    """
+        Image handling helpers.
+    """
+    @staticmethod
+    def encode_image_to_base64(image_path: str) -> str:
+        """
+            Encode an image file as a base64 string.
+            Args:
+                image_path: path or bare file name, resolved through File_Util.tratar_arquivo_local.
+            Returns:
+                The base64 text, or None when the file cannot be found or read.
+        """
+        image_path_tratado = File_Util.tratar_arquivo_local(image_path)
+        if not image_path_tratado:
+            return None
+        try:
+            with open(image_path_tratado, "rb") as image_file:
+                return base64.b64encode(image_file.read()).decode('utf-8')
+        except FileNotFoundError:
+            print(f"Erro: Arquivo não encontrado em {image_path}")
+            return None
+        except Exception as e:
+            print(f"Erro ao codificar imagem {image_path} para base64: {e}")
+            return None
+    @staticmethod
+    def get_image_extension_from_url(url: str) -> str:
+        """
+        Return the image file extension based on the given URL.
+        Args:
+            url: image URL (may contain query parameters).
+        Returns:
+            File extension (e.g. 'jpg', 'png') or None when it cannot be identified.
+        """
+        path = unquote(urlparse(url).path)  # decode and keep only the path part of the URL
+        filename = os.path.basename(path)
+        _, ext = os.path.splitext(filename)
+        ext = ext.lower().lstrip('.')  # drop the leading dot
+        if ext in ['jpg', 'jpeg', 'png', 'gif', 'bmp', 'webp', 'tiff']:
+            return ext
+        # No known extension in the path: try to deduce it from the guessed MIME type
+        mime_type, _ = mimetypes.guess_type(url)
+        if mime_type and mime_type.startswith("image/"):
+            return mime_type.split("/")[1]  # e.g. 'image/png' -> 'png'
+        return None
+    @staticmethod
+    def download_image_from_url(url: str, output_path: str, image_file_name: str) -> str:
+        """
+            Download an image from a URL into output_path.
+            The output directory is created (or emptied) first.
+            Args:
+                url: image URL
+                output_path: directory where the image must be written
+                image_file_name: file name (without extension) to use for the download
+            Returns:
+                Path of the written file.
+            Raises:
+                Exception: when the server does not answer with status 200.
+        """
+        File_Util.create_or_clear_output_directory(output_path)
+        extension = Image_Util.get_image_extension_from_url(url)
+        # omit the suffix when the extension is unknown instead of writing a ".None" file
+        suffix = f'.{extension}' if extension else ''
+        image_path = f'{output_path}/{image_file_name}{suffix}'
+        # a timeout keeps an unresponsive server from blocking the call forever
+        response = requests.get(url, stream=True, timeout=30)
+        if response.status_code != 200:
+            raise Exception(f"Erro ao baixar imagem: {response.status_code} - {response.reason}")
+        # The original wrote to an undefined `save_path`; the file now goes to the
+        # path computed above, which is also the value returned to the caller.
+        with open(image_path, 'wb') as f:
+            for chunk in response.iter_content(1024):
+                f.write(chunk)
+        return image_path

prompts.py ADDED Viewed

	@@ -0,0 +1,34 @@

+# System prompt of the audio worker agent (passed as `prompt` when that agent is created).
+AUDIO_AGENT_PROMPT = (
+        "You are an audio agent.\n\n"
+        "INSTRUCTIONS:\n"
+        "- Assist ONLY with audio-related tasks, DO NOT do any math\n"
+        "- If you get an audio request related to a file, use the file name to call the tools, they know the path to find the file. \n"
+        "- Its tools can even extract text from videos on the internet \n"
+        "- After you're done with your tasks, respond to the supervisor directly\n"
+        "- Respond ONLY with the results of your work, do NOT include ANY other text."
+    )
+# System prompt of the web research worker agent.
+WEB_SEARCH_AGENT_PROMPT = (
+        "You are a web research agent.\n\n"
+        "INSTRUCTIONS:\n"
+        "- Assist ONLY with research-related tasks, DO NOT do any math\n"
+        "- After you're done with your tasks, respond to the supervisor directly\n"
+        "- Respond ONLY with the results of your work, do NOT include ANY other text."
+    )
+# System prompt of the supervisor: fixes the "FINAL ANSWER:" output template and
+# names the two worker agents (web_research_agent, audio_agent) it may delegate to.
+SUPERVISOR_PROMPT = (
+        """
+        You are a general AI assistant. I will ask you a question. Report your thoughts, and finish your answer with the following template:
+        FINAL ANSWER: [YOUR FINAL ANSWER]. YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings.
+        If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise.
+        If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise.
+        If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.
+        To assist in your task, you can supervise other agents who perform specific tasks that could not be handled by tools, since they require the processing of another LLM. Below, I will inform you about your assistants:
+        - web_research_agent. Assign web research related tasks to this agent
+        - audio_agent. Assign audio related tasks to this agent. This agent can extract text from videos in files or on the internet.
+        Assign work to one agent at a time, do not call agents in parallel.
+        Priorize the use of tools and another agents to help in reasoning.
+        When a file or URL is entered at the prompt, use it in tools or other agents, both are prepared to handle files and URLs.
+        When I inform a file in the format File:<file name> use the file name to invoke the tool, it will know how to treat it.
+        """
+    )

question_files/cca530fc-4052-43b2-b130-b30968d8aa44.png DELETED Viewed

Binary file (63.1 kB)

question_files/f918266a-b3e0-4914-865d-4faa564f1aef.py DELETED Viewed

@@ -1,35 +0,0 @@
-from random import randint
-import time
-class UhOh(Exception):
-    pass
-class Hmm:
-    def __init__(self):
-        self.value = randint(-100, 100)
-    def Yeah(self):
-        if self.value == 0:
-            return True
-        else:
-            raise UhOh()
-def Okay():
-    while True:
-        yield Hmm()
-def keep_trying(go, first_try=True):
-    maybe = next(go)
-    try:
-        if maybe.Yeah():
-            return maybe.value
-    except UhOh:
-        if first_try:
-            print("Working...")
-            print("Please wait patiently...")
-        time.sleep(0.1)
-        return keep_trying(go, first_try=False)
-if __name__ == "__main__":
-    go = Okay()
-    print(f"{keep_trying(go)}")

requirements.txt CHANGED Viewed

@@ -6,4 +6,5 @@ bs4
 tavily-python
 markdownify
 wikipedia-api
-yt-dlp

 tavily-python
 markdownify
 wikipedia-api
+yt-dlp
+ipython

tools.py ADDED Viewed

	@@ -0,0 +1,627 @@

+from contextlib import redirect_stderr, redirect_stdout
+import io
+import json
+import os
+import subprocess
+import traceback
+from typing import Dict, List, Literal, Optional
+import google.generativeai as genai
+import cv2
+import pandas as pd
+from pydantic import BaseModel
+import requests
+from audio_util import Audio_Util
+from constantes import *
+from file_util import File_Util
+from image_util import Image_Util
+from tavily import TavilyClient
+from web_util import Web_Util
+from wikipedia_util import Wikipedia_Historical_Page, Wikipedia_Util
+class Video_Util:
+    """
+        Video handling: download through yt-dlp.
+    """
+    # Declared static: the function takes no `self` and is called on the class.
+    @staticmethod
+    def download_video_from_url(url: str, output_path: str, video_file_name: str) -> str:
+        """
+            Download a video with yt-dlp.
+            Args:
+                url: video URL
+                output_path: directory where the video must be written
+                video_file_name: file name (without extension) to use for the download
+            Returns:
+                Path of the first file listed in output_path after the download, or
+                False when the download fails (callers test the result for truthiness).
+        """
+        video_path = f'{output_path}/{video_file_name}.%(ext)s'
+        print(f"Baixando vídeo de {url} para {video_path}...")
+        try:
+            # format selector: mp4 video + m4a audio, then any mp4, then whatever is best
+            command = [
+                'yt-dlp',
+                "--cookies", YOUTUBE_COOKIE_PATH,
+                '-f', 'bestvideo[ext=mp4]+bestaudio[ext=m4a]/best[ext=mp4]/best',
+                '-o', video_path,
+                url
+            ]
+            subprocess.run(command, check=True, capture_output=True, text=True)
+            lista_arquivos = File_Util.retirar_sufixo_codec_arquivo(output_path)
+            # an empty directory means yt-dlp produced nothing usable: report failure
+            # instead of raising IndexError on lista_arquivos[0]
+            if not lista_arquivos:
+                print("Erro: nenhum arquivo de vídeo foi encontrado após o download.")
+                return False
+            print("Download de vídeo concluído com sucesso.")
+            return f"{output_path}/{lista_arquivos[0]}"
+        except subprocess.CalledProcessError as e:
+            print(f"Erro ao baixar o vídeo: {e}")
+            print(f"Saída do erro: {e.stderr}")
+            return False
+        except FileNotFoundError:
+            print("Erro: O comando 'yt-dlp' não foi encontrado. Certifique-se de que ele está instalado e no PATH do sistema.")
+            print("Você pode instalá-lo com: pip install yt-dlp")
+            return False
+def execute_python_code_tool(code_path: str) -> str:
+    """
+        Execute code python informed in code_path param
+        Args:
+            code_path: Path to the python file.
+        Returns:
+            Execution result.
+    """
+    # NOTE(review): exec() runs the file inside this process with no sandboxing;
+    # only point this tool at files that are trusted.
+    resolved_path = File_Util.tratar_arquivo_local(code_path)
+    if not resolved_path:
+        return f"Erro: Arquivo não encontrado em {code_path}"
+    print(f"Executando código em {resolved_path}...")
+    captured_out, captured_err = io.StringIO(), io.StringIO()
+    try:
+        with open(resolved_path, 'r', encoding='utf-8') as source_file:
+            source_text = source_file.read()
+        # run as if it were the main script, capturing everything it prints
+        with redirect_stdout(captured_out), redirect_stderr(captured_err):
+            exec(source_text, {'__name__': '__main__'})
+    except Exception:
+        return f"[EXCEÇÃO DURANTE EXECUÇÃO]:\n{traceback.format_exc()}"
+    # anything written to stderr takes precedence over the captured stdout
+    stderr_text = captured_err.getvalue()
+    if stderr_text:
+        return f"[ERRO DE EXECUÇÃO]:\n{stderr_text}"
+    stdout_text = captured_out.getvalue()
+    return stdout_text if stdout_text.strip() else "[SEM SAÍDA]"
+def chess_image_to_fen_tool(image_path:str, current_player: Literal["black", "white"]) -> str:
+    """
+        Convert chess image to FEN (Forsyth-Edwards Notation) notation.
+        Args:
+            image_path: Path to the image file.
+            current_player: Whose turn it is to play. Must be either 'black' or 'white'.
+        Returns:
+            JSON with FEN (Forsyth-Edwards Notation) string representing the current board position.
+    """
+    print(f"Image to Fen invocada com os seguintes parametros:")
+    print(f"image_path: {image_path}")
+    print(f"current_player: {current_player}")
+    if current_player not in ["black", "white"]:
+        raise ValueError("current_player must be 'black' or 'white'")
+    base64_image = Image_Util.encode_image_to_base64(image_path)
+    if not base64_image:
+        raise ValueError("Failed to encode image to base64.")
+    base64_image_encoded =  f"data:image/jpeg;base64,{base64_image}"
+    url = CHESSVISION_TO_FEN_URL
+    payload = {
+        "board_orientation": "predict",
+        "cropped": False,
+        # forward the validated argument; it used to be hard-coded to "black"
+        "current_player": current_player,
+        "image": base64_image_encoded,
+        "predict_turn": False
+    }
+    # a timeout keeps an unresponsive service from blocking the call forever
+    response = requests.post(url, json=payload, timeout=60)
+    if response.status_code != 200:
+        raise Exception(f"Erro na requisição: {response.status_code}")
+    dados = response.json()
+    if not dados.get("success"):
+        raise Exception("Requisição feita, mas falhou na predição.")
+    print(f"Retorno Chessvision {dados}")
+    fen = dados.get("result")
+    if not fen:
+        # a successful answer without a result would otherwise fail on .replace below
+        raise Exception("Requisição feita, mas falhou na predição.")
+    fen = fen.replace("_", " ")  # the service returns "_" in place of blank spaces
+    return json.dumps({"fen": fen})
+def chess_fen_get_best_next_move_tool(fen: str, current_player: Literal["black", "white"]) -> str:
+    """
+        Return the best move in algebric notation.
+        Args:
+            fen: FEN (Forsyth-Edwards Notation) notation.
+        Returns:
+            Best move in algebric notation.
+    """
+    # current_player is validated but not sent: the request carries only the FEN and the depth
+    if not fen:
+        raise ValueError("fen must be provided.")
+    if current_player not in ("black", "white"):
+        raise ValueError("current_player must be 'black' or 'white'")
+    request_body = {"fen": fen, "depth": 1}
+    print(f"Buscando melhor jogada em {CHESS_MOVE_API} - {request_body}")
+    response = requests.post(CHESS_MOVE_API, json=request_body)
+    if response.status_code != 200:
+        raise Exception(f"Erro na requisição: {response.status_code}")
+    answer = response.json()
+    # "san" is what gets returned; "text" is only logged
+    best_move_san = answer.get("san")
+    print(f"Melhor jogada segundo chess-api.com -> {answer.get('text')}")
+    return best_move_san
+def extract_frames_from_video_to_files(url: str) -> List[str]:
+    """
+        Extract frames from a video and store them in temporary files.
+        The video is downloaded into OUTPUT_VIDEO_PATH and one frame is sampled every
+        FRAME_INTERVAL_SECONDS. Only the samples whose index lies between
+        INICIO_FRAME_IMPORTANTE and FIM_FRAME_IMPORTANTE (inclusive, and never below 5)
+        are written, as PNG files, into OUTPUT_IMAGE_PATH.
+        Args:
+            url: URL to the video.
+        Returns:
+            List of frame file paths (empty when the video cannot be opened).
+        Raises:
+            ValueError: when the video download fails.
+    """
+    File_Util.create_or_clear_output_directory(OUTPUT_VIDEO_PATH)
+    File_Util.create_or_clear_output_directory(OUTPUT_IMAGE_PATH)
+    video_download_file_name = Video_Util.download_video_from_url(url, OUTPUT_VIDEO_PATH, VIDEO_FILE_NAME)
+    if not video_download_file_name:
+        raise ValueError("Failed to download video.")
+    print(f"Extraindo frames de {video_download_file_name} a cada {FRAME_INTERVAL_SECONDS} segundos...")
+    if not os.path.exists(video_download_file_name):
+        print(f"Erro: Arquivo de vídeo não encontrado em {video_download_file_name}")
+        return []
+    extracted_frames_paths: List[str] = []
+    cap = cv2.VideoCapture(video_download_file_name)
+    try:
+        # check the capture before reading any property from it
+        if not cap.isOpened():
+            print(f"Erro ao abrir o arquivo de vídeo: {video_download_file_name}")
+            return []
+        width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
+        height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
+        print(f"Resolução original do vídeo: {width}x{height}")
+        fps = cap.get(cv2.CAP_PROP_FPS)
+        if fps == 0:
+            print("Erro: Não foi possível obter o FPS do vídeo. Usando FPS padrão de 30.")
+            fps = 30  # default used when the FPS cannot be read
+        # kept as a float so fractional intervals are honoured
+        frame_interval = fps * FRAME_INTERVAL_SECONDS
+        total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
+        print(f"Vídeo FPS: {fps:.2f}, Intervalo de frames: {frame_interval}, Total de frames: {total_frames}")
+        # Sample indexes start at 5 (offset past the introduction) and only the
+        # relevant window is processed, to avoid unnecessary inference cost.
+        # Iterating over a bounded range guarantees progress even when a frame
+        # cannot be written, which previously left the index stuck.
+        first_index = max(5, INICIO_FRAME_IMPORTANTE)
+        for saved_frame_index in range(first_index, FIM_FRAME_IMPORTANTE + 1):
+            target_frame_pos = int(saved_frame_index * frame_interval)
+            if target_frame_pos >= total_frames:
+                break  # the next target frame lies beyond the end of the video
+            cap.set(cv2.CAP_PROP_POS_FRAMES, target_frame_pos)
+            ret, frame = cap.read()
+            if not ret:
+                print(f"Não foi possível ler o frame na posição {target_frame_pos}. Pode ser o fim do vídeo ou um erro.")
+                break
+            timestamp_sec = target_frame_pos / fps
+            frame_filename = f"frame_{saved_frame_index:04d}_time_{timestamp_sec:.2f}s.png"
+            frame_path = os.path.join(OUTPUT_IMAGE_PATH, frame_filename)
+            try:
+                # compression level 0: frames are not resized or compressed, to preserve sharpness
+                written = cv2.imwrite(frame_path, frame, [cv2.IMWRITE_PNG_COMPRESSION, 0])
+            except Exception as e:
+                print(f"Erro ao salvar o frame {frame_path}: {e}")
+                continue  # move on to the next interval even if one frame fails
+            if not written:
+                # imwrite reports failure through its return value
+                print(f"Erro ao salvar o frame {frame_path}: imwrite retornou False")
+                continue
+            extracted_frames_paths.append(frame_path)
+            print(f"Frame salvo: {frame_path} (Timestamp: {timestamp_sec:.2f}s)")
+    finally:
+        # always release the capture, including on the early returns above
+        cap.release()
+    print(f"Extração de frames concluída. Total de frames salvos: {len(extracted_frames_paths)}")
+    return extracted_frames_paths
+def count_birds_species(image_path: str) -> int:
+    """
+        Ask the Gemini model how many distinct bird species appear in an image.
+        Args:
+            image_path: path of the image (frame) to analyse.
+        Returns:
+            The number reported by the model, or 0 when the image cannot be read,
+            the model call fails or the answer is not an integer.
+        Raises:
+            ValueError: when GEMINI_API_KEY is not defined.
+    """
+    import mimetypes  # local import: only this function needs it
+    bird_count_prompt = """You are a world-class expert in avian species classification. Analyze the provided image and determine how many
+                    **distinct bird species** are present. Consider size, shape, plumage, coloration, and beak structure. Focus only on
+                    visible morphological differences. Return a **single integer** with no explanation. Do not count individuals of the same species. '
+                    If unsure, assume that bird is a different specie."""
+    # the request goes to Gemini, so that is the key that must be present
+    if not GEMINI_API_KEY:
+        raise ValueError("GEMINI API KEY must be defined.")
+    base64_image = Image_Util.encode_image_to_base64(image_path)
+    if not base64_image:
+        print(f"Erro: não foi possível codificar a imagem {image_path}")
+        return 0
+    # declare the real image type (extracted frames are PNG); fall back to the previous default
+    mime_type = mimetypes.guess_type(image_path)[0] or "image/jpeg"
+    genai.configure(api_key=GEMINI_API_KEY)
+    model = genai.GenerativeModel(GEMINI_MODEL)
+    print(f"Enviando frame para análise no {GEMINI_MODEL}...")
+    try:
+        response = model.generate_content(
+            contents=[
+                {
+                    "role": "user",
+                    "parts": [
+                        {"text": bird_count_prompt},
+                        {"inline_data": {
+                            "mime_type": mime_type,
+                            "data": base64_image
+                        }}
+                    ]
+                }
+            ],
+            generation_config={
+                "temperature": 0.0,
+                "max_output_tokens": 500
+            })
+        analysis_result = response.text.strip()
+        print(f"Análise recebida: {analysis_result}")
+        return int(analysis_result)
+    except Exception as e:
+        # Keep the declared int contract: callers compare the result with ">",
+        # which would fail on the error dict that used to be returned here.
+        print(f"Erro ao chamar a API Gemini: {e}")
+        return 0
+def bird_video_count_tool(url: str) -> int:
+    """
+        Count different species of birds in a video.
+        Args:
+            url: URL to the video.
+        Returns:
+            Count of different species of birds.
+    """
+    frames_path_list = extract_frames_from_video_to_files(url)
+    if not frames_path_list:
+        raise ValueError("Failed to extract frames.")
+    # the answer is the largest per-frame count over all analysed frames
+    max_species: int = 0
+    for frame_path in frames_path_list:
+        species_count = count_birds_species(frame_path)
+        # Guard against a non-integer result (e.g. an error payload): comparing it
+        # with ">" would raise TypeError and abort the whole count.
+        if not isinstance(species_count, int):
+            print(f"Resultado inválido para o frame {frame_path}: {species_count}")
+            continue
+        max_species = max(max_species, species_count)
+    return max_species
+def extract_text_from_url_tool (audio_url:str) -> str:
+    """
+    Extracts text from an audio url using the OpenAI Whisper API.
+    Args:
+        audio_url: URL to the audio file.
+    Returns:
+        text extracted from the audio url.
+    """
+    if not audio_url:
+        raise ValueError("'audio_url'must be provided.")
+    if not OUTPUT_AUDIO_PATH:
+        raise ValueError("OUTPUT_AUDIO_PATH must be defined.")
+    File_Util.create_or_clear_output_directory(OUTPUT_AUDIO_PATH)
+    audio_download_file_name = Audio_Util.download_audio_from_url(audio_url, OUTPUT_AUDIO_PATH, AUDIO_FILENAME)
+    if not audio_download_file_name:
+        raise ValueError("Failed to download audio.")
+    transcript = Audio_Util.extract_text_from_audio_file(audio_download_file_name)
+    return transcript
+def extract_text_from_file_tool(audio_file_name:str) -> str:
+    """
+        Extracts text from an audio file using the OpenAI Whisper API.
+    Args:
+        audio_file_name: Name of the audio file.
+    Returns:
+        text extracted from the audio file.
+    """
+    if not audio_file_name and not audio_file_name:
+        raise ValueError(" 'audio_file_name' must be provided.")
+    if not OUTPUT_AUDIO_PATH:
+        raise ValueError("OUTPUT_AUDIO_PATH must be defined.")
+    treated_path = f"{AGENTS_FILES_PATH}/{audio_file_name}"
+    transcript = Audio_Util.extract_text_from_audio_file(treated_path)
+    return transcript
+# One page returned by the web-search tools in this module.
+class Search_Web_Result(BaseModel):
+    # Title of the page.
+    page_title: str
+    # URL the content was downloaded from.
+    page_url: str
+    # HTML of the page; the producers in this module leave it empty when
+    # Markdown conversion was requested.
+    page_html_content: str
+    # Markdown rendering of the page; empty when conversion was not requested.
+    page_markdown_content: str
+def search_web_tool(query: str,
+                    wikipedia_has_priority: bool,
+                    wikipedia_historical_date: Optional[str]=None,
+                    convert_to_markdown: bool=True
+                    ) -> List[Search_Web_Result]:
+    """
+    Searches the web for pages with the most relevant information about the topic, returning a list of Search_Web_Result (title, url, html content and markdown content)
+    Args:
+        query: The main topic or question to search for.
+        use_wikipedia_priority: If true, prioritize results from Wikipedia.
+        wikipedia_date: Optional date to fetch historical Wikipedia data.
+    Returns:
+        A list of URLs or page titles sorted by relevance.
+    """
+    return_list: List[Search_Web_Result] = []
+    try:
+        tavily = TavilyClient(api_key=TAVILY_API_KEY)
+    except Exception as e:
+        print(f"Erro ao inicializar o cliente Tavily: {e}")
+        raise
+    print(f"\n--- Realizando busca por '{query}' usando Tavily ---")
+    print(f"Prioridade para Wikipedia: {wikipedia_has_priority}")
+    print(f"Data para Wikipedia: {wikipedia_historical_date}")
+    print(f"Convertendo HTML para Markdown: {convert_to_markdown}")
+    try:
+        response = tavily.search(query=query, search_depth="basic", max_results=10)
+        search_results = response.get('results', [])
+    except Exception as e:
+        print(f"Erro ao realizar busca com Tavily: {e}")
+        raise
+    if not search_results:
+        print("Nenhum resultado encontrado pela busca Tavily.")
+        return []
+    if wikipedia_has_priority:
+        print("Prioridade para Wikipedia habilitada. Filtrando resultados Tavily por Wikipedia...")
+        return _processa_resultado_wikipedia(search_results, wikipedia_historical_date, convert_to_markdown)
+    urls_to_process = []
+    print("Usando os 5 primeiros resultados gerais.")
+    urls_to_process = [res['url'] for res in search_results[:5]]
+    print(f"\n--- Processando {len(urls_to_process)} URLs selecionadas ---")
+    for url in urls_to_process:
+        title, html_content = Web_Util.download_html(url)
+        if not title or not html_content:
+            raise AssertionError(f"Falha ao processar URL: {url}")
+        md_content = ""
+        if convert_to_markdown:
+            md_content = Web_Util.convert_html_to_markdown(title, html_content)
+            if not md_content:
+                raise AssertionError(f"Falha ao converter URL: {url}, html:{html_content}")
+        return_list.append(Search_Web_Result(
+            page_title=title,
+            page_url=url,
+            page_html_content=html_content if not convert_to_markdown else "",
+            page_markdown_content=md_content
+        ))
+    return return_list
+def _processa_resultado_wikipedia(search_results: List[str], wikipedia_historical_date: str,
+                                  convert_to_markdown:bool) -> List[Search_Web_Result]:
+    """
+    Trata do resultado de pesquisa quando existe prioridade para Wikipedia.
+    Args:
+        search_results: Lista com resultados da busca realizado pelo Tavily.
+        wikipedia_historical_date: A data para buscar uma revisão histórica da Wikipedia.
+        convert_to_markdown: Se true, converte o conteúdo HTML para Markdown.
+    Returns:
+        Lista com os resultados processados.
+    """
+    print("Prioridade para Wikipedia habilitada. Filtrando resultados Tavily por Wikipedia...")
+    wiki_urls = [res['url'] for res in search_results if Web_Util.is_wikipedia_url(res['url'])]
+    if not wiki_urls:
+        print("Nenhuma URL da Wikipedia encontrada nos resultados.")
+        return []
+    # Pega o primeiro resultado da Wikipedia
+    first_wiki_url = wiki_urls[0]
+    page_title_guess = first_wiki_url.split('/')[-1].replace('_', ' ')
+    page_check = Wikipedia_Util.wiki_executor.page(page_title_guess)
+    if not page_check.exists():
+        raise AssertionError(f"Página '{page_title_guess}' não encontrada na Wikipedia.")
+    page_title = None
+    page_url = None
+    if not wikipedia_historical_date:
+        page_title = page_title_guess
+        page_url = first_wiki_url
+    else:
+        # Busca revisão histórica
+        historical_wiki_info: Wikipedia_Historical_Page = Wikipedia_Util.get_wikipedia_page_historical_content(page_check.title, wikipedia_historical_date)
+        print(f"Dados da versão histórica wikipedia - {historical_wiki_info}")
+        page_title = historical_wiki_info.title
+        page_url = historical_wiki_info.url
+    title, html_content = Web_Util.download_html(page_url)
+    print(f"title {title}")
+    if not html_content:
+        raise AssertionError(f"Conteúdo da página {page_url} não foi baixado, não será possível continuar.")
+    md_content = ""
+    if convert_to_markdown:
+        md_content = Web_Util.convert_html_to_markdown(page_title, html_content)
+        if md_content and wikipedia_historical_date:
+            # Adiciona informação sobre a revisão no início do conteúdo (CORRIGIDO)
+            header = f"# Wikipedia Content for '{historical_wiki_info.title}'\n"
+            header += f"*Revision from {historical_wiki_info.timestamp} (ID: {historical_wiki_info.revision_id})*\n"
+            header += f"*Regarding search date: {wikipedia_historical_date}*\n\n"
+            header += "---\n\n"
+            md_content = header + md_content
+    return_list = [
+         Search_Web_Result(
+            page_title=page_title,
+            page_url=page_url,
+            page_html_content=html_content if not convert_to_markdown else "",
+            page_markdown_content=md_content
+        )
+    ]
+    return return_list
+def text_inverter_tool(text: str ) -> str:
+    """
+    Invert the text.
+    Args:
+        text: Text to be inverted.
+    Returns:
+        Inverted text.
+    """
+    return text[::-1]
+def parse_markdown_table_to_dict(markdown: str) -> dict:
+    """
+        Convert binary operation table in markdown format to a dictionary
+        Args:
+            markdown: table in markdown format
+    """
+    linhas = markdown.strip().split('\n')
+    # Remove barras verticais nas extremidades e divide pelas internas
+    cabecalho = [col.strip() for col in linhas[0].strip('|').split('|')]
+    colunas = cabecalho[1:]  # ignora o '*'
+    tabela = {}
+    for linha in linhas[2:]:  # pula cabeçalho e separador
+        partes = [p.strip() for p in linha.strip('|').split('|')]
+        linha_elem = partes[0]
+        valores = partes[1:]
+        if len(valores) != len(colunas):
+            raise ValueError(f"Erro ao processar linha '{linha_elem}': número de colunas incompatível.")
+        tabela[linha_elem] = dict(zip(colunas, valores))
+    return tabela
+def check_table_commutativity_tool(markdown: str) -> dict:
+    """
+        Check if the table in markdown format is commutative
+        Args:
+            table: table in markdown format
+    """
+    contraexemplos = []
+    elementos = set()
+    table = parse_markdown_table_to_dict(markdown)
+    for x in table:
+        for y in table:
+            if x != y and table[x][y] != table[y][x]:
+                contraexemplos.append((x, y))
+                elementos.update([x, y])
+    return {
+        "counter_example": contraexemplos,
+        "elements_involved": sorted(elementos)
+    }
+def get_excel_columns_tool(file_path: str) -> list[str]:
+    """
+        Get the columns of an Excel file.
+        Args:
+            file_path: Path to the Excel file.
+        Returns:
+            List of column names.
+    """
+    final_excel_path = File_Util.tratar_arquivo_local(file_path)
+    print(f"Extraindo as colunas do arquivo {file_path}")
+    df = pd.read_excel(final_excel_path, nrows=0)
+    return df.columns.tolist()
+def calculate_excel_sum_by_columns_tool(
+    file_path: str,
+    include_columns: list[str]
+) -> str:
+    """
+        Calculate the sum of values in specified columns of an Excel file.
+    Args:
+    - file_path: Path to the Excel file.
+    - include_columns: Columns included in the sum
+    """
+    final_excel_path = File_Util.tratar_arquivo_local(file_path)
+    print(f"Calculando soma de {include_columns} em {final_excel_path}")
+    df = pd.read_excel(final_excel_path)
+    total = df[include_columns].sum().sum()  # soma todas as colunas e depois soma os totais
+    return total

video_util.py ADDED Viewed

	@@ -0,0 +1,31 @@

+import subprocess
+from constantes import YOUTUBE_COOKIE_PATH
+from file_util import File_Util
+class Video_Util:
+    def download_video_from_url(url: str, output_path: str, video_file_name: str) -> str:
+        """Baixa o vídeo do YouTube usando yt-dlp."""
+        video_path = f'{output_path}/{video_file_name}.%(ext)s'
+        print(f"Baixando vídeo de {url} para {video_path}...")
+        try:
+            # Comando yt-dlp para baixar o melhor formato mp4
+            command = [
+                'yt-dlp',
+                "--cookies", YOUTUBE_COOKIE_PATH,
+                '-f', 'bestvideo[ext=mp4]+bestaudio[ext=m4a]/best[ext=mp4]/best',
+                '-o', video_path,
+                url
+            ]
+            result = subprocess.run(command, check=True, capture_output=True, text=True)
+            lista_arquivos = File_Util.retirar_sufixo_codec_arquivo(output_path)
+            print("Download de áudio concluído com sucesso.")
+            return f"{output_path}/{lista_arquivos[0]}"
+        except subprocess.CalledProcessError as e:
+            print(f"Erro ao baixar o vídeo: {e}")
+            print(f"Saída do erro: {e.stderr}")
+            return False
+        except FileNotFoundError:
+            print("Erro: O comando 'yt-dlp' não foi encontrado. Certifique-se de que ele está instalado e no PATH do sistema.")
+            print("Você pode instalá-lo com: pip install yt-dlp")
+            return False

web_util.py ADDED Viewed

	@@ -0,0 +1,99 @@

+from typing import Tuple
+from bs4 import BeautifulSoup
+import markdownify
+import requests
+class Web_Util:
+    HEADERS = {
+      'User-Agent': 'MyCoolSearchBot/1.0 ([email protected])'
+  }
+    @staticmethod
+    def is_wikipedia_url(url: str) -> bool:
+        """Verifica se uma URL pertence ao domínio da Wikipedia."""
+        return "wikipedia.org" in url.lower()
+    @staticmethod
+    def _limpar_html(html: str) -> Tuple[str, str]:
+        """
+            Remove tags <script>, <style> e atributos inline.
+            Args:
+                html: HTML a ser limpo.
+            Returns:
+                Titulo da pagina e html limpo.
+        """
+        soup = BeautifulSoup(html, 'html.parser')
+        # Extrai o título da página (primeiro tenta <title>, depois <h1>)
+        title_tag = soup.find('title')
+        title = title_tag.get_text(strip=True) if title_tag else None
+        # Remove tags <script> e <style>
+        for tag in soup(['script', 'style']):
+            tag.decompose()
+        # Remove tags <img>
+        for img in soup.find_all('img'):
+            img.decompose()
+        # Remove atributos que aplicam CSS ou JS inline
+        for tag in soup.find_all(True):
+            for attr in ['style', 'onclick', 'onmouseover', 'onload', 'class', 'id']:
+                if attr in tag.attrs:
+                    del tag.attrs[attr]
+        return title, str(soup)
+    @staticmethod
+    def download_html(url: str) -> Tuple[str, str]:
+        """
+            Baixa o conteúdo HTML de uma URL, retornando também o titulo.
+            Args:
+                url: URL a ser baixada.
+            Returns:
+                Uma tupla contendo o título e o conteúdo HTML.
+        """
+        print(f"Baixando e convertendo: {url}")
+        try:
+            response = requests.get(url, headers=Web_Util.HEADERS, timeout=20)
+            response.raise_for_status()  # Verifica se houve erro no request
+            # Tenta detectar a codificação, mas assume UTF-8 como fallback
+            response.encoding = response.apparent_encoding or 'utf-8'
+            html_content = response.text
+            # Usa readability para extrair o conteúdo principal
+            title, cleaned_html = Web_Util._limpar_html(html_content)
+            return title, cleaned_html
+        except requests.exceptions.RequestException as e:
+            print(f"Erro ao acessar a URL (requestException) {url}: {e}")
+            return None
+        except Exception as e:
+            print(f"Erro ao acessar a URL (erro genérico) {url}: {e}")
+            return None
+    @staticmethod
+    def convert_html_to_markdown(title: str, html: str) -> str:
+        """Converte o html para markdown."""
+        try:
+            md_content = markdownify.markdownify(
+                html,
+                heading_style="ATX",
+                strip=['script', 'style'],
+                escape_underscores=False)
+            return f"# {title}\n\n" + md_content.strip()
+        except Exception as e:
+            print(f"Erro ao converter HTML para Markdown: {e}")
+            return None
+        @staticmethod
+        def download_html_and_convert_to_md(url: str) -> str:
+            """Baixa o conteúdo HTML de uma URL e o converte para Markdown."""
+            title, html = Web_Util.download_html(url)
+            if title and html:
+                return Web_Util.convert_html_to_markdown(title)
+            else:
+                return None

wikipedia_util.py ADDED Viewed

	@@ -0,0 +1,133 @@

+from datetime import datetime, timezone
+from typing import Tuple
+import urllib
+from gradio import List
+from pydantic import BaseModel
+import requests
+import wikipediaapi
+# Reference to one specific historical revision of a Wikipedia page.
+class Wikipedia_Historical_Page(BaseModel):
+    # Title of the page the revision belongs to.
+    title: str
+    # URL that addresses the revision.
+    url: str
+    # Revision identifier, stored as a string.
+    revision_id: str
+    # Timestamp of the revision.
+    timestamp: str
+class Wikipedia_Util:
+    WIKI_LANG = 'en' # Linguagem da Wikipedia (atualizado para inglês)
+    MEDIAWIKI_API_URL = f"https://{WIKI_LANG}.wikipedia.org/w/api.php"
+    HEADERS = {
+        'User-Agent': 'MyCoolSearchBot/1.0 ([email protected])'
+    }
+    wiki_executor = wikipediaapi.Wikipedia(
+        language=WIKI_LANG,
+        extract_format=wikipediaapi.ExtractFormat.HTML, # Usado apenas para page.exists()
+        user_agent='MyCoolSearchBot/1.0 ([email protected])' # Definir um User-Agent é boa prática
+        )
+    @staticmethod
+    def get_wikipedia_revision_info(page_title: str, target_date_str: str) -> Tuple[str,str]:
+        """
+        Busca o ID e timestamp da revisão mais próxima (<=) da data fornecida via API MediaWiki.
+            Args:
+                page_title: wikipedia encontra páginas históricas pelo titulo
+                target_date_str: data no formato "YYYY-MM-DD"
+            Returns:
+                Uma tupla contendo o ID da revisão e o timestamp da revisão.
+        """
+        try:
+            # Converte a data string para um objeto datetime e formata para ISO 8601 com Z (UTC)
+            target_dt = datetime.strptime(target_date_str, '%Y-%m-%d')
+            # Precisamos do final do dia para garantir que incluímos todas as revisões daquele dia
+            target_dt_end_of_day = target_dt.replace(hour=23, minute=59, second=59, tzinfo=timezone.utc)
+            target_timestamp_iso = target_dt_end_of_day.strftime('%Y-%m-%dT%H:%M:%SZ')
+        except ValueError:
+            print("Formato de data inválido. Use AAAA-MM-DD.")
+            return None, None
+        params = {
+            "action": "query",
+            "prop": "revisions",
+            "titles": page_title,
+            "rvlimit": 1,
+            "rvdir": "older", # Busca a revisão imediatamente anterior ou igual ao timestamp
+            "rvprop": "ids|timestamp", # Queremos o ID da revisão e o timestamp
+            "rvstart": target_timestamp_iso, # Começa a busca a partir desta data/hora
+            "format": "json",
+            "formatversion": 2 # Formato JSON mais moderno e fácil de parsear
+        }
+        try:
+            print(f"Consultando API MediaWiki para revisão de '{page_title}' em {target_date_str}...")
+            response = requests.get(Wikipedia_Util.MEDIAWIKI_API_URL, params=params, headers=Wikipedia_Util.HEADERS, timeout=15)
+            response.raise_for_status()
+            data = response.json()
+            # Verifica se a página foi encontrada
+            page_data = data.get("query", {}).get("pages", [])
+            if not page_data or page_data[0].get("missing", False):
+                print(f"Página '{page_title}' não encontrada na API MediaWiki.")
+                # Tenta verificar com a biblioteca wikipediaapi como fallback (pode pegar redirecionamentos)
+                page = Wikipedia_Util.wiki_executor.page(page_title)
+                if page.exists():
+                    print(f"Página '{page_title}' existe (possivelmente redirecionada para '{page.title}'). Tentando novamente com o título canônico...")
+                    return Wikipedia_Util.get_wikipedia_revision_info(page.title, target_date_str) # Chama recursivamente com o título correto
+                else:
+                    print(f"Página '{page_title}' realmente não encontrada.")
+                    return None, None
+            # Extrai as revisões
+            revisions = page_data[0].get("revisions", [])
+            if not revisions:
+                print(f"Nenhuma revisão encontrada para '{page_title}' antes ou em {target_date_str}.")
+                # Pode acontecer se a página foi criada depois da data alvo
+                return None, None
+            revision = revisions[0]
+            revid = revision.get("revid")
+            timestamp = revision.get("timestamp")
+            print(f"Encontrada revisão: ID={revid}, Timestamp={timestamp}")
+            return revid, timestamp
+        except requests.exceptions.RequestException as e:
+            print(f"Erro ao chamar a API MediaWiki: {e}")
+            return None, None
+        except Exception as e:
+            print(f"Erro ao processar resposta da API MediaWiki: {e}")
+            return None, None
+    @staticmethod
+    def get_wikipedia_page_historical_content(page_title: str, target_date_str: str) -> List[Wikipedia_Historical_Page]:
+        """Obtém o conteúdo Markdown de uma revisão histórica específica da Wikipedia."""
+        # Busca o ID da revisão correta usando a API MediaWiki
+        revid, timestamp = Wikipedia_Util.get_wikipedia_revision_info(page_title, target_date_str)
+        if not revid:
+            print(f"Não foi poss��vel encontrar uma revisão adequada para '{page_title}' em {target_date_str}.")
+            return None
+        # Constrói a URL para a revisão específica
+        # Nota: Codifica o título da página para a URL
+        # Precisamos garantir que estamos usando o título correto (pode ter sido redirecionado)
+        page_check = Wikipedia_Util.wiki_executor.page(page_title) # Verifica novamente para obter o título canônico se houve redirecionamento
+        if not page_check.exists():
+            print(f"Erro inesperado: Página '{page_title}' não encontrada após busca de revisão.")
+            return None
+        canonical_title = page_check.title
+        encoded_title = urllib.parse.quote(canonical_title.replace(' ', '_'))
+        revision_url = f"https://{Wikipedia_Util.WIKI_LANG}.wikipedia.org/w/index.php?title={encoded_title}&oldid={revid}"
+        return Wikipedia_Historical_Page(
+            title=canonical_title,
+            url=revision_url,
+            revision_id=str(revid), #parametro obrigatoriamente string
+            timestamp=timestamp
+        )