Spaces:

Agents-MCP-Hackathon
/

TDAgentTools

Runtime error

App Files Files Community

pedrobento988 committed on Jun 5

Commit

f1d068a

verified ·

1 Parent(s): 0efeabf

Add RDAP tool (#6)

Browse files

- feat: Add RDAP tool (b7c5e0bed5b4dcd56ecb5e31f60107b517b49002)

Files changed (5) hide show

app.py +7 -2
pyproject.toml +1 -0
tdagent/constants.py +8 -0
tdagent/tools/get_url_content.py +1 -7
tdagent/tools/rdap.py +109 -0

app.py CHANGED Viewed

@@ -8,9 +8,12 @@ from tdagent.tools.lookup_company_cloud_account_information import (
     gr_lookup_company_cloud_account_information,
 )
 from tdagent.tools.query_abuse_ip_db import gr_query_abuseipdb
 from tdagent.tools.send_email import gr_send_email
 from tdagent.tools.virus_total import gr_virus_total_url_info
-from tdagent.tools.whois import gr_query_whois
 ## Tools to load into the application interface ##
@@ -26,7 +29,9 @@ class ToolInfo(NamedTuple):
 TOOLS = (
     ToolInfo("Get URL Content", gr_get_url_http_content),
     ToolInfo("Query AbuseIPDB", gr_query_abuseipdb),
-    ToolInfo("Query WHOIS", gr_query_whois),
     ToolInfo("Virus Total URL info", gr_virus_total_url_info),
     ## Fake tools
     ToolInfo("Fake company directory", gr_internal_company),

     gr_lookup_company_cloud_account_information,
 )
 from tdagent.tools.query_abuse_ip_db import gr_query_abuseipdb
+from tdagent.tools.rdap import gr_query_rdap
 from tdagent.tools.send_email import gr_send_email
 from tdagent.tools.virus_total import gr_virus_total_url_info
+# from tdagent.tools.whois import gr_query_whois
 ## Tools to load into the application interface ##
 TOOLS = (
     ToolInfo("Get URL Content", gr_get_url_http_content),
     ToolInfo("Query AbuseIPDB", gr_query_abuseipdb),
+    # Whois does not work from Spaces (port 43 blocked)
+    # ToolInfo("Query WHOIS", gr_query_whois),
+    ToolInfo("Query RDAP", gr_query_rdap),
     ToolInfo("Virus Total URL info", gr_virus_total_url_info),
     ## Fake tools
     ToolInfo("Fake company directory", gr_internal_company),

pyproject.toml CHANGED Viewed

@@ -128,4 +128,5 @@ convention = "google"
 [tool.ruff.lint.per-file-ignores]
 "*/__init__.py" = ["F401"]
 "tdagent/cli/**/*.py" = ["D103", "T201"]
 "tests/*.py" = ["D103", "PLR2004", "S101"]

 [tool.ruff.lint.per-file-ignores]
 "*/__init__.py" = ["F401"]
 "tdagent/cli/**/*.py" = ["D103", "T201"]
+"tdagent/tools/rdap.py" = ["PLR2004"]
 "tests/*.py" = ["D103", "PLR2004", "S101"]

tdagent/constants.py ADDED Viewed

	@@ -0,0 +1,8 @@

+import enum
+class HttpContentType(str, enum.Enum):
+    """HTTP content type (MIME type) values.
+
+    Members also subclass ``str``, so they compare equal to their plain
+    string value (e.g. ``HttpContentType.JSON == "application/json"``).
+    """
+    HTML = "text/html"
+    JSON = "application/json"

tdagent/tools/get_url_content.py CHANGED Viewed

@@ -1,15 +1,9 @@
-import enum
 from collections.abc import Sequence
 import gradio as gr
 import requests
-class HttpContentType(str, enum.Enum):
-    """Http content type values."""
-    HTML = "text/html"
-    JSON = "application/json"
 def get_url_http_content(

 from collections.abc import Sequence
 import gradio as gr
 import requests
+from tdagent.constants import HttpContentType
 def get_url_http_content(

tdagent/tools/rdap.py ADDED Viewed

	@@ -0,0 +1,109 @@

+import enum
+import cachetools
+import gradio as gr
+import requests
+import whois
+from tdagent.constants import HttpContentType
+# RDAP.org lookup URL. ``rdap_type`` is one of domain, ip, autnum, entity, etc.
+# and ``rdap_object`` is the resource to look up for that type.
+_RDAP_URL_TEMPLATE = r"https://rdap.org/{rdap_type}/{rdap_object}"
+_CACHE_MAX_SIZE = 4096  # max number of entries kept in the query TTL cache
+_CACHE_TTL_SECONDS = 3600  # cached query results expire after one hour
+class RdapTypes(str, enum.Enum):
+    """RDAP object types.
+
+    Each value is the path segment used to select the object type in an
+    RDAP query URL. Interpolate ``member.value`` (not the member itself)
+    when building strings, so the result does not depend on how the
+    running Python version formats enum members.
+    """
+    DOMAIN = "domain"
+    IP = "ip"
+    AUTNUM = "autnum"
+    ENTITY = "entity"
+@cachetools.cached(
+    cache=cachetools.TTLCache(maxsize=_CACHE_MAX_SIZE, ttl=_CACHE_TTL_SECONDS),
+)
+def query_rdap(  # noqa: PLR0911
+    url_or_ip: str,
+    timeout: int = 30,
+) -> dict[str, str | int | float]:
+    """Query RDAP to get information about Internet resources.
+    The Registration Data Access Protocol (RDAP) is the successor to WHOIS.
+    Like WHOIS, RDAP provides access to information about Internet resources
+    (domain names, autonomous system numbers, and IP addresses).
+    Args:
+        url_or_ip: URL, domain or IP to query for RDAP information.
+        timeout: Request timeout in seconds. Defaults to 30.
+    Returns:
+        A JSON formatted string with RDAP information. In there is
+        an error, the JSON will contain the key "error" with an
+        error message.
+    """
+    rdap_type = RdapTypes.DOMAIN
+    rdap_object = url_or_ip
+    if whois.IPV4_OR_V6.match(url_or_ip):
+        rdap_type = RdapTypes.IP
+    else:
+        rdap_object = whois.extract_domain(url_or_ip)
+    query_url = _RDAP_URL_TEMPLATE.format(rdap_type=rdap_type, rdap_object=rdap_object)
+    response = requests.get(
+        query_url,
+        timeout=timeout,
+        headers={"Accept": HttpContentType.JSON},
+    )
+    try:
+        response.raise_for_status()
+    except requests.HTTPError as err:
+        if err.response.status_code == 302:
+            if "Location" in err.response.headers:
+                return {
+                    "message": "Follow the location to find RDAP information",
+                    "location": err.response.headers["Location"],
+                }
+            return {
+                "error": (
+                    "Information not found in RDAP.org but it knows of"
+                    " a service which is authoritative for the requested resource."
+                ),
+            }
+        if err.response.status_code == 400:
+            return {
+                "error": (
+                    "Invalid request (malformed path, unsupported object "
+                    " type, invalid IP address, etc)"
+                ),
+            }
+        if err.response.status_code == 403:
+            return {
+                "error": "You've been blocked due to abuse or other misbehavior",
+            }
+        if err.response.status_code == 404:
+            return {
+                "error": (
+                    "RDAP.org doesn't know of an RDAP service which is"
+                    " authoritative for the requested resource. RDAP.org"
+                    " only knows about servers that are registered with IANA"
+                ),
+            }
+        return {
+            "error": str(err),
+        }
+    return response.json()
+# Gradio interface exposing ``query_rdap``. Only one text input is declared
+# (the resource to look up), so ``timeout`` keeps its default value; the
+# returned dictionary is rendered as JSON.
+gr_query_rdap = gr.Interface(
+    fn=query_rdap,
+    inputs=["text"],
+    outputs="json",
+    title="Get RDAP information for a given URL.",
+    description="Query a RDAP database to gather information about a url or domain.",
+)