Spaces:

habulaj
/

newapi-clone

Running

App Files Files Community

habulaj committed 2 days ago

Commit

f83678a

verified ·

1 Parent(s): fbd0ae7

Update routers/searchterm.py

Browse files

Files changed (1) hide show

routers/searchterm.py +102 -1

routers/searchterm.py CHANGED Viewed

@@ -5,10 +5,16 @@ import asyncio
 import httpx
 import aiohttp
 import trafilatura
 from urllib.parse import urlparse
 from typing import List, Dict, Any, Optional
 from fastapi import APIRouter, HTTPException, Body
 from newspaper import Article
 router = APIRouter()
@@ -34,6 +40,13 @@ BLOCKED_DOMAINS = {"reddit.com", "www.reddit.com", "old.reddit.com",
 MAX_TEXT_LENGTH = 4000
 def is_blocked_domain(url: str) -> bool:
     try:
@@ -60,6 +73,44 @@ def get_realistic_headers() -> Dict[str, str]:
     }
 async def search_brave_term(client: httpx.AsyncClient, term: str) -> List[Dict[str, str]]:
     params = {"q": term, "count": 10, "safesearch": "off", "summary": "false"}
@@ -180,4 +231,54 @@ async def search_terms(payload: Dict[str, List[str]] = Body(...)) -> Dict[str, A
             else:
                 final_results = []
-    return {"results": final_results}

 import httpx
 import aiohttp
 import trafilatura
+import json
+import uuid
+import time
+from pathlib import Path
 from urllib.parse import urlparse
 from typing import List, Dict, Any, Optional
 from fastapi import APIRouter, HTTPException, Body
+from fastapi.responses import FileResponse
 from newspaper import Article
+from threading import Timer
 router = APIRouter()
 MAX_TEXT_LENGTH = 4000
+# Directory where temporary files are written
+TEMP_DIR = Path("/tmp")
+TEMP_DIR.mkdir(exist_ok=True)
+# Registry of temporary files, keyed by file id
+temp_files = {}
 def is_blocked_domain(url: str) -> bool:
     try:
     }
+def delete_temp_file(file_id: str, file_path: Path) -> None:
+    """Delete an expired temporary file and drop it from the registry.
+
+    Intended to run on the ``threading.Timer`` thread scheduled by
+    ``create_temp_file``, so it never raises: filesystem errors are
+    reported with ``print`` instead.
+
+    Args:
+        file_id: Key of the entry in ``temp_files``.
+        file_path: Location of the file on disk.
+    """
+    # Drop the registry entry first and unconditionally: even if the file
+    # cannot be deleted, it has expired and must stop being served.
+    temp_files.pop(file_id, None)
+    try:
+        # Attempt the delete directly instead of checking exists() first,
+        # which would leave a window for the file to vanish in between.
+        file_path.unlink()
+    except FileNotFoundError:
+        # Already gone; the end state is the one we wanted.
+        pass
+    except OSError as e:
+        print(f"Erro ao remover arquivo temporário: {e}")
+        return
+    print(f"Arquivo temporário removido: {file_path}")
+def create_temp_file(data: Dict[str, Any]) -> Dict[str, Any]:
+    """Write ``data`` as JSON to a new temporary file and schedule its removal.
+
+    Args:
+        data: JSON-serializable payload to persist.
+
+    Returns:
+        A dict with the generated ``file_id``, the relative
+        ``download_url`` and ``expires_in_hours``.
+
+    Raises:
+        OSError: If the file cannot be written.
+        TypeError: If ``data`` contains values that are not JSON-serializable.
+        ValueError: If ``data`` contains circular references.
+    """
+    file_id = str(uuid.uuid4())
+    file_path = TEMP_DIR / f"fontes_{file_id}.txt"
+    # Save the JSON to the file
+    try:
+        with open(file_path, 'w', encoding='utf-8') as f:
+            json.dump(data, f, ensure_ascii=False, indent=2)
+    except Exception:
+        # Do not leave a truncated file behind that nothing tracks or expires.
+        try:
+            file_path.unlink()
+        except OSError:
+            pass
+        raise
+    # Schedule removal in 24 hours (86400 seconds)
+    timer = Timer(86400, delete_temp_file, args=[file_id, file_path])
+    # Daemon thread: a pending 24-hour timer must not block process shutdown.
+    timer.daemon = True
+    # Register the entry before starting the timer so it is always present
+    # by the time the timer callback can run.
+    temp_files[file_id] = {
+        "path": file_path,
+        "created_at": time.time(),
+        "timer": timer,
+    }
+    timer.start()
+    return {
+        "file_id": file_id,
+        "download_url": f"/download-temp/{file_id}",
+        "expires_in_hours": 24,
+    }
 async def search_brave_term(client: httpx.AsyncClient, term: str) -> List[Dict[str, str]]:
     params = {"q": term, "count": 10, "safesearch": "off", "summary": "false"}
             else:
                 final_results = []
+    # Cria o JSON final
+    result_data = {"results": final_results}
+    # Cria arquivo temporário
+    temp_file_info = create_temp_file(result_data)
+    return {
+        "message": "Dados salvos em arquivo temporário",
+        "total_results": len(final_results),
+        "file_info": temp_file_info
+    }
+@router.get("/download-temp/{file_id}")
+async def download_temp_file(file_id: str):
+    """Serve a previously created temporary file as a download.
+
+    Args:
+        file_id: Identifier returned when the temporary file was created.
+
+    Returns:
+        A ``FileResponse`` that sends the file as ``fontes.txt``.
+
+    Raises:
+        HTTPException: 404 if the id is not registered or the file is no
+            longer on disk.
+    """
+    # Single lookup: the cleanup timer runs on another thread and may remove
+    # the entry at any time, so a separate "in" check followed by indexing
+    # could raise KeyError and surface as a 500.
+    file_info = temp_files.get(file_id)
+    if file_info is None:
+        raise HTTPException(status_code=404, detail="Arquivo não encontrado ou expirado")
+    file_path = file_info["path"]
+    if not file_path.exists():
+        # The file disappeared without going through the registry; forget it.
+        temp_files.pop(file_id, None)
+        raise HTTPException(status_code=404, detail="Arquivo não encontrado")
+    return FileResponse(
+        path=str(file_path),
+        filename="fontes.txt",
+        media_type="text/plain",
+        headers={"Content-Disposition": "attachment; filename=fontes.txt"}
+    )
+@router.get("/temp-files/status")
+async def get_temp_files_status():
+    """Report age, remaining lifetime and on-disk presence of each temporary file (debug).
+
+    Returns:
+        ``{"temp_files": {file_id: {"age_hours", "remaining_hours", "exists"}}}``
+        where the remaining time is measured against the 24-hour expiry.
+    """
+    status = {}
+    current_time = time.time()
+    # Iterate over a snapshot: cleanup timers pop entries from another
+    # thread, and mutating a dict during iteration raises RuntimeError.
+    for file_id, info in list(temp_files.items()):
+        age_hours = (current_time - info["created_at"]) / 3600
+        remaining_hours = max(0, 24 - age_hours)
+        status[file_id] = {
+            "age_hours": round(age_hours, 2),
+            "remaining_hours": round(remaining_hours, 2),
+            "exists": info["path"].exists(),
+        }
+    return {"temp_files": status}