Spaces:
Running
Running
Update app/sentiment.py
Browse files- app/sentiment.py +42 -123
app/sentiment.py
CHANGED
@@ -1,133 +1,52 @@
|
|
1 |
"""
|
2 |
-
|
3 |
|
4 |
-
This module
|
5 |
-
|
6 |
-
|
7 |
"""
|
8 |
-
import
|
9 |
-
import
|
10 |
-
import os
|
11 |
-
# ====================================================================
|
12 |
-
# FINAL FIX APPLIED HERE
|
13 |
-
# ====================================================================
|
14 |
-
# Import Optional and Union for Python 3.9 compatibility.
|
15 |
-
from typing import TypedDict, Union, Optional
|
16 |
-
# ====================================================================
|
17 |
|
18 |
-
|
19 |
-
import httpx
|
20 |
-
|
21 |
-
# --- Configuration & Models ---
|
22 |
-
|
23 |
-
# Configure logging for this module
|
24 |
-
logger = logging.getLogger(__name__)
|
25 |
-
|
26 |
-
# Define the expected structure of a result payload for type hinting
|
27 |
-
class SentimentResult(TypedDict):
|
28 |
-
id: int
|
29 |
-
text: str
|
30 |
-
# Using Union for Python 3.9 compatibility
|
31 |
-
result: dict[str, Union[str, float]]
|
32 |
-
|
33 |
-
|
34 |
-
# --- Main Class: SentimentAnalyzer ---
|
35 |
-
class SentimentAnalyzer:
|
36 |
"""
|
37 |
-
|
38 |
-
|
39 |
-
This class handles asynchronous API communication, manages a result queue for
|
40 |
-
Server-Sent Events (SSE), and encapsulates all related state and logic.
|
41 |
"""
|
42 |
-
|
43 |
-
|
44 |
-
|
45 |
-
|
46 |
-
|
47 |
-
|
48 |
-
|
49 |
-
|
50 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
51 |
"""
|
52 |
-
|
53 |
-
|
54 |
-
Args:
|
55 |
-
client: An instance of httpx.AsyncClient for making API calls.
|
56 |
-
api_token: The Hugging Face API token.
|
57 |
"""
|
58 |
-
self.
|
59 |
-
|
60 |
-
|
61 |
-
if not self.api_token:
|
62 |
-
raise ValueError("Hugging Face API token is not set. Please set the HF_API_TOKEN environment variable.")
|
63 |
|
64 |
-
self.headers = {"Authorization": f"Bearer {self.api_token}"}
|
65 |
-
|
66 |
-
# A queue is the ideal structure for a producer-consumer pattern,
|
67 |
-
# where the API endpoint is the producer and SSE streamers are consumers.
|
68 |
-
self.result_queue: asyncio.Queue[SentimentResult] = asyncio.Queue()
|
69 |
-
|
70 |
-
async def compute_and_publish(self, text: str, request_id: int) -> None:
|
71 |
-
"""
|
72 |
-
Performs sentiment analysis via an external API and places the result
|
73 |
-
into a queue for consumption by SSE streams.
|
74 |
-
|
75 |
-
Args:
|
76 |
-
text: The input text to analyze.
|
77 |
-
request_id: A unique identifier for this request.
|
78 |
-
"""
|
79 |
-
analysis_result: dict[str, Union[str, float]] = {"label": "ERROR", "score": 0.0, "error": "Unknown failure"}
|
80 |
try:
|
81 |
-
|
82 |
-
|
83 |
-
|
84 |
-
|
85 |
-
|
86 |
-
|
87 |
-
|
88 |
-
|
89 |
-
|
90 |
-
# Validate the expected response structure from the Inference API
|
91 |
-
if isinstance(data, list) and data and isinstance(data[0], list) and data[0]:
|
92 |
-
# The model returns a list containing a list of results
|
93 |
-
res = data[0][0]
|
94 |
-
analysis_result = {"label": res.get("label"), "score": round(res.get("score", 0.0), 4)}
|
95 |
-
logger.info("β
Sentiment computed for request #%d", request_id)
|
96 |
-
else:
|
97 |
-
raise ValueError(f"Unexpected API response format: {data}")
|
98 |
-
|
99 |
-
except httpx.HTTPStatusError as e:
|
100 |
-
error_msg = f"API returned status {e.response.status_code}"
|
101 |
-
logger.error("β Sentiment API error for request #%d: %s", request_id, error_msg)
|
102 |
-
analysis_result["error"] = error_msg
|
103 |
-
except httpx.RequestError as e:
|
104 |
-
error_msg = f"Network request failed: {e}"
|
105 |
-
logger.error("β Sentiment network error for request #%d: %s", request_id, error_msg)
|
106 |
-
analysis_result["error"] = error_msg
|
107 |
-
except (ValueError, KeyError) as e:
|
108 |
-
error_msg = f"Failed to parse API response: {e}"
|
109 |
-
logger.error("β Sentiment parsing error for request #%d: %s", request_id, error_msg)
|
110 |
-
analysis_result["error"] = error_msg
|
111 |
-
|
112 |
-
# Always publish a result to the queue, even if it's an error state
|
113 |
-
payload: SentimentResult = {
|
114 |
-
"id": request_id,
|
115 |
-
"text": text,
|
116 |
-
"result": analysis_result
|
117 |
-
}
|
118 |
-
await self.result_queue.put(payload)
|
119 |
-
|
120 |
-
    async def stream_results(self):  # Type hint removed for simplicity, was -> SentimentResult
        """
        An async generator that yields new results as they become available.
        This is the consumer part of the pattern.

        Yields:
            SentimentResult payloads taken from ``self.result_queue`` in FIFO
            order, one per iteration, blocking until an item is available.
        """
        while True:
            try:
                # This efficiently waits until an item is available in the queue
                result = await self.result_queue.get()
                yield result
                # Mark the item processed only after the consumer has resumed us;
                # if the consumer cancels during the yield, task_done() is skipped.
                self.result_queue.task_done()
            except asyncio.CancelledError:
                # NOTE(review): swallowing CancelledError ends the generator
                # instead of propagating cancellation; asyncio convention is to
                # re-raise after cleanup — confirm callers rely on the break.
                logger.info("Result stream has been cancelled.")
                break
|
|
|
1 |
"""
|
2 |
+
The Tier 1 Intelligence Sieve.
|
3 |
|
4 |
+
This module uses a locally-hosted, finance-optimized transformer model (FinBERT)
|
5 |
+
to perform initial, high-speed sentiment analysis. It acts as a gatekeeper,
|
6 |
+
only escalating high-conviction events to the more powerful Tier 2 analyst.
|
7 |
"""
|
8 |
+
from transformers import pipeline
|
9 |
+
from threading import Lock
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
10 |
|
11 |
+
class SentimentEngine:
    """
    A thread-safe, high-performance sentiment analysis engine using a local model.
    Implemented as a singleton to ensure the model is loaded only once.

    The heavy FinBERT pipeline is created exactly once, on the first call to
    ``SentimentEngine()``; subsequent calls return the same instance. If the
    model cannot be loaded, the engine stays usable and ``analyze`` degrades
    to a neutral fallback result instead of raising.
    """

    # The single shared instance (None until the first successful construction).
    _instance = None
    # Guards first-time initialization when multiple threads race to construct.
    _lock = Lock()

    def __new__(cls):
        """Return the process-wide singleton, building it on first use."""
        # Fast path: once the singleton exists, skip the lock entirely.
        if cls._instance is not None:
            return cls._instance
        with cls._lock:
            # Re-check inside the lock: another thread may have finished
            # initialization while we were waiting (double-checked locking).
            if cls._instance is None:
                print("🧠 [Tier 1] Initializing local sentiment model (FinBERT)... This may take a moment.")
                # Allocate BEFORE the try block so the except handler can never
                # dereference a still-None instance, and publish to
                # cls._instance only AFTER sentiment_pipeline is set, so no
                # thread can ever observe a half-built singleton.
                instance = super().__new__(cls)
                try:
                    # Using a model specifically fine-tuned on financial text for superior accuracy.
                    instance.sentiment_pipeline = pipeline(
                        "sentiment-analysis",
                        model="ProsusAI/finbert"
                    )
                    print("✅ [Tier 1] FinBERT model is online and ready.")
                except Exception as e:
                    # Degrade gracefully: analyze() checks for None and falls
                    # back to a neutral verdict rather than crashing callers.
                    print(f"❌ CRITICAL: Failed to load local FinBERT model. Tier 1 filtering will be disabled. Error: {e}")
                    instance.sentiment_pipeline = None
                cls._instance = instance
        return cls._instance

    def analyze(self, text: str) -> dict:
        """
        Analyzes text using the local model if available.
        Returns a dictionary with 'label' and 'score'.

        Args:
            text: The raw text to score.

        Returns:
            The first result dict from the pipeline (FinBERT labels are
            'positive', 'negative', 'neutral'), or a neutral fallback
            ``{"label": "neutral", "score": 0.0}`` when the model is
            unavailable or inference fails.
        """
        # Model failed to load at startup — neutral fallback keeps callers
        # from having to special-case a missing pipeline.
        if not self.sentiment_pipeline:
            return {"label": "neutral", "score": 0.0}
        try:
            # FinBERT labels are 'positive', 'negative', 'neutral'
            return self.sentiment_pipeline(text)[0]
        except Exception as e:
            print(f"Error in local sentiment analysis: {e}")
            return {"label": "neutral", "score": 0.0}
|
50 |
+
|
51 |
+
# Create a singleton instance that will be imported by the main app.
# NOTE(review): this calls SentimentEngine() at import time, so the FinBERT
# model is downloaded/loaded as a side effect of importing this module —
# confirm eager loading is intended, since it blocks the first importer.
LocalSentimentFilter = SentimentEngine()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|