MUFASA25 committed
Commit 09b3e31 · verified · 1 Parent(s): cc8ce94

simplest form

Files changed (1):
  1. app.py +91 -222
app.py CHANGED
Old version (removed lines are marked with "-"):

@@ -2,91 +2,67 @@ import gradio as gr
  import torch
  from transformers import AutoTokenizer, AutoModelForSequenceClassification
  import logging
- import numpy as np

- # Configure logging
  logging.basicConfig(level=logging.INFO)
  logger = logging.getLogger(__name__)

  # Model configuration
  MODEL_NAME = "cybersectony/phishing-email-detection-distilbert_v2.4.1"

  # Global variables for model and tokenizer
  tokenizer = None
  model = None

  def load_model():
-     """Load the model and tokenizer with error handling"""
      global tokenizer, model
      try:
-         logger.info("Loading model and tokenizer...")
          tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
          model = AutoModelForSequenceClassification.from_pretrained(MODEL_NAME)
-
-         # Debug: Print model configuration
-         logger.info(f"Model config: {model.config}")
-         logger.info(f"Number of labels: {model.config.num_labels}")
-         if hasattr(model.config, 'id2label'):
-             logger.info(f"Label mapping: {model.config.id2label}")
-
-         # Test model with simple input to check if it's working
-         test_input = "Hello world"
-         inputs = tokenizer(test_input, return_tensors="pt", truncation=True, max_length=512)
-         with torch.no_grad():
-             outputs = model(**inputs)
-             test_probs = torch.nn.functional.softmax(outputs.logits, dim=-1)
-         logger.info(f"Test probabilities: {test_probs[0].tolist()}")
-
          logger.info("Model loaded successfully!")
          return True
      except Exception as e:
          logger.error(f"Error loading model: {e}")
          return False

- def get_colored_bar(percentage, label):
-     """Create colored progress bar based on percentage and label type"""
-     # Determine color based on percentage and label
-     if "phishing" in label.lower() or "suspicious" in label.lower():
-         # Red scale for dangerous content
-         if percentage >= 70:
-             color = "🟥" # High danger - red
-         elif percentage >= 40:
-             color = "🟠" # Medium danger - orange
-         else:
-             color = "🟡" # Low danger - yellow
-     else:
-         # Green scale for legitimate content
-         if percentage >= 70:
-             color = "🟢" # High confidence - green
-         elif percentage >= 40:
-             color = "🟡" # Medium confidence - yellow
-         else:
-             color = "⚪" # Low confidence - white
-
-     # Create bar (scale to 20 characters)
-     bar_length = max(1, int(percentage / 5)) # Ensure at least 1 if percentage > 0
-     bar = color * bar_length + "⚪" * (20 - bar_length)
-
-     return bar

  def predict_email(email_text):
-     """
-     Enhanced prediction function with proper model output handling
-     """
      # Input validation
-     if not email_text or not email_text.strip():
-         return "⚠️ **Error**: Please enter some email text to analyze."
-
-     if len(email_text.strip()) < 5:
-         return "⚠️ **Warning**: Email text too short for reliable analysis."

      # Check if model is loaded
      if tokenizer is None or model is None:
          if not load_model():
-             return "❌ **Error**: Failed to load the model."

      try:
-         # Preprocess and tokenize
          inputs = tokenizer(
              email_text,
              return_tensors="pt",
@@ -95,210 +71,103 @@ def predict_email(email_text):
              padding=True
          )

-         # Get prediction with proper handling
          with torch.no_grad():
              outputs = model(**inputs)
-             # Apply temperature scaling to prevent overconfidence
-             temperature = 1.5
-             scaled_logits = outputs.logits / temperature
-             predictions = torch.nn.functional.softmax(scaled_logits, dim=-1)

-         # Get probabilities
-         probs = predictions[0].tolist()

-         # Log raw outputs for debugging
-         logger.info(f"Raw logits: {outputs.logits[0].tolist()}")
-         logger.info(f"Scaled probabilities: {probs}")

-         # Get proper labels from model config or use fallback
-         if hasattr(model.config, 'id2label') and model.config.id2label:
-             labels = {model.config.id2label[i]: probs[i] for i in range(len(probs))}
-         else:
-             # Fallback - check the actual model output dimension
-             if len(probs) == 2:
-                 labels = {
-                     "Legitimate Email": probs[0],
-                     "Phishing Email": probs[1]
-                 }
-             elif len(probs) == 4:
-                 labels = {
-                     "Legitimate Email": probs[0],
-                     "Phishing Email": probs[1],
-                     "Suspicious Content": probs[2],
-                     "Spam Email": probs[3]
-                 }
-             else:
-                 # Generic labels
-                 labels = {f"Class {i}": probs[i] for i in range(len(probs))}
-
-         # Check if model is giving reasonable outputs
-         prob_variance = np.var(probs)
-         max_prob = max(probs)
-
-         # If variance is too low, the model might not be working properly
-         if prob_variance < 0.01 and max_prob > 0.99:
-             logger.warning("Model showing signs of overconfidence or poor calibration")
-             # Apply smoothing
-             smoothed_probs = [(p * 0.8 + 0.2/len(probs)) for p in probs]
-             labels = {list(labels.keys())[i]: smoothed_probs[i] for i in range(len(smoothed_probs))}
-
-         # Find prediction
-         max_label = max(labels.items(), key=lambda x: x[1])
-
-         # Determine risk level and emoji
-         confidence = max_label[1]
-         prediction_name = max_label[0]

-         if any(word in prediction_name.lower() for word in ['phishing', 'suspicious', 'spam']):
-             if confidence > 0.8:
-                 risk_emoji = "🚨"
-                 risk_level = "HIGH RISK"
-             elif confidence > 0.6:
-                 risk_emoji = "⚠️"
-                 risk_level = "MEDIUM RISK"
-             else:
-                 risk_emoji = "⚡"
-                 risk_level = "LOW RISK"
          else:
-             if confidence > 0.8:
-                 risk_emoji = "✅"
-                 risk_level = "SAFE"
-             elif confidence > 0.6:
-                 risk_emoji = ""
-                 risk_level = "LIKELY SAFE"
-             else:
-                 risk_emoji = ""
-                 risk_level = "UNCERTAIN"
-
-         # Format output with colored bars
-         result = f"{risk_emoji} **{risk_level}**\n\n"
-         result += f"**Primary Classification**: {prediction_name}\n"
-         result += f"**Confidence**: {confidence:.1%}\n\n"
-         result += f"**Detailed Analysis**:\n"
-
-         # Sort by probability and add colored bars
-         for label, prob in sorted(labels.items(), key=lambda x: x[1], reverse=True):
-             percentage = prob * 100
-             colored_bar = get_colored_bar(percentage, label)
-             result += f"{label}: {percentage:.1f}% {colored_bar}\n"
-
-         # Add debug info
-         result += f"\n**Debug Info**:\n"
-         result += f"Model Variance: {prob_variance:.4f}\n"
-         result += f"Raw Probabilities: {[f'{p:.3f}' for p in probs]}\n"
-
-         # Add recommendations based on actual classification
-         if any(word in prediction_name.lower() for word in ['phishing', 'suspicious']) and confidence > 0.6:
-             result += f"\n⚠️ **Recommendation**: This email shows signs of being malicious. Avoid clicking links or providing personal information."
-         elif 'spam' in prediction_name.lower():
-             result += f"\n🗑️ **Recommendation**: This appears to be spam. Consider deleting or marking as junk."
-         elif confidence > 0.7:
-             result += f"\n✅ **Recommendation**: This email appears legitimate, but always remain vigilant."
          else:
-             result += f"\n❓ **Recommendation**: Classification uncertain. Exercise caution and verify sender if needed."
-
-         return result

      except Exception as e:
-         logger.error(f"Error during prediction: {e}", exc_info=True)
-         return f"❌ **Error**: Analysis failed - {str(e)}"

- # Example emails for testing
  example_legitimate = """Dear Customer,
-
- Thank you for your recent purchase from TechStore. Your order #ORD-2024-001234 has been successfully processed.
-
  Order Details:
- - Product: Wireless Headphones
  - Amount: $79.99
- - Estimated delivery: 3-5 business days
-
- You will receive a tracking number once your item ships.
-
  Best regards,
- TechStore Customer Service"""
-
- example_phishing = """URGENT SECURITY ALERT!!!
-
- Your account has been COMPROMISED! Immediate action required!
-
- Click here NOW to secure your account: http://fake-security-site.malicious.com/urgent-verify
-
- WARNING: You have only 24 hours before your account is permanently suspended!
-
- This is your FINAL notice - act immediately!
-
- Security Department"""
-
  example_neutral = """Hi team,
-
- Hope everyone is doing well. Just wanted to remind you about the meeting scheduled for tomorrow at 2 PM in the conference room.
-
- Please bring your project updates and any questions you might have.
-
  Thanks,
- Sarah"""

  # Load model on startup
  load_model()

- # Create enhanced Gradio interface
- with gr.Blocks(title="PhishGuardian AI", theme=gr.themes.Soft()) as iface:
-     gr.Markdown("""
-     # 🛡️ PhishGuardian AI - Enhanced Detection
-
-     Advanced phishing email detection with colored risk indicators and improved model handling.
-     """)

      with gr.Row():
          with gr.Column(scale=2):
              email_input = gr.Textbox(
-                 lines=10,
-                 placeholder="Paste your email content here for analysis...",
-                 label="📧 Email Content",
-                 info="Enter the complete email text for comprehensive analysis"
              )
-
              with gr.Row():
-                 analyze_btn = gr.Button("🔍 Analyze Email", variant="primary", size="lg")
-                 clear_btn = gr.Button("🗑️ Clear", variant="secondary")

          with gr.Column(scale=2):
              output = gr.Textbox(
-                 label="🛡️ Security Analysis Results",
-                 lines=20,
                  interactive=False,
                  show_copy_button=True
              )

-     # Example section with better examples
-     gr.Markdown("### 📝 Test Examples")
      with gr.Row():
-         legit_btn = gr.Button("✅ Legitimate Email", size="sm")
-         phish_btn = gr.Button("🚨 Phishing Email", size="sm")
-         neutral_btn = gr.Button("📄 Neutral Text", size="sm")
-
-     # Event handlers
      analyze_btn.click(predict_email, inputs=email_input, outputs=output)
      clear_btn.click(lambda: ("", ""), outputs=[email_input, output])
-
-     legit_btn.click(lambda: example_legitimate, outputs=email_input)
-     phish_btn.click(lambda: example_phishing, outputs=email_input)
-     neutral_btn.click(lambda: example_neutral, outputs=email_input)
-
-     # Footer with model info
-     gr.Markdown("""
-     ---
-     **🔧 Model**: cybersectony/phishing-email-detection-distilbert_v2.4.1
-     **🎯 Features**: Temperature scaling, colored risk bars, enhanced debugging
-     **🏛️ Institution**: University of Dar es Salaam (UDSM)
-     """)

  if __name__ == "__main__":
-     iface.launch(
-         share=True,
-         server_name="0.0.0.0",
-         server_port=7860,
-         show_error=True,
-         debug=True
-     )
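The removed `predict_email` body above divided the logits by a fixed temperature of 1.5 before the softmax to soften overconfident predictions; the new version drops this and uses the raw softmax instead. As a standalone illustration of that calibration trick (not part of this repository), a minimal sketch might look like:

import torch
import torch.nn.functional as F

def scaled_probabilities(logits: torch.Tensor, temperature: float = 1.5) -> torch.Tensor:
    # Dividing logits by a temperature > 1 flattens the softmax distribution;
    # temperature == 1.0 reproduces the plain softmax.
    return F.softmax(logits / temperature, dim=-1)

# Hypothetical two-class logits from an overconfident classifier
logits = torch.tensor([[4.0, 0.5]])
print(scaled_probabilities(logits, temperature=1.0))  # roughly [[0.97, 0.03]]
print(scaled_probabilities(logits, temperature=1.5))  # flatter, roughly [[0.91, 0.09]]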
 
New version (added lines are marked with "+"):

  import torch
  from transformers import AutoTokenizer, AutoModelForSequenceClassification
  import logging
+ import re

+ # Configure logging (minimal)
  logging.basicConfig(level=logging.INFO)
  logger = logging.getLogger(__name__)

  # Model configuration
  MODEL_NAME = "cybersectony/phishing-email-detection-distilbert_v2.4.1"

+ # Explanation of labels and their values
+ """
+ Labels and Their Meanings:
+ - Legitimate: The email appears safe and is likely from a trusted source.
+ - Phishing: The email may be a scam attempting to steal personal information.
+ - Suspicious: The email has questionable content and may not be safe.
+ - Spam: The email is likely unwanted promotional or junk content.
+ Each label comes with a percentage (0-100%) indicating the model's confidence.
+ Higher percentages mean the model is more certain of the classification.
+ """
+
  # Global variables for model and tokenizer
  tokenizer = None
  model = None

  def load_model():
+     """Load the model and tokenizer with basic error handling"""
      global tokenizer, model
      try:
          tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
          model = AutoModelForSequenceClassification.from_pretrained(MODEL_NAME)
          logger.info("Model loaded successfully!")
          return True
      except Exception as e:
          logger.error(f"Error loading model: {e}")
          return False

+ def is_valid_email_text(text):
+     """Basic validation for email-like text"""
+     if not text or not text.strip():
+         return False, "Please enter some email text."
+     if len(text.strip()) < 10:
+         return False, "Text too short for analysis."
+     # Check for basic email-like structure or meaningful words
+     if len(text.split()) < 3 or not re.search(r"[a-zA-Z]{3,}", text):
+         return False, "Text appears incoherent or not email-like."
+     return True, ""

  def predict_email(email_text):
+     """Simplified prediction function with clear output"""
      # Input validation
+     valid, message = is_valid_email_text(email_text)
+     if not valid:
+         return f"⚠️ Error: {message}"

      # Check if model is loaded
      if tokenizer is None or model is None:
          if not load_model():
+             return "❌ Error: Failed to load the model."

      try:
+         # Tokenize input
          inputs = tokenizer(
              email_text,
              return_tensors="pt",
@@ -95,210 +71,103 @@ def predict_email(email_text):
              padding=True
          )

+         # Get prediction
          with torch.no_grad():
              outputs = model(**inputs)
+         probs = torch.nn.functional.softmax(outputs.logits, dim=-1)[0].tolist()

+         # Get labels from model config or fallback
+         labels = (model.config.id2label if hasattr(model.config, 'id2label') and model.config.id2label
+                   else {0: "Legitimate", 1: "Phishing", 2: "Suspicious", 3: "Spam"} if len(probs) == 4
+                   else {0: "Legitimate", 1: "Phishing"})

+         # Map probabilities to labels
+         results = {labels[i]: probs[i] * 100 for i in range(len(probs))}

+         # Get top prediction
+         max_label, max_prob = max(results.items(), key=lambda x: x[1])

+         # Simplified risk levels
+         if "phishing" in max_label.lower() or "suspicious" in max_label.lower():
+             risk_level = "⚠️ Risky" if max_prob > 60 else "⚡ Low Risk"
+         elif "spam" in max_label.lower():
+             risk_level = "🗑️ Spam"
          else:
+             risk_level = "✅ Safe" if max_prob > 60 else "❓ Uncertain"
+
+         # Format output
+         output = f"Result: {risk_level}\n"
+         output += f"Top Prediction: {max_label} ({max_prob:.1f}%)\n"
+         output += "Details:\n"
+         for label, prob in sorted(results.items(), key=lambda x: x[1], reverse=True):
+             output += f"{label}: {prob:.1f}%\n"
+
+         # Simple recommendation
+         if "phishing" in max_label.lower() or "suspicious" in max_label.lower():
+             output += "Advice: Avoid clicking links or sharing info."
+         elif "spam" in max_label.lower():
+             output += "Advice: Mark as spam or delete."
          else:
+             output += "Advice: Appears safe, but stay cautious."

+         return output
+
      except Exception as e:
+         logger.error(f"Error during prediction: {e}")
+         return f"❌ Error: Analysis failed - {str(e)}"

+ # Example emails
  example_legitimate = """Dear Customer,
+ Thank you for your purchase from TechStore. Your order #ORD-2024-001234 is processed.
  Order Details:
+ - Product: Wireless Headphones
  - Amount: $79.99
+ - Delivery: 3-5 days
  Best regards,
+ TechStore"""
+ example_phishing = """URGENT!!!
+ Your account is COMPROMISED! Click here to secure: http://fake-site.com/verify
+ Act NOW or your account will be suspended!
+ Security Team"""
  example_neutral = """Hi team,
+ Reminder: meeting today at 10 PM. Bring project updates.
  Thanks,
+ Byabato"""

  # Load model on startup
  load_model()

+ # Minimalist Gradio interface
+ with gr.Blocks(title="PhishGuardian", theme=gr.themes.Soft()) as iface:
+     gr.Markdown("# 🛡️ PhishGuardian\nSimple email safety checker.\n\nCheck if an email is safe or risky. Paste the email text and click 'Check'.")

      with gr.Row():
          with gr.Column(scale=2):
              email_input = gr.Textbox(
+                 lines=8,
+                 placeholder="Paste email here...",
+                 label="📧 Email"
              )
              with gr.Row():
+                 analyze_btn = gr.Button("🔍 Check", variant="primary")
+                 clear_btn = gr.Button("🗑️ Clear")

          with gr.Column(scale=2):
              output = gr.Textbox(
+                 label=" Results",
+                 lines=10,
                  interactive=False,
                  show_copy_button=True
              )

+     gr.Markdown("### 📝 Examples")
      with gr.Row():
+         gr.Button("✅ Legitimate", size="sm").click(lambda: example_legitimate, outputs=email_input)
+         gr.Button("🚨 Phishing", size="sm").click(lambda: example_phishing, outputs=email_input)
+         gr.Button("📄 Neutral", size="sm").click(lambda: example_neutral, outputs=email_input)
+
      analyze_btn.click(predict_email, inputs=email_input, outputs=output)
      clear_btn.click(lambda: ("", ""), outputs=[email_input, output])

  if __name__ == "__main__":
+     iface.launch(server_port=7860, show_error=True)
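For reference, the same checkpoint can be queried outside the Gradio UI. This is a minimal sketch, assuming torch and transformers are installed and the model can be downloaded; the label names come from the checkpoint's own config rather than the app's fallback mapping:

import torch
from transformers import AutoTokenizer, AutoModelForSequenceClassification

MODEL_NAME = "cybersectony/phishing-email-detection-distilbert_v2.4.1"
tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
model = AutoModelForSequenceClassification.from_pretrained(MODEL_NAME)

text = "URGENT!!! Your account is COMPROMISED! Click here to verify."
inputs = tokenizer(text, return_tensors="pt", truncation=True, max_length=512, padding=True)
with torch.no_grad():
    probs = torch.nn.functional.softmax(model(**inputs).logits, dim=-1)[0]

# id2label is populated for most Hugging Face checkpoints; fall back to generic names otherwise
id2label = getattr(model.config, "id2label", None) or {i: f"Class {i}" for i in range(len(probs))}
for i, p in enumerate(probs.tolist()):
    print(f"{id2label[i]}: {p:.1%}")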