Spaces:

deepugaur
/

new__project

Sleeping

App Files Files Community

deepugaur commited on Nov 23, 2024

Commit

1c1f9d0

verified ·

1 Parent(s): 466d440

Update app.py

Browse files

Files changed (1) hide show

app.py +68 -58

app.py CHANGED Viewed

@@ -2,89 +2,99 @@
 import streamlit as st
 import tensorflow as tf
-from tensorflow.keras.preprocessing.text import Tokenizer
-from tensorflow.keras.preprocessing.sequence import pad_sequences
 import numpy as np
 from lime.lime_text import LimeTextExplainer
-import matplotlib.pyplot as plt
-# Streamlit Title
-st.title("Prompt Injection Detection and Prevention")
-st.write("Classify prompts as malicious or valid and understand predictions using LIME.")
-# Cache Model Loading
 @st.cache_resource
 def load_model(filepath):
     return tf.keras.models.load_model(filepath)
-# Tokenizer Setup
 @st.cache_resource
-def setup_tokenizer():
-    tokenizer = Tokenizer(num_words=5000)
-    # Predefined vocabulary for demonstration purposes; replace with your actual tokenizer setup.
-    tokenizer.fit_on_texts(["example prompt", "malicious attack", "valid input prompt"])
-    return tokenizer
-# Preprocessing Function
 def preprocess_prompt(prompt, tokenizer, max_length=100):
     sequence = tokenizer.texts_to_sequences([prompt])
-    return pad_sequences(sequence, maxlen=max_length)
-# Prediction Function
-def detect_prompt(prompt, tokenizer, model):
-    processed_prompt = preprocess_prompt(prompt, tokenizer)
     prediction = model.predict(processed_prompt)[0][0]
-    class_label = 'Malicious' if prediction >= 0.5 else 'Valid'
     confidence_score = prediction * 100 if prediction >= 0.5 else (1 - prediction) * 100
     return class_label, confidence_score
-# LIME Explanation
 def lime_explain(prompt, model, tokenizer, max_length=100):
-    explainer = LimeTextExplainer(class_names=["Valid", "Malicious"])
     def predict_fn(prompts):
         sequences = tokenizer.texts_to_sequences(prompts)
         padded_sequences = pad_sequences(sequences, maxlen=max_length)
         predictions = model.predict(padded_sequences)
         return np.hstack([1 - predictions, predictions])
-    explanation = explainer.explain_instance(
-        prompt,
-        predict_fn,
-        num_features=10
-    )
     return explanation
-# Load Model Section
-st.subheader("Load Your Trained Model")
-model = None
-tokenizer = None
-model_path = "deep_learning_model (1).h5"  # Ensure this file is in the same directory as app.py
-try:
-    model = load_model(model_path)
-    tokenizer = setup_tokenizer()
-    st.success("Model Loaded Successfully!")
-    # User Prompt Input
-    st.subheader("Classify Your Prompt")
     user_prompt = st.text_input("Enter a prompt to classify:")
     if user_prompt:
-        class_label, confidence_score = detect_prompt(user_prompt, tokenizer, model)
-        st.write(f"Predicted Class: **{class_label}**")
-        st.write(f"Confidence Score: **{confidence_score:.2f}%**")
-        # LIME Explanation
-        st.subheader("LIME Explanation")
-        explanation = lime_explain(user_prompt, model, tokenizer)
-        explanation_as_html = explanation.as_html()
-        st.components.v1.html(explanation_as_html, height=500)
-except Exception as e:
-    st.error(f"Error Loading Model: {e}")
-# Footer
-st.write("---")
-st.write("Developed for detecting and preventing prompt injection attacks.")

 import streamlit as st
 import tensorflow as tf
 import numpy as np
+from tensorflow.keras.preprocessing.sequence import pad_sequences
+import pickle
+from lime import lime_text
 from lime.lime_text import LimeTextExplainer
+# Load the model
 @st.cache_resource
 def load_model(filepath):
     return tf.keras.models.load_model(filepath)
+# Load tokenizer
 @st.cache_resource
+def load_tokenizer(filepath):
+    with open(filepath, 'rb') as handle:
+        return pickle.load(handle)
+# Preprocess prompt
 def preprocess_prompt(prompt, tokenizer, max_length=100):
     sequence = tokenizer.texts_to_sequences([prompt])
+    padded_sequence = pad_sequences(sequence, maxlen=max_length)
+    return padded_sequence
+# Predict prompt class
+def detect_prompt(prompt, tokenizer, model, max_length=100):
+    processed_prompt = preprocess_prompt(prompt, tokenizer, max_length)
     prediction = model.predict(processed_prompt)[0][0]
+    class_label = "Malicious" if prediction >= 0.5 else "Valid"
     confidence_score = prediction * 100 if prediction >= 0.5 else (1 - prediction) * 100
     return class_label, confidence_score
+# LIME explanation
 def lime_explain(prompt, model, tokenizer, max_length=100):
     def predict_fn(prompts):
         sequences = tokenizer.texts_to_sequences(prompts)
         padded_sequences = pad_sequences(sequences, maxlen=max_length)
         predictions = model.predict(padded_sequences)
         return np.hstack([1 - predictions, predictions])
+    class_names = ["Valid", "Malicious"]
+    explainer = LimeTextExplainer(class_names=class_names)
+    explanation = explainer.explain_instance(prompt, predict_fn, num_features=10)
     return explanation
+# Streamlit App
+st.title("Prompt Injection Detection and Prevention")
+st.write("Classify prompts as malicious or valid and understand predictions using LIME.")
+# Model input
+model_path = st.text_input("Enter the path to your trained model (.h5):")
+if model_path:
+    try:
+        model = load_model(model_path)
+        st.success("Model Loaded Successfully!")
+    except Exception as e:
+        st.error(f"Error Loading Model: {e}")
+        model = None
+else:
+    model = None
+# Tokenizer input
+tokenizer_path = st.text_input("Enter the path to your tokenizer file (.pickle):")
+if tokenizer_path:
+    try:
+        tokenizer = load_tokenizer(tokenizer_path)
+        st.success("Tokenizer Loaded Successfully!")
+    except Exception as e:
+        st.error(f"Error Loading Tokenizer: {e}")
+        tokenizer = None
+else:
+    tokenizer = None
+# Prompt classification
+if model and tokenizer:
     user_prompt = st.text_input("Enter a prompt to classify:")
     if user_prompt:
+        st.subheader("Model Prediction")
+        try:
+            # Classify the prompt
+            class_label, confidence_score = detect_prompt(user_prompt, tokenizer, model)
+            st.write(f"Predicted Class: **{class_label}**")
+            st.write(f"Confidence Score: **{confidence_score:.2f}%**")
+            # Debugging information
+            st.write("Debugging Information:")
+            st.write(f"Tokenized Sequence: {tokenizer.texts_to_sequences([user_prompt])}")
+            st.write(f"Padded Sequence: {preprocess_prompt(user_prompt, tokenizer)}")
+            st.write(f"Raw Model Output: {model.predict(preprocess_prompt(user_prompt, tokenizer))[0][0]}")
+            # Generate LIME explanation
+            explanation = lime_explain(user_prompt, model, tokenizer)
+            explanation_as_html = explanation.as_html()
+            st.components.v1.html(explanation_as_html, height=500)
+        except Exception as e:
+            st.error(f"Error during prediction: {e}")