saakshigupta committed
Commit 4cad98d · verified · Parent: 0bdc990

Update app.py

Files changed (1): app.py (+15 -4)
app.py

```diff
@@ -3,7 +3,7 @@ import streamlit as st
 import torch
 from PIL import Image
 import io
-from transformers import AutoProcessor, AutoModelForCausalLM
+from transformers import AutoProcessor, BitsAndBytesConfig, MllamaForCausalLM
 from peft import PeftModel
 
 # Page config
@@ -21,12 +21,23 @@ st.markdown("Upload an image to analyze it for possible deepfake manipulation")
 def load_model():
     """Load model and processor (cached to avoid reloading)"""
     # Load base model
-    base_model_id = "unsloth/llama-3.2-11b-vision-instruct"
+    base_model_id = "unsloth/llama-3.2-11b-vision-instruct-unsloth-bnb-4bit"
     processor = AutoProcessor.from_pretrained(base_model_id)
-    model = AutoModelForCausalLM.from_pretrained(
+
+    # Configure 4-bit quantization
+    quantization_config = BitsAndBytesConfig(
+        load_in_4bit=True,
+        bnb_4bit_compute_dtype=torch.float16,
+        bnb_4bit_quant_type="nf4",
+        bnb_4bit_use_double_quant=True
+    )
+
+    # Use the specific model class MllamaForCausalLM instead of AutoModelForCausalLM
+    model = MllamaForCausalLM.from_pretrained(
+        base_model_id,
         device_map="auto",
-        torch_dtype=torch.float16
+        torch_dtype=torch.float16,
+        quantization_config=quantization_config
     )
 
     # Load adapter
```
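
For context, here is a minimal sketch of how `load_model()` reads once this commit is applied, including the adapter step the diff truncates at. The `@st.cache_resource` decorator is an assumption inferred from the docstring's "cached to avoid reloading", the return signature is assumed, and `ADAPTER_ID` is a hypothetical placeholder since the diff ends before the actual adapter repo id appears:

```python
import streamlit as st
import torch
from transformers import AutoProcessor, BitsAndBytesConfig, MllamaForCausalLM
from peft import PeftModel

@st.cache_resource  # assumed caching mechanism; the decorator itself is not shown in the diff
def load_model():
    """Load model and processor (cached to avoid reloading)"""
    # Load base model (pre-quantized 4-bit Unsloth build of Llama 3.2 11B Vision)
    base_model_id = "unsloth/llama-3.2-11b-vision-instruct-unsloth-bnb-4bit"
    processor = AutoProcessor.from_pretrained(base_model_id)

    # Configure 4-bit quantization: NF4 weight format, double quantization of the
    # quantization constants, fp16 compute for dequantized activations
    quantization_config = BitsAndBytesConfig(
        load_in_4bit=True,
        bnb_4bit_compute_dtype=torch.float16,
        bnb_4bit_quant_type="nf4",
        bnb_4bit_use_double_quant=True,
    )

    # Use the specific model class MllamaForCausalLM instead of AutoModelForCausalLM
    model = MllamaForCausalLM.from_pretrained(
        base_model_id,
        device_map="auto",
        torch_dtype=torch.float16,
        quantization_config=quantization_config,
    )

    # Load adapter: ADAPTER_ID is a placeholder, the real repo id is not in the diff
    ADAPTER_ID = "your-username/your-lora-adapter"
    model = PeftModel.from_pretrained(model, ADAPTER_ID)

    return model, processor
```

The apparent intent of the change: loading the already-quantized Unsloth checkpoint with a matching `BitsAndBytesConfig` keeps the 11B vision model within a single GPU's memory budget, while the LoRA adapter loaded via PEFT sits on top of the quantized base.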