pascal-maker committed on
Commit 07f5f6e · verified · 1 Parent(s): 6cd7b7a

Update app.py

Files changed (1)
  1. app.py +233 -559
app.py CHANGED
@@ -1,582 +1,256 @@
  #!/usr/bin/env python
- # -*- coding: utf-8 -*-
-
  """
- Combined Medical-VLM, **SAM-2 automatic masking**, and CheXagent demo.
-
- Changes
- -------
- 1. Fixed SAM-2 installation and import issues
- 2. Added proper error handling for missing dependencies
- 3. Made SAM-2 functionality optional with graceful fallback
- 4. Added installation instructions and requirements check
  """

- # ---------------------------------------------------------------------
- # Standard libs
- # ---------------------------------------------------------------------
- import os
  import sys
- import uuid
- import tempfile
  import subprocess
- import warnings
- from threading import Thread
-
- # Environment setup
- os.environ["PYTORCH_ENABLE_MPS_FALLBACK"] = "1"
- warnings.filterwarnings("ignore", message=r".*upsample_bicubic2d.*")

- # ---------------------------------------------------------------------
- # Third-party libs
- # ---------------------------------------------------------------------
- import torch
  import numpy as np
- from PIL import Image, ImageDraw
- import gradio as gr
-
- # =============================================================================
- # Dependency checker and installer
- # =============================================================================
- def check_and_install_sam2():
-     """Check if SAM-2 is available and attempt installation if needed."""
      try:
-         print("[SAM-2 Debug] Attempting to import SAM-2 modules...")
          from sam2.build_sam import build_sam2
-         from sam2.automatic_mask_generator import SAM2AutomaticMaskGenerator
-         print("[SAM-2 Debug] Successfully imported SAM-2 modules")
          return True, "SAM-2 already available"
-     except ImportError as e:
-         print(f"[SAM-2 Debug] Import error: {str(e)}")
-         print("[SAM-2 Debug] Attempting to install SAM-2...")
          try:
-             # Clone SAM-2 repository
-             if not os.path.exists("segment-anything-2"):
-                 print("[SAM-2 Debug] Cloning SAM-2 repository...")
-                 subprocess.run([
-                     "git", "clone",
-                     "https://github.com/facebookresearch/segment-anything-2.git"
-                 ], check=True)
-                 print("[SAM-2 Debug] Repository cloned successfully")
-
-             # Install SAM-2
-             print("[SAM-2 Debug] Installing SAM-2...")
-             original_dir = os.getcwd()
-             os.chdir("segment-anything-2")
-             subprocess.run([sys.executable, "-m", "pip", "install", "-e", "."], check=True)
-             os.chdir(original_dir)
-             print("[SAM-2 Debug] Installation completed")
-
-             # Add to Python path
-             sam2_path = os.path.abspath("segment-anything-2")
-             if sam2_path not in sys.path:
-                 sys.path.insert(0, sam2_path)
-                 print(f"[SAM-2 Debug] Added {sam2_path} to Python path")
-
-             # Try importing again
-             print("[SAM-2 Debug] Attempting to import SAM-2 modules again...")
-             from sam2.build_sam import build_sam2
-             from sam2.automatic_mask_generator import SAM2AutomaticMaskGenerator
-             print("[SAM-2 Debug] Successfully imported SAM-2 modules after installation")
-             return True, "SAM-2 installed successfully"
-
-         except Exception as e:
-             print(f"[SAM-2 Debug] Installation failed: {str(e)}")
-             print(f"[SAM-2 Debug] Error type: {type(e).__name__}")
-             return False, f"SAM-2 installation failed: {e}"

- # Check SAM-2 availability
  SAM2_AVAILABLE, SAM2_STATUS = check_and_install_sam2()
  print(f"SAM-2 Status: {SAM2_STATUS}")
-
- # =============================================================================
- # SAM-2 imports (conditional)
- # =============================================================================
  if SAM2_AVAILABLE:
      try:
-         from sam2.build_sam import build_sam2
-         from sam2.automatic_mask_generator import SAM2AutomaticMaskGenerator
-         from sam2.modeling.sam2_base import SAM2Base
-     except ImportError as e:
-         print(f"SAM-2 import error: {e}")
-         SAM2_AVAILABLE = False
-
- # =============================================================================
- # Qwen-VLM imports & helper
- # =============================================================================
- from transformers import Qwen2_5_VLForConditionalGeneration, AutoProcessor
- from qwen_vl_utils import process_vision_info
-
- # =============================================================================
- # CheXagent imports
- # =============================================================================
- from transformers import AutoTokenizer, AutoModelForCausalLM, TextIteratorStreamer
-
- # ---------------------------------------------------------------------
- # Devices
- # ---------------------------------------------------------------------
- def get_device():
-     if torch.cuda.is_available():
-         return torch.device("cuda")
-     if torch.backends.mps.is_available():
-         return torch.device("mps")
-     return torch.device("cpu")
-
- # =============================================================================
- # Qwen-VLM model & agent
- # =============================================================================
- _qwen_model = None
- _qwen_processor = None
- _qwen_device = None
-
- def load_qwen_model_and_processor(hf_token=None):
-     global _qwen_model, _qwen_processor, _qwen_device
-     if _qwen_model is None:
-         _qwen_device = "mps" if torch.backends.mps.is_available() else "cpu"
-         print(f"[Qwen] loading model on {_qwen_device}")
-         auth_kwargs = {"use_auth_token": hf_token} if hf_token else {}
-         _qwen_model = Qwen2_5_VLForConditionalGeneration.from_pretrained(
-             "Qwen/Qwen2.5-VL-3B-Instruct",
-             trust_remote_code=True,
-             attn_implementation="eager",
-             torch_dtype=torch.float32,
-             low_cpu_mem_usage=True,
-             device_map=None,
-             **auth_kwargs,
-         ).to(_qwen_device)
-         _qwen_processor = AutoProcessor.from_pretrained(
-             "Qwen/Qwen2.5-VL-3B-Instruct",
-             trust_remote_code=True,
-             **auth_kwargs,
-         )
-     return _qwen_model, _qwen_processor, _qwen_device
-
- class MedicalVLMAgent:
-     """Light wrapper around Qwen-VLM with an optional image."""
-
-     def __init__(self, model, processor, device):
-         self.model = model
-         self.processor = processor
-         self.device = device
-         self.system_prompt = (
-             "You are a medical information assistant with vision capabilities.\n"
-             "Disclaimer: I am not a licensed medical professional. "
-             "The information provided is for reference only and should not be taken as medical advice."
-         )
-
-     def run(self, user_text: str, image: Image.Image | None = None) -> str:
-         messages = [
-             {"role": "system", "content": [{"type": "text", "text": self.system_prompt}]}
-         ]
-         user_content = []
-         if image is not None:
-             tmp = f"/tmp/{uuid.uuid4()}.png"
-             image.save(tmp)
-             user_content.append({"type": "image", "image": tmp})
-         user_content.append({"type": "text", "text": user_text or "Please describe the image."})
-         messages.append({"role": "user", "content": user_content})
-
-         prompt_text = self.processor.apply_chat_template(
-             messages, tokenize=False, add_generation_prompt=True
-         )
-         img_inputs, vid_inputs = process_vision_info(messages)
-         inputs = self.processor(
-             text=[prompt_text],
-             images=img_inputs,
-             videos=vid_inputs,
-             padding=True,
-             return_tensors="pt",
-         ).to(self.device)
-
-         with torch.no_grad():
-             out = self.model.generate(**inputs, max_new_tokens=128)
-         trimmed = out[0][inputs.input_ids.shape[1]:]
-         return self.processor.decode(trimmed, skip_special_tokens=True).strip()
-
- # =============================================================================
- # SAM-2 model + AutomaticMaskGenerator (final minimal version)
- # =============================================================================
- import os
- import numpy as np
- from PIL import Image, ImageDraw
- from sam2.build_sam import build_sam2
- from sam2.automatic_mask_generator import SAM2AutomaticMaskGenerator
-
- def initialize_sam2():
-     # These two files are already in your repo
-     CKPT = "checkpoints/sam2.1_hiera_large.pt"  # ≈2.7 GB
-     CFG = "configs/sam2.1/sam2.1_hiera_l.yaml"
-
-     # One chdir so Hydra's search path starts inside sam2/sam2/
-     os.chdir("sam2/sam2")
-
-     device = get_device()
-     print(f"[SAM-2] building model on {device}")
-
-     sam2_model = build_sam2(
-         CFG,   # relative to sam2/sam2/
-         CKPT,  # relative after chdir
-         device=device,
-         apply_postprocessing=False,
-     )
-
-     mask_gen = SAM2AutomaticMaskGenerator(
-         model=sam2_model,
-         points_per_side=32,
-         pred_iou_thresh=0.86,
-         stability_score_thresh=0.92,
-         crop_n_layers=0,
-     )
-     return sam2_model, mask_gen
-
- # ---------------------- build once ----------------------
- try:
-     _sam2_model, _mask_generator = initialize_sam2()
-     print("[SAM-2] Successfully initialized!")
- except Exception as e:
-     print(f"[SAM-2] Failed to initialize: {e}")
-     _sam2_model, _mask_generator = None, None
-
- def automatic_mask_overlay(image_np: np.ndarray) -> np.ndarray:
-     """Generate masks and alpha-blend them on top of the original image."""
-     if _mask_generator is None:
-         raise RuntimeError("SAM-2 mask generator not initialized")
-
-     anns = _mask_generator.generate(image_np)
-     if not anns:
-         return image_np
-
-     overlay = image_np.copy()
-     if overlay.ndim == 2:  # grayscale → RGB
-         overlay = np.stack([overlay] * 3, axis=2)
-
-     for ann in sorted(anns, key=lambda x: x["area"], reverse=True):
-         m = ann["segmentation"]
-         color = np.random.randint(0, 255, 3, dtype=np.uint8)
-         overlay[m] = (overlay[m] * 0.5 + color * 0.5).astype(np.uint8)
-
-     return overlay
-
- def tumor_segmentation_interface(image: Image.Image | None):
-     if image is None:
-         return None, "Please upload an image."
-
-     if _mask_generator is None:
-         return None, "SAM-2 not properly initialized. Check the console for errors."
-
-     try:
-         img_np = np.array(image.convert("RGB"))
-         out_np = automatic_mask_overlay(img_np)
-         n_masks = len(_mask_generator.generate(img_np))
-         return Image.fromarray(out_np), f"{n_masks} masks found."
      except Exception as e:
-         return None, f"SAM-2 error: {e}"
-
- # =============================================================================
- # Simple fallback segmentation (when SAM-2 is not available)
- # =============================================================================
- def simple_segmentation_fallback(image: Image.Image | None):
-     """Simple fallback segmentation using basic image processing."""
-     if image is None:
-         return None, "Please upload an image."
-
      try:
-         import cv2
-         from skimage import segmentation, color
-
-         # Convert to numpy array
-         img_np = np.array(image.convert("RGB"))
-
-         # Simple watershed segmentation
-         gray = cv2.cvtColor(img_np, cv2.COLOR_RGB2GRAY)
-         _, binary = cv2.threshold(gray, 0, 255, cv2.THRESH_BINARY_INV + cv2.THRESH_OTSU)
-
-         # Remove noise
-         kernel = np.ones((3, 3), np.uint8)
-         opening = cv2.morphologyEx(binary, cv2.MORPH_OPEN, kernel, iterations=2)
-
-         # Sure background area
-         sure_bg = cv2.dilate(opening, kernel, iterations=3)
-
-         # Finding sure foreground area
-         dist_transform = cv2.distanceTransform(opening, cv2.DIST_L2, 5)
-         _, sure_fg = cv2.threshold(dist_transform, 0.7 * dist_transform.max(), 255, 0)
-
-         # Create overlay
-         overlay = img_np.copy()
-         overlay[sure_fg > 0] = [255, 0, 0]  # Red overlay
-
-         # Alpha blend
-         result = cv2.addWeighted(img_np, 0.7, overlay, 0.3, 0)
-
-         return Image.fromarray(result), "Simple segmentation applied (SAM-2 not available)"
-
-     except Exception as e:
-         return None, f"Fallback segmentation error: {e}"
-
- # =============================================================================
- # CheXagent set-up
- # =============================================================================
- try:
-     print("[CheXagent] Starting initialization...")
-     chex_name = "StanfordAIMI/CheXagent-2-3b"
-     print(f"[CheXagent] Loading tokenizer from {chex_name}")
-     chex_tok = AutoTokenizer.from_pretrained(chex_name, trust_remote_code=True)
-     print("[CheXagent] Tokenizer loaded successfully")
-
-     print("[CheXagent] Loading model...")
-     chex_model = AutoModelForCausalLM.from_pretrained(
-         chex_name,
-         device_map="auto",
-         trust_remote_code=True,
-         torch_dtype=torch.float16 if torch.cuda.is_available() else torch.float32
-     )
-     print("[CheXagent] Model loaded successfully")
-
-     if torch.cuda.is_available():
-         print("[CheXagent] Converting to half precision for GPU")
-         chex_model = chex_model.half()
      else:
-         print("[CheXagent] Using full precision for CPU")
-         chex_model = chex_model.float()
-
-     chex_model.eval()
-     CHEXAGENT_AVAILABLE = True
-     print("[CheXagent] Initialization complete")
- except Exception as e:
-     print(f"[CheXagent] Initialization failed: {str(e)}")
-     print(f"[CheXagent] Error type: {type(e).__name__}")
-     CHEXAGENT_AVAILABLE = False
-     chex_tok, chex_model = None, None
-
- def get_model_device(model):
-     if model is None:
-         return torch.device("cpu")
-     for p in model.parameters():
-         return p.device
-     return torch.device("cpu")
-
- def clean_text(text):
-     return text.replace("</s>", "")
-
- @torch.no_grad()
- def response_report_generation(pil_image_1, pil_image_2):
-     """Structured chest-X-ray report (streaming)."""
-     if not CHEXAGENT_AVAILABLE:
-         yield "CheXagent is not available. Please check installation."
-         return
-
-     streamer = TextIteratorStreamer(chex_tok, skip_prompt=True, skip_special_tokens=True)
-     paths = []
-     for im in [pil_image_1, pil_image_2]:
-         if im is None:
-             continue
-         with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tfile:
-             im.save(tfile.name)
-             paths.append(tfile.name)
-
-     if not paths:
-         yield "Please upload at least one image."
-         return
-
-     device = get_model_device(chex_model)
-     anatomies = [
-         "View",
-         "Airway",
-         "Breathing",
-         "Cardiac",
-         "Diaphragm",
-         "Everything else (e.g., mediastinal contours, bones, soft tissues, tubes, valves, pacemakers)",
-     ]
-     prompts = [
-         "Determine the view of this CXR",
-         *[
-             f'Provide a detailed description of "{a}" in the chest X-ray'
-             for a in anatomies[1:]
-         ],
-     ]
-
-     findings = ""
-     partial = "## Generating Findings (step-by-step):\n\n"
-     for idx, (anat, prompt) in enumerate(zip(anatomies, prompts)):
-         query = chex_tok.from_list_format(
-             [*[{"image": p} for p in paths], {"text": prompt}]
-         )
-         conv = [
-             {"from": "system", "value": "You are a helpful assistant."},
-             {"from": "human", "value": query},
-         ]
-         inp = chex_tok.apply_chat_template(
-             conv, add_generation_prompt=True, return_tensors="pt"
-         ).to(device)
-         generate_kwargs = dict(
-             input_ids=inp,
-             max_new_tokens=512,
-             do_sample=False,
-             num_beams=1,
-             streamer=streamer,
-         )
-         Thread(target=chex_model.generate, kwargs=generate_kwargs).start()
-         partial += f"**Step {idx}: {anat}...**\n\n"
-         for tok in streamer:
-             if idx:
-                 findings += tok
-             partial += tok
-             yield clean_text(partial)
-         partial += "\n\n"
-         findings += " "
-     findings = findings.strip()
-
-     # Impression
-     partial += "## Generating Impression\n\n"
-     prompt = f"Write the Impression section for the following Findings: {findings}"
-     conv = [
-         {"from": "system", "value": "You are a helpful assistant."},
-         {"from": "human", "value": chex_tok.from_list_format([{"text": prompt}])},
-     ]
-     inp = chex_tok.apply_chat_template(
-         conv, add_generation_prompt=True, return_tensors="pt"
-     ).to(device)
-     Thread(
-         target=chex_model.generate,
-         kwargs=dict(
-             input_ids=inp,
-             do_sample=False,
-             num_beams=1,
-             max_new_tokens=512,
-             streamer=streamer,
-         ),
-     ).start()
-     for tok in streamer:
-         partial += tok
-         yield clean_text(partial)
-     yield clean_text(partial)
-
- @torch.no_grad()
- def response_phrase_grounding(pil_image, prompt_text):
-     """Very simple visual-grounding placeholder."""
-     if not CHEXAGENT_AVAILABLE:
-         return "CheXagent is not available. Please check installation.", None
-
-     if pil_image is None:
-         return "Please upload an image.", None
-
-     with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as tfile:
-         pil_image.save(tfile.name)
-         img_path = tfile.name
-
-     device = get_model_device(chex_model)
-     query = chex_tok.from_list_format([{"image": img_path}, {"text": prompt_text}])
-     conv = [
-         {"from": "system", "value": "You are a helpful assistant."},
-         {"from": "human", "value": query},
-     ]
-     inp = chex_tok.apply_chat_template(
-         conv, add_generation_prompt=True, return_tensors="pt"
-     ).to(device)
-     out = chex_model.generate(
-         input_ids=inp, do_sample=False, num_beams=1, max_new_tokens=512
-     )
-     resp = clean_text(chex_tok.decode(out[0][inp.shape[1]:]))
-
-     # simple center box (placeholder)
-     w, h = pil_image.size
-     cx, cy, sz = w // 2, h // 2, min(w, h) // 4
-     draw = ImageDraw.Draw(pil_image)
-     draw.rectangle([(cx - sz, cy - sz), (cx + sz, cy + sz)], outline="red", width=3)
-
-     return resp, pil_image
-
- # =============================================================================
- # Gradio UI
- # =============================================================================
- def create_ui():
-     """Create the Gradio interface."""
-     # Load Qwen model
-     try:
-         qwen_model, qwen_proc, qwen_dev = load_qwen_model_and_processor()
-         med_agent = MedicalVLMAgent(qwen_model, qwen_proc, qwen_dev)
-         qwen_available = True
-     except Exception as e:
-         print(f"Qwen model not available: {e}")
-         qwen_available = False
-         med_agent = None
-
-     with gr.Blocks(title="Medical AI Assistant") as demo:
-         gr.Markdown("# Combined Medical Q&A · SAM-2 Automatic Masking · CheXagent")
-
-         # Status information
-         with gr.Row():
-             gr.Markdown(f"""
-             **System Status:**
-             - Qwen VLM: {'✅ Available' if qwen_available else '❌ Not Available'}
-             - SAM-2: {'✅ Available' if SAM2_AVAILABLE else '❌ Not Available'}
-             - CheXagent: {'✅ Available' if CHEXAGENT_AVAILABLE else '❌ Not Available'}
-             """)
-
-         # Medical Q&A Tab
-         with gr.Tab("Medical Q&A"):
-             if qwen_available:
-                 q_in = gr.Textbox(label="Question / description", lines=3)
-                 q_img = gr.Image(label="Optional image", type="pil")
-                 q_btn = gr.Button("Submit")
-                 q_out = gr.Textbox(label="Answer")
-                 q_btn.click(fn=med_agent.run, inputs=[q_in, q_img], outputs=q_out)
-             else:
-                 gr.Markdown("❌ Medical Q&A is not available. Qwen model failed to load.")
-
-         # Segmentation Tab
-         with gr.Tab("Automatic masking"):
-             seg_img = gr.Image(label="Upload medical image", type="pil")
-             seg_btn = gr.Button("Run segmentation")
-             seg_out = gr.Image(label="Segmentation result", type="pil")
-             seg_status = gr.Textbox(label="Status", interactive=False)
-
-             if SAM2_AVAILABLE and _mask_generator is not None:
-                 seg_btn.click(
-                     fn=tumor_segmentation_interface,
-                     inputs=seg_img,
-                     outputs=[seg_out, seg_status],
-                 )
-             else:
-                 seg_btn.click(
-                     fn=simple_segmentation_fallback,
-                     inputs=seg_img,
-                     outputs=[seg_out, seg_status],
-                 )
-
-         # CheXagent Tabs
-         with gr.Tab("CheXagent – Structured report"):
-             if CHEXAGENT_AVAILABLE:
-                 gr.Markdown("Upload one or two chest X-ray images; the report streams live.")
-                 cx1 = gr.Image(label="Image 1", image_mode="L", type="pil")
-                 cx2 = gr.Image(label="Image 2", image_mode="L", type="pil")
-                 cx_report = gr.Markdown()
-                 gr.Interface(
-                     fn=response_report_generation,
-                     inputs=[cx1, cx2],
-                     outputs=cx_report,
-                     live=True,
-                 ).render()
-             else:
-                 gr.Markdown("❌ CheXagent structured report is not available.")
-
-         with gr.Tab("CheXagent – Visual grounding"):
-             if CHEXAGENT_AVAILABLE:
-                 vg_img = gr.Image(image_mode="L", type="pil")
-                 vg_prompt = gr.Textbox(value="Locate the highlighted finding:")
-                 vg_text = gr.Markdown()
-                 vg_out_img = gr.Image()
-                 gr.Interface(
-                     fn=response_phrase_grounding,
-                     inputs=[vg_img, vg_prompt],
-                     outputs=[vg_text, vg_out_img],
-                 ).render()
-             else:
-                 gr.Markdown("❌ CheXagent visual grounding is not available.")
-
-     return demo
-
- if __name__ == "__main__":
-     demo = create_ui()
-     demo.launch(server_name="0.0.0.0", server_port=7860, share=True)

  #!/usr/bin/env python
  """
+ post_analyzer_enhanced.py · Enhanced Post Analysis Tool
+ =======================================================
+
+ Analyzes images of posts by running YOLOv8 inference, applying spatial layout rules,
+ computing a nuanced confidence score, and detecting anomalies ("afwijking").
+ Generates JSON reports for image directories and for uploaded images.
+ Includes a SAM-2 alias patch for Hugging Face compatibility.
  """
+ from __future__ import annotations
+
+ import argparse
+ import json
  import sys
+ import os
  import subprocess
+ import tempfile
+ from pathlib import Path
+ from typing import List, Union
+ from datetime import datetime
+ from urllib.parse import urlparse
+
+ import cv2
+ import yaml
  import numpy as np
+ from dataclasses import dataclass
+ from ultralytics import YOLO
+ import requests
+ from PIL import Image
+ import io
+
+ # ───── Data Classes ──────────────────────────────────────────────────────────
+ @dataclass
+ class PostPart:
+     name: str
+     x: float            # normalized center x
+     y: float            # normalized center y
+     width: float
+     height: float
+     confidence: float = 1.0
+
+ @dataclass
+ class PostAnalysis:
+     image_path: Path
+     parts: List[PostPart]
+     anomalies: List[PostPart]
+     violations: List[str]
+     is_conform: bool
+     confidence_score: float
+
+ # ───── Configuration Load ────────────────────────────────────────────────────
+ def load_yaml_config(yaml_path: Path) -> dict:
+     if not yaml_path.exists():
+         sys.exit(f"Required {yaml_path} was not found – aborting.")
+     with yaml_path.open("r", encoding="utf-8") as fh:
+         data = yaml.safe_load(fh)
+     if "names" not in data:
+         sys.exit("'names' field missing in data.yaml – unable to continue.")
+     return {
+         "names": data["names"],
+         "class_to_name": {i: n for i, n in enumerate(data["names"])},
+         "name_to_class": {n: i for i, n in enumerate(data["names"])},
+     }
+
+ # ───── SAM-2 Alias Patch ─────────────────────────────────────────────────────
+ # Maps the sam_2 package to the sam2 namespace so sam2.* imports resolve
+ try:
+     import sam_2
+     import importlib
+     sys.modules['sam2'] = sam_2
+     for sub in ['build_sam', 'automatic_mask_generator', 'modeling.sam2_base']:
+         sys.modules[f'sam2.{sub}'] = importlib.import_module(f'sam_2.{sub}')
+ except ImportError:
+     pass
+
+ # ───── Dependency Checker & Installer (SAM-2) ────────────────────────────────
+ def check_and_install_sam2() -> tuple[bool, str]:
      try:
          from sam2.build_sam import build_sam2
          return True, "SAM-2 already available"
+     except ImportError:
+         # Clone if needed
+         if not os.path.exists("segment-anything-2"):
+             subprocess.run([
+                 "git", "clone",
+                 "https://github.com/facebookresearch/segment-anything-2.git"
+             ], check=True)
+         # Install editable
+         cwd = os.getcwd()
+         os.chdir("segment-anything-2")
+         subprocess.run([sys.executable, "-m", "pip", "install", "-e", "."], check=True)
+         os.chdir(cwd)
+         # Add to path and re-alias
+         path = os.path.abspath("segment-anything-2")
+         if path not in sys.path:
+             sys.path.insert(0, path)
          try:
+             import sam_2, importlib
+             sys.modules['sam2'] = sam_2
+             for sub in ['build_sam', 'automatic_mask_generator', 'modeling.sam2_base']:
+                 sys.modules[f'sam2.{sub}'] = importlib.import_module(f'sam_2.{sub}')
+         except ImportError:
+             return False, "SAM-2 import failed after install"
+         return True, "SAM-2 installed and aliased"

  SAM2_AVAILABLE, SAM2_STATUS = check_and_install_sam2()
  print(f"SAM-2 Status: {SAM2_STATUS}")
  if SAM2_AVAILABLE:
+     from sam2.build_sam import build_sam2
+     from sam2.automatic_mask_generator import SAM2AutomaticMaskGenerator
+     from sam2.modeling.sam2_base import SAM2Base
+
+ # ───── YOLO Inference ────────────────────────────────────────────────────────
+ def infer_parts(
+     img_path: Path,
+     model: YOLO,
+     class_info: dict,
+ ) -> tuple[List[PostPart], List[PostPart]]:
+     results = model(str(img_path))
+     parts, anomalies = [], []
+     for det in results[0].boxes:
+         # xywhn gives normalized center/size, matching the PostPart fields
+         # (plain xywh would return pixel units and break check_position)
+         x, y, w, h = det.xywhn[0].tolist()
+         cls_id = int(det.cls[0].item())
+         conf = float(det.conf[0].item())
+         name = class_info['class_to_name'].get(cls_id, f"unknown-{cls_id}")
+         part = PostPart(name, x, y, w, h, conf)
+         (anomalies if name == 'afwijking' else parts).append(part)
+     return parts, anomalies
+
+ # ───── Spatial Validation ────────────────────────────────────────────────────
+ def check_position(part: PostPart, img_w: int, img_h: int) -> bool:
+     cx, cy = part.x * img_w, part.y * img_h
+     w_px, h_px = part.width * img_w, part.height * img_h
+     if part.name == 'logo':
+         # the logo must sit entirely inside the top-right corner zone
+         return (cx - w_px / 2 >= 0.75 * img_w) and (cy + h_px / 2 <= 0.25 * img_h)
+     return True
+
+ def validate_layout(parts: List[PostPart], image_shape: tuple[int, int]) -> List[str]:
+     img_h, img_w = image_shape
+     return [f"{p.name} out of expected zone" for p in parts if not check_position(p, img_w, img_h)]
+
+ # ───── Confidence Scoring ────────────────────────────────────────────────────
+ def compute_confidence(
+     parts: List[PostPart], anomalies: List[PostPart], violations: List[str]
+ ) -> float:
+     base = sum(p.confidence for p in parts) / len(parts) if parts else 0.3
+     defect_penalty = min(0.1 * len(anomalies), 0.5)
+     layout_penalty = min(0.05 * len(violations), 0.3)
+     return max(0.0, base - defect_penalty - layout_penalty)
+
+ # ───── Core Analysis ─────────────────────────────────────────────────────────
+ def analyze_post(
+     img_path: Path, model: YOLO, class_info: dict, quiet: bool = False
+ ) -> PostAnalysis:
+     parts, anomalies = infer_parts(img_path, model, class_info)
+     img = cv2.imread(str(img_path))
+     if img is None:
+         sys.exit(f"Failed to read image {img_path}")
+     violations = validate_layout(parts, img.shape[:2])
+     score = compute_confidence(parts, anomalies, violations)
+     conform = not anomalies and not violations
+     if not quiet:
+         status = 'CONFORM' if conform else 'NON-CONFORM'
+         print(f"{img_path.name}: {status} | parts={len(parts)}, anomalies={len(anomalies)}, violations={len(violations)} | score={score:.2f}")
+     return PostAnalysis(img_path, parts, anomalies, violations, conform, score)
+
+ # ───── Reporting ─────────────────────────────────────────────────────────────
+ def write_analysis_report(analyses: List[PostAnalysis], output_dir: Path) -> Path:
+     output_dir.mkdir(parents=True, exist_ok=True)
+     report = []
+     for a in analyses:
+         report.append({
+             'image': str(a.image_path), 'is_conform': a.is_conform,
+             'confidence_score': a.confidence_score, 'violations': a.violations,
+             'parts': [vars(p) for p in a.parts], 'anomalies': [vars(d) for d in a.anomalies]
+         })
+     fp = output_dir / 'post_analysis.json'
+     with fp.open('w', encoding='utf-8') as f:
+         json.dump(report, f, indent=2)
+     return fp
+
+ # ───── Image Download Helper ─────────────────────────────────────────────────
+ def download_image(url: str) -> Union[Path, None]:
      try:
+         r = requests.get(url, timeout=10)
+         r.raise_for_status()
+         parsed = urlparse(url)
+         ext = Path(parsed.path).suffix.lower() or '.jpg'
+         tmp = tempfile.NamedTemporaryFile(delete=False, suffix=ext)
+         tmp.write(r.content)
+         tmp.close()
+         return Path(tmp.name)
      except Exception as e:
+         print(f"Download error for {url}: {e}")
+         return None
+
+ # ───── Process Uploaded Image ────────────────────────────────────────────────
+ def process_uploaded_image(
+     image_data: Union[str, bytes, Path], model: YOLO, class_info: dict,
+     output_dir: Path, quiet: bool = False
+ ) -> PostAnalysis:
+     tmp = None
      try:
+         if isinstance(image_data, str) and image_data.startswith(('http://', 'https://')):
+             tmp = download_image(image_data)
+             if tmp is None:
+                 sys.exit(f"Download failed: {image_data}")
+             img_path = tmp
+         elif isinstance(image_data, bytes):
+             img = Image.open(io.BytesIO(image_data))
+             fmt = (img.format or 'png').lower()
+             ext = f".{'jpg' if fmt == 'jpeg' else fmt}"
+             tmp = tempfile.NamedTemporaryFile(delete=False, suffix=ext)
+             tmp.write(image_data)
+             tmp.close()
+             img_path = Path(tmp.name)
+         else:
+             img_path = Path(image_data)
+             if not img_path.exists():
+                 sys.exit(f"File not found: {img_path}")
+         analysis = analyze_post(img_path, model, class_info, quiet)
+         out_fp = output_dir / f"analysis_{img_path.stem}.json"
+         with out_fp.open('w', encoding='utf-8') as f:
+             json.dump({
+                 'image': str(img_path), 'is_conform': analysis.is_conform,
+                 'confidence_score': analysis.confidence_score, 'violations': analysis.violations,
+                 'parts': [vars(p) for p in analysis.parts], 'anomalies': [vars(d) for d in analysis.anomalies]
+             }, f, indent=2)
+         return analysis
+     finally:
+         # tmp is a Path for downloads and a NamedTemporaryFile for byte uploads
+         tmp_path = tmp if isinstance(tmp, Path) else (Path(tmp.name) if tmp else None)
+         if tmp_path and tmp_path.exists():
+             os.remove(tmp_path)
+
+ # ───── Process Directory & Uploads ───────────────────────────────────────────
+ def process_directory(images_dir: Path, output_dir: Path, data_yaml: Path, weights: str, quiet: bool = False):
+     ci = load_yaml_config(data_yaml)
+     model = YOLO(weights)
+     imgs = [p for p in images_dir.iterdir() if p.suffix.lower() in ['.jpg', '.jpeg', '.png']]
+     if not imgs:
+         sys.exit("No images found.")
+     output_dir.mkdir(parents=True, exist_ok=True)
+     analyses = [analyze_post(img, model, ci, quiet) for img in imgs]
+     rpt = write_analysis_report(analyses, output_dir)
+     print(f"Report written to {rpt}")
+
+ def process_uploaded_images(images: List[Union[str, bytes, Path]], output_dir: Path, data_yaml: Path, weights: str, quiet: bool = False):
+     ci = load_yaml_config(data_yaml)
+     model = YOLO(weights)
+     output_dir.mkdir(parents=True, exist_ok=True)
+     analyses = []
+     for img in images:
+         try:
+             analyses.append(process_uploaded_image(img, model, ci, output_dir, quiet))
+         except Exception as e:
+             print(f"Error: {e}")
+     print(f"Processed {len(analyses)} uploads.")
+     return analyses
+
+ # ───── CLI Entrypoint ────────────────────────────────────────────────────────
+ def main(argv=None):
+     p = argparse.ArgumentParser(description="Enhanced post analysis tool")
+     p.add_argument("--images", type=Path, help="Directory of images")
+     p.add_argument("--upload", nargs="+", help="URLs or file paths to analyze")
+     p.add_argument("--output", type=Path, default=Path("post_analysis_results"))
+     p.add_argument("--data", type=Path, default=Path("data.yaml"))
+     p.add_argument("--weights", type=str, default="yolov8n.pt")
+     p.add_argument("-q", "--quiet", action="store_true")
+     args = p.parse_args(argv)
+     if args.upload:
+         process_uploaded_images(args.upload, args.output, args.data, args.weights, args.quiet)
+     elif args.images:
+         process_directory(args.images, args.output, args.data, args.weights, args.quiet)
      else:
+         p.error("Specify --images or --upload")
+
+ if __name__ == "__main__":
+     main()
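A quick sanity check of the new scoring rule may help reviewers: compute_confidence() uses the mean detection confidence as the base score (0.3 when nothing is detected), subtracts 0.1 per anomaly capped at 0.5 and 0.05 per layout violation capped at 0.3, and clamps the result at zero. A minimal sketch of that arithmetic, with hypothetical detections:

    # Worked example of the rule in compute_confidence(); all numbers are hypothetical.
    parts_conf = [0.90, 0.80, 0.70]                # confidences of three detected parts
    n_anomalies = 1                                # one "afwijking" box
    n_violations = 2                               # two parts outside their expected zones
    base = sum(parts_conf) / len(parts_conf)       # 0.80
    score = max(0.0, base
                - min(0.1 * n_anomalies, 0.5)      # defect penalty: 0.10
                - min(0.05 * n_violations, 0.3))   # layout penalty: 0.10
    print(f"score = {score:.2f}")                  # score = 0.60

Since main() takes an optional argv list, the CLI can also be exercised from Python, e.g. main(["--images", "posts", "--weights", "yolov8n.pt"]), where posts/ is a hypothetical image directory and data.yaml is found via the default.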
256