Theivaprakasham Hari committed on
Commit
e71a089
·
1 Parent(s): 4edafab

first commit

Browse files
app.py ADDED
@@ -0,0 +1,199 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
import gradio as gr
import numpy as np
from PIL import Image
from ultralytics import YOLO
import cv2
from pathlib import Path
import xml.etree.ElementTree as ET
import tempfile
import zipfile

# Base path for model files (the directory containing this script).
path = Path(__file__).parent

# Model configurations.
# For each selectable season form:
#   "path"   - YOLO pose checkpoint (.pt) relative to this script,
#   "labels" - ordered keypoint names: index i in this list names keypoint i
#              of the model's output (wing landmarks F*/H*, spots fs*/hs*,
#              scale points sc*, plus reference markers),
#   "imgsz"  - inference image size passed to the model.
MODEL_CONFIGS = {
    "Dry Season Form": {
        "path": path / "models/DSF_Mleda_250.pt",
        "labels": [
            "F1", "F2", "F3", "F4", "F5", "F6", "F7", "F8", "F9", "F10", "F11", "F12", "F13", "F14", "F15", "F16",
            "H1", "H2", "H3", "H4", "H5", "H6", "H7", "H8", "H9", "H10", "H11", "H12", "H13", "H14", "H15", "H16", "H17",
            "fs1", "fs2", "fs3", "fs4", "fs5",
            "hs1", "hs2", "hs3", "hs4", "hs5", "hs6",
            "sc1", "sc2",
            "sex", "right", "left", "grey", "black", "white"
        ],
        "imgsz": 1280
    },
    "Wet Season Form": {
        "path": path / "models/WSF_Mleda_200.pt",
        "labels": [
            'F12', 'F14', 'fs1', 'fs2', 'fs3', 'fs4', 'fs5',
            'H12', 'H14', 'hs1', 'hs2', 'hs3', 'hs4', 'hs5', 'hs6',
            'white', 'black', 'grey', 'sex', 'blue', 'green', 'red', 'sc1', 'sc2'
        ],
        "imgsz": 1280
    },
    "All Season Form": {
        "path": path / "models/DSF_WSF_Mleda_450.pt",
        "labels": [
            "F1", "F2", "F3", "F4", "F5", "F6", "F7", "F8", "F9", "F10", "F11", "F12", "F13", "F14", "F15", "F16",
            "H1", "H2", "H3", "H4", "H5", "H6", "H7", "H8", "H9", "H10", "H11", "H12", "H13", "H14", "H15", "H16", "H17",
            "fs1", "fs2", "fs3", "fs4", "fs5",
            "hs1", "hs2", "hs3", "hs4", "hs5", "hs6",
            "sc1", "sc2",
            "sex", "right", "left", "grey", "black", "white"
        ],
        "imgsz": 1280
    }
}

# Directory for XML annotations, created under the system temp dir.
# NOTE(review): files accumulate here across app runs; presumably acceptable
# for a temp dir, but confirm if stale annotations could leak between users.
ANNOTATIONS_DIR = Path(tempfile.gettempdir()) / "annotations"
ANNOTATIONS_DIR.mkdir(parents=True, exist_ok=True)
54
+
55
+
56
def hex_to_bgr(hex_color: str) -> tuple:
    """Convert a '#RRGGBB' hex color string into an OpenCV BGR tuple.

    Falls back to green (0, 255, 0) when the string is not exactly six
    hex digits after stripping a leading '#'.
    """
    digits = hex_color.lstrip("#")
    if len(digits) != 6:
        # Invalid or shorthand input -> default to green.
        return (0, 255, 0)
    r, g, b = (int(digits[i:i + 2], 16) for i in (0, 2, 4))
    return (b, g, r)
65
+
66
+
67
def load_model(path: Path):
    """Instantiate and return a YOLO model from *path* (a .pt checkpoint)."""
    checkpoint = str(path)
    return YOLO(checkpoint)
70
+
71
+
72
def draw_detections(image: np.ndarray, results, labels, keypoint_threshold: float,
                    show_labels: bool, point_size: int, point_color: str,
                    label_size: float) -> np.ndarray:
    """Render YOLO pose results onto a copy of *image* (BGR, uint8).

    For each detection: draws a cyan bounding box with a class/confidence
    caption, then a filled circle (and, optionally, a text label) at every
    keypoint whose visibility score exceeds *keypoint_threshold*.
    Returns the annotated copy; the input image is left untouched.
    """
    canvas = image.copy()
    bgr = hex_to_bgr(point_color)

    for result in results:
        xywh = result.boxes.xywh.cpu().numpy()
        classes = result.boxes.cls.int().cpu().numpy()
        scores = result.boxes.conf.cpu().numpy()
        keypoint_sets = result.keypoints.data.cpu().numpy()

        for box, cls_id, score, kpts in zip(xywh, classes, scores, keypoint_sets):
            x_c, y_c, w, h = box
            # Convert center/size box to integer corner coordinates.
            x1, y1 = int(x_c - w / 2), int(y_c - h / 2)
            x2, y2 = int(x_c + w / 2), int(y_c + h / 2)

            cv2.rectangle(canvas, (x1, y1), (x2, y2), (255, 255, 0), 2)
            caption = f"{result.names[int(cls_id)]} {score:.2f}"
            (tw, th), _ = cv2.getTextSize(caption, cv2.FONT_HERSHEY_SIMPLEX, 0.6, 1)
            # Filled background strip so the caption stays readable.
            cv2.rectangle(canvas, (x1, y1 - th - 4), (x1 + tw, y1), (255, 255, 0), cv2.FILLED)
            cv2.putText(canvas, caption, (x1, y1 - 4), cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 0, 0), 1)

            for idx, (kx, ky, vis) in enumerate(kpts):
                # Skip low-visibility keypoints and indices beyond the label list.
                if vis > keypoint_threshold and idx < len(labels):
                    px, py = int(kx), int(ky)
                    cv2.circle(canvas, (px, py), int(point_size), bgr, -1)
                    if show_labels:
                        cv2.putText(canvas, labels[idx], (px + 3, py + 3),
                                    cv2.FONT_HERSHEY_SIMPLEX, label_size, (255, 0, 0), 2)
    return canvas
103
+
104
+
105
def generate_xml(filename: str, width: int, height: int, keypoints: list[tuple[float, float, str]]):
    """Write one XML annotation file for *filename* and return its path.

    The document root is <annotations> containing a single <image> element
    (filename plus pixel dimensions); each keypoint becomes a <point> child
    with a sequential id, its coordinates, and its label. The file is saved
    as '<stem>.xml' inside ANNOTATIONS_DIR, overwriting any previous one.
    """
    root = ET.Element("annotations")
    image_el = ET.SubElement(root, "image", filename=filename,
                             width=str(width), height=str(height))
    for idx, (px, py, label) in enumerate(keypoints):
        ET.SubElement(image_el, "point", id=str(idx), x=str(px), y=str(py), label=label)

    out_path = ANNOTATIONS_DIR / f"{Path(filename).stem}.xml"
    ET.ElementTree(root).write(str(out_path), encoding="utf-8", xml_declaration=True)
    return out_path
118
+
119
+
120
def process_images(image_list, conf_threshold: float, keypoint_threshold: float,
                   model_choice: str, show_labels: bool, point_size: int,
                   point_color: str, label_size: float):
    """Run pose inference on a batch of uploaded images.

    For each image: runs the selected YOLO model, draws the detections,
    writes an XML annotation of the visible keypoints, and finally packages
    every XML into a single ZIP archive.

    Returns (annotated PIL images, newline-joined XML paths, ZIP path).
    """
    model_cfg = MODEL_CONFIGS[model_choice]
    model = load_model(model_cfg["path"])
    labels = model_cfg["labels"]
    imgsz = model_cfg["imgsz"]

    # Gradio passes None when the user submits without uploading any file;
    # treat that as an empty batch instead of crashing on iteration.
    image_list = image_list or []

    output_images = []
    xml_paths = []

    for file_obj in image_list:
        # Older Gradio versions deliver dicts with 'name'/'orig_name';
        # newer ones deliver file wrappers exposing a .name attribute.
        if isinstance(file_obj, dict):
            tmp_path = Path(file_obj['name'])
            orig_name = Path(file_obj['orig_name']).name
        else:
            tmp_path = Path(file_obj.name)
            orig_name = tmp_path.name

        # Context manager closes the underlying file handle promptly
        # (the original leaked one handle per image).
        with Image.open(tmp_path) as img:
            img_rgb = np.array(img.convert("RGB"))
        img_bgr = cv2.cvtColor(img_rgb, cv2.COLOR_RGB2BGR)
        height, width = img_bgr.shape[:2]

        results = model(img_bgr, conf=conf_threshold, imgsz=imgsz)
        annotated = draw_detections(img_bgr, results, labels,
                                    keypoint_threshold, show_labels,
                                    point_size, point_color, label_size)
        output_images.append(Image.fromarray(cv2.cvtColor(annotated, cv2.COLOR_BGR2RGB)))

        # Collect keypoints above the visibility threshold for the XML;
        # indices beyond the label list fall back to generic "kp{i}" names.
        keypoints = []
        for res in results:
            for kpts in res.keypoints.data.cpu().numpy():
                for i, (x, y, v) in enumerate(kpts):
                    if v > keypoint_threshold:
                        keypoints.append((float(x), float(y),
                                          labels[i] if i < len(labels) else f"kp{i}"))

        xml_paths.append(generate_xml(orig_name, width, height, keypoints))

    # Create a ZIP of all XMLs under an 'annotations/' folder.
    zip_path = Path(tempfile.gettempdir()) / "xml_annotations.zip"
    with zipfile.ZipFile(zip_path, 'w') as zipf:
        for p in xml_paths:
            arcname = Path('annotations') / p.name
            zipf.write(str(p), arcname.as_posix())

    xml_list_str = "\n".join(str(p) for p in xml_paths)
    return output_images, xml_list_str, str(zip_path)
172
+
173
+ # Gradio Interface
174
def main():
    """Build and launch the Gradio batch-annotation interface."""
    iface = gr.Interface(
        fn=process_images,
        inputs=[
            gr.File(file_types=["image"], file_count="multiple", label="Upload Images"),
            gr.Slider(minimum=0.0, maximum=1.0, value=0.25, step=0.01, label="Confidence Threshold"),
            gr.Slider(minimum=0.0, maximum=1.0, value=0.5, step=0.01, label="Keypoint Visibility Threshold"),
            gr.Radio(choices=list(MODEL_CONFIGS.keys()), label="Select Model", value="Dry Season Form"),
            gr.Checkbox(label="Show Keypoint Labels", value=True),
            gr.Slider(minimum=1, maximum=20, value=8, step=1, label="Keypoint Size"),
            gr.ColorPicker(label="Keypoint Color", value="#00FF00"),
            gr.Slider(minimum=0.3, maximum=3.0, value=1.0, step=0.1, label="Keypoint Label Font Size")
        ],
        outputs=[
            gr.Gallery(label="Detection Results"),
            gr.Textbox(label="Generated XML Paths"),
            gr.File(label="Download All XMLs as ZIP")
        ],
        title="🦋 Melanitis leda Landmark Batch Annotator",
        description="Upload multiple images. It annotates each with keypoints and packages XMLs in a ZIP archive.",
        # 'allow_flagging' is deprecated in Gradio 4.x and replaced by
        # 'flagging_mode' in Gradio 5.x (requirements pin gradio==5.29.0).
        flagging_mode="never"
    )
    iface.launch()

if __name__ == "__main__":
    main()
models/DSF_Mleda_250.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b51ea730cb1c03399bc7d1de9fe51ca6f531af0d29c3064de9638a4a8ec701c
3
+ size 56864045
models/DSF_WSF_Mleda_450.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59cd20c486514ff18080413657d784f76c95937db5d5f6fa8cfae1f95b24951a
3
+ size 56674033
models/WSF_Mleda_200.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33b8298a9121ae3ccf5b5d5aff000d6dddda6f6e1c3e35a09f1215b8f53dd47c
3
+ size 53621489
requirements.txt ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ultralytics==8.3.88
2
+ torch==2.6.0
3
+ torchvision==0.21.0
4
+ pycocotools==2.0.7
5
+ PyYAML==6.0.1
6
+ scipy==1.15.2
7
+ gradio==5.29.0
8
+ numpy==1.26.4
9
+ psutil==5.9.8
10
+ py-cpuinfo==9.0.0
11
+ safetensors==0.4.3
12
+ pillow==11.1.0
13
+ opencv-python==4.11.0.86
14
+ opencv-python-headless==4.11.0.86