Spaces:

Ultralytics
/

YOLOv8

Running

App Files Files Community

RizwanMunawar committed on Sep 29, 2024

Commit

783e9d0

1 Parent(s): 8ff935e

add support for video inference

Browse files

Files changed (1) hide show

app.py +58 -8

app.py CHANGED Viewed

@@ -1,11 +1,12 @@
 import gradio as gr
 import PIL.Image as Image
 from ultralytics import ASSETS, YOLO
 model = YOLO("yolov8n.pt")
 def predict_image(img, conf_threshold, iou_threshold):
     """Predicts objects in an image using a YOLOv8 model with adjustable confidence and IOU thresholds."""
     results = model.predict(
@@ -23,19 +24,68 @@ def predict_image(img, conf_threshold, iou_threshold):
     return im
 iface = gr.Interface(
-    fn=predict_image,
     inputs=[
-        gr.Image(type="pil", label="Upload Image"),
         gr.Slider(minimum=0, maximum=1, value=0.25, label="Confidence threshold"),
         gr.Slider(minimum=0, maximum=1, value=0.45, label="IoU threshold"),
     ],
-    outputs=gr.Image(type="pil", label="Result"),
     title="Ultralytics Gradio Application 🚀",
-    description="Upload images for inference. The Ultralytics YOLOv8n model is used by default.",
     examples=[
-        [ASSETS / "bus.jpg", 0.25, 0.45],
-        [ASSETS / "zidane.jpg", 0.25, 0.45],
     ],
 )
 iface.launch(share=True)

 import gradio as gr
 import PIL.Image as Image
+import tempfile
+import cv2
 from ultralytics import ASSETS, YOLO
+# Load YOLOv8 model
 model = YOLO("yolov8n.pt")
 def predict_image(img, conf_threshold, iou_threshold):
     """Predicts objects in an image using a YOLOv8 model with adjustable confidence and IOU thresholds."""
     results = model.predict(
     return im
def predict_video(video, conf_threshold, iou_threshold):
    """Run YOLOv8 detection on every frame of a video and write an annotated copy.

    Args:
        video: Input video handed directly to ``cv2.VideoCapture`` (presumably a
            file path supplied by the Gradio video component; confirm against caller).
        conf_threshold: Value forwarded to ``model.predict`` as ``conf``.
        iou_threshold: Value forwarded to ``model.predict`` as ``iou``.

    Returns:
        str: Path of a temporary ``.mp4`` file containing the annotated frames.
        The file is created with ``delete=False`` and is not removed here.

    Raises:
        ValueError: If ``video`` is ``None`` or the capture cannot be opened.
    """
    if video is None:
        raise ValueError("No video provided.")

    cap = cv2.VideoCapture(video)
    out = None
    try:
        if not cap.isOpened():
            raise ValueError(f"Could not open video: {video}")

        # Get video properties
        width = int(cap.get(cv2.CAP_PROP_FRAME_WIDTH))
        height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
        # Keep the frame rate as a float (e.g. 29.97) so the output duration does
        # not drift; fall back to 30 when the container reports 0 or NaN.
        fps = cap.get(cv2.CAP_PROP_FPS)
        if not fps > 0:
            fps = 30.0

        # Reserve the output path only after the input is known to be readable.
        # Leaving the ``with`` block closes the handle so the writer can reopen it.
        with tempfile.NamedTemporaryFile(suffix=".mp4", delete=False) as temp_output:
            output_path = temp_output.name

        # Set up VideoWriter to save output video
        out = cv2.VideoWriter(output_path, cv2.VideoWriter_fourcc(*"mp4v"), fps, (width, height))

        while True:
            ret, frame = cap.read()
            if not ret:
                break
            # Perform inference on each frame
            results = model.predict(
                source=frame,
                conf=conf_threshold,
                iou=iou_threshold,
                show_labels=True,
                show_conf=True,
                imgsz=640,
            )
            # A single frame yields a single result; draw it on the frame
            if results:
                frame = results[0].plot()
            # Write the frame to the output video
            out.write(frame)
    finally:
        # Release resources even when inference or decoding fails midway
        cap.release()
        if out is not None:
            out.release()
    return output_path
# Create a Gradio interface with support for both images and videos
def _predict_media(video, img, conf_threshold, iou_threshold, is_video):
    """Dispatch to video or image inference based on the "Is Video?" checkbox.

    The parameters follow the order of the interface's input components.
    Returns an ``(image, video)`` pair matching the two output components;
    the slot that was not requested is ``None``.
    """
    if is_video:
        return None, predict_video(video, conf_threshold, iou_threshold)
    return predict_image(img, conf_threshold, iou_threshold), None


iface = gr.Interface(
    fn=_predict_media,
    inputs=[
        gr.Video(label="Upload Video"),
        gr.Image(type="pil", label="Upload Image"),
        gr.Slider(minimum=0, maximum=1, value=0.25, label="Confidence threshold"),
        gr.Slider(minimum=0, maximum=1, value=0.45, label="IoU threshold"),
        gr.Checkbox(value=False, label="Is Video?"),
    ],
    # Components are fixed when the interface is built, so both result types are
    # declared up front and the handler fills whichever one applies.
    outputs=[
        gr.Image(type="pil", label="Result Image"),
        gr.Video(label="Result Video"),
    ],
    title="Ultralytics Gradio Application 🚀",
    description="Upload images or videos for inference. The Ultralytics YOLOv8n model is used by default.",
    # One value per input component: video, image, conf, iou, is_video
    examples=[
        [None, ASSETS / "bus.jpg", 0.25, 0.45, False],
        [None, ASSETS / "zidane.jpg", 0.25, 0.45, False],
    ],
)
iface.launch(share=True)