Spaces:

Aumkeshchy2003
/

Object_Detection

Sleeping

App Files Files Community

Aumkeshchy2003 committed on Feb 22

Commit

b5a364c

verified ·

1 Parent(s): ab96246

Update app.py

Browse files

Files changed (1) hide show

app.py +47 -10

app.py CHANGED Viewed

@@ -2,49 +2,86 @@ import torch
 import numpy as np
 import gradio as gr
 from PIL import Image
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
 model = torch.hub.load('ultralytics/yolov5', 'yolov5s', pretrained=True).to(device)
 model.conf = 0.5
 if device.type == 'cuda':
     model.half()
-def process_frame(image):
-    if image is None:
-        print("No image received!")
         return None
     try:
         print("Processing frame...")
-        image_pil = Image.fromarray(image)
         with torch.no_grad():
             results = model(image_pil)
         rendered_images = results.render()
-        processed_image = np.array(rendered_images[0]) if rendered_images else image
         print("Frame processed successfully!")
         return processed_image
     except Exception as e:
         print(f"Processing error: {e}")
         return image
 with gr.Blocks(title="Real-Time Object Detection") as app:
     gr.Markdown("# Real-Time Object Detection with Dual Input")
     with gr.Tabs():
         with gr.TabItem("📷 Live Camera"):
             with gr.Row():
-                webcam_input = gr.Image(source="webcam", streaming=True, label="Live Feed")  # ✅ FIXED
                 live_output = gr.Image(label="Processed Feed")
-            webcam_input.stream(process_frame, inputs=webcam_input, outputs=live_output)  # ✅ FIXED
         with gr.TabItem("🖼️ Image Upload"):
             with gr.Row():
                 upload_input = gr.Image(type="numpy", label="Upload Image")
                 upload_output = gr.Image(label="Detection Result")
-            upload_input.change(process_frame, upload_input, upload_output)
 app.queue().launch(server_name="0.0.0.0", server_port=7860, share=False)

 import numpy as np
 import gradio as gr
 from PIL import Image
+import cv2
+# Run on the GPU when CUDA is available; otherwise fall back to the CPU
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+# Load the pretrained YOLOv5s model from the ultralytics/yolov5 hub repo and move it to the device
 model = torch.hub.load('ultralytics/yolov5', 'yolov5s', pretrained=True).to(device)
+# Set model confidence threshold
 model.conf = 0.5
 if device.type == 'cuda':
     model.half()  # switch the model to half precision, on CUDA only
+def process_frame(video):
+    """Reads a frame from the webcam video stream and applies YOLOv5 detection."""
+    cap = cv2.VideoCapture(video)  # Open the webcam stream
+    if not cap.isOpened():
+        print("Error: Could not open video stream.")
         return None
+    ret, frame = cap.read()
+    cap.release()
+    if not ret:
+        print("Error: Could not read frame.")
+        return None
     try:
         print("Processing frame...")
+        image_pil = Image.fromarray(cv2.cvtColor(frame, cv2.COLOR_BGR2RGB))
         with torch.no_grad():
             results = model(image_pil)
         rendered_images = results.render()
+        processed_image = np.array(rendered_images[0]) if rendered_images else frame
         print("Frame processed successfully!")
         return processed_image
     except Exception as e:
         print(f"Processing error: {e}")
+        return frame
+def process_uploaded_image(image):
+    """Processes the uploaded image and applies YOLOv5 object detection."""
+    if image is None:
+        return None
+    try:
+        image_pil = Image.fromarray(image)
+        with torch.no_grad():
+            results = model(image_pil)
+        rendered_images = results.render()
+        return np.array(rendered_images[0]) if rendered_images else image
+    except Exception as e:
+        print(f"Error processing image: {e}")
         return image
+# Create Gradio UI
 with gr.Blocks(title="Real-Time Object Detection") as app:
     gr.Markdown("# Real-Time Object Detection with Dual Input")
     with gr.Tabs():
+        # 📷 Live Webcam Tab
         with gr.TabItem("📷 Live Camera"):
             with gr.Row():
+                webcam_input = gr.Video(label="Live Feed")
                 live_output = gr.Image(label="Processed Feed")
+            webcam_input.stream(process_frame, inputs=webcam_input, outputs=live_output)
+        # 🖼️ Image Upload Tab (With Submit Button)
         with gr.TabItem("🖼️ Image Upload"):
             with gr.Row():
                 upload_input = gr.Image(type="numpy", label="Upload Image")
+                submit_button = gr.Button("Submit")
                 upload_output = gr.Image(label="Detection Result")
+            submit_button.click(process_uploaded_image, inputs=upload_input, outputs=upload_output)
 app.queue().launch(server_name="0.0.0.0", server_port=7860, share=False)