tarinmodel4

Sleeping

App Files Community

nagasurendra committed on Jun 13

Commit

d552a3c

verified ·

1 Parent(s): 7a25fd2

Update app.py

Browse files

Files changed (1) hide show

app.py +59 -17

app.py CHANGED Viewed

@@ -3,6 +3,7 @@ import torch
 import gradio as gr
 import numpy as np
 from ultralytics import YOLO, __version__ as ultralytics_version
 # Debug: Check environment
 print(f"Torch version: {torch.__version__}")
@@ -10,16 +11,20 @@ print(f"Gradio version: {gr.__version__}")
 print(f"Ultralytics version: {ultralytics_version}")
 print(f"CUDA available: {torch.cuda.is_available()}")
-# Load YOLOv8 model
 device = "cuda" if torch.cuda.is_available() else "cpu"
 print(f"Using device: {device}")
 model = YOLO('./data/best.pt').to(device)
-def process_video(video):
     if video is None:
         return "Error: No video uploaded"
-    # Open the input video
     cap = cv2.VideoCapture(video)
     if not cap.isOpened():
         return "Error: Could not open video file"
@@ -29,17 +34,20 @@ def process_video(video):
     frame_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
     fps = cap.get(cv2.CAP_PROP_FPS)
     total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
-    # Use original resolution to avoid resizing issues (optional: keep 320x240 if needed)
-    # frame_width, frame_height = 320, 240
-    print(f"Input video: {frame_width}x{frame_height}, {fps} FPS, {total_frames} frames")
     # Set up video writer
     output_path = "processed_output.mp4"
-    fourcc = cv2.VideoWriter_fourcc(*'mp4v')
-    out = cv2.VideoWriter(output_path, fourcc, fps, (frame_width, frame_height))
     frame_count = 0
     while True:
         ret, frame = cap.read()
@@ -47,31 +55,65 @@ def process_video(video):
             break
         frame_count += 1
         print(f"Processing frame {frame_count}/{total_frames}")
-        # Optional: Resize if needed (remove if using original resolution)
-        # frame = cv2.resize(frame, (frame_width, frame_height))
-        # Run YOLOv8 inference
-        results = model(frame)
         annotated_frame = results[0].plot()
-        # Write the annotated frame to the output video
         out.write(annotated_frame)
     # Release resources
     cap.release()
     out.release()
-    print(f"Output video saved as {output_path}")
     return output_path
 # Gradio interface
 iface = gr.Interface(
     fn=process_video,
-    inputs=gr.Video(label="Upload Video"),
     outputs=gr.Video(label="Processed Video"),
-    title="YOLOv8 Object Detection",
-    description="Upload a short video for object detection"
 )
 if __name__ == "__main__":

 import gradio as gr
 import numpy as np
 from ultralytics import YOLO, __version__ as ultralytics_version
+import time
 # Debug: Check environment
 print(f"Torch version: {torch.__version__}")
 print(f"Ultralytics version: {ultralytics_version}")
 print(f"CUDA available: {torch.cuda.is_available()}")
+# Load custom YOLO model
 device = "cuda" if torch.cuda.is_available() else "cpu"
 print(f"Using device: {device}")
 model = YOLO('./data/best.pt').to(device)
+print(f"Model classes: {model.names}")  # Print classes (should include cracks, potholes)
+def process_video(video, resize_width=640, resize_height=480, frame_skip=1):
     if video is None:
         return "Error: No video uploaded"
+    # Start timer
+    start_time = time.time()
+    # Open input video
     cap = cv2.VideoCapture(video)
     if not cap.isOpened():
         return "Error: Could not open video file"
     frame_height = int(cap.get(cv2.CAP_PROP_FRAME_HEIGHT))
     fps = cap.get(cv2.CAP_PROP_FPS)
     total_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
+    expected_duration = total_frames / fps
+    print(f"Input video: {frame_width}x{frame_height}, {fps} FPS, {total_frames} frames, {expected_duration:.2f} seconds")
+    # Set output resolution
+    out_width, out_height = resize_width, resize_height
+    print(f"Output resolution: {out_width}x{out_height}")
     # Set up video writer
     output_path = "processed_output.mp4"
+    fourcc = cv2.VideoWriter_fourcc(*'mp4v')  # Use 'H264' if mp4v fails
+    out = cv2.VideoWriter(output_path, fourcc, fps, (out_width, out_height))
     frame_count = 0
+    processed_frames = 0
     while True:
         ret, frame = cap.read()
             break
         frame_count += 1
+        # Skip frames if frame_skip > 1
+        if frame_count % frame_skip != 0:
+            continue
+        processed_frames += 1
         print(f"Processing frame {frame_count}/{total_frames}")
+        # Resize frame for faster inference
+        frame = cv2.resize(frame, (out_width, out_height))
+        # Run YOLO inference (detect cracks and potholes)
+        results = model(frame, verbose=False, conf=0.5)  # Confidence threshold 0.5
         annotated_frame = results[0].plot()
+        # Log detections
+        for detection in results[0].boxes:
+            cls = int(detection.cls)
+            conf = float(detection.conf)
+            print(f"Frame {frame_count}: Detected {model.names[cls]} with confidence {conf:.2f}")
+        # Write annotated frame
         out.write(annotated_frame)
+        # Duplicate frames if skipping to maintain duration
+        if frame_skip > 1:
+            for _ in range(frame_skip - 1):
+                if frame_count + 1 <= total_frames:
+                    out.write(annotated_frame)
+                    frame_count += 1
     # Release resources
     cap.release()
     out.release()
+    # Verify output duration
+    cap = cv2.VideoCapture(output_path)
+    output_frames = int(cap.get(cv2.CAP_PROP_FRAME_COUNT))
+    output_fps = cap.get(cv2.CAP_PROP_FPS)
+    output_duration = output_frames / output_fps
+    cap.release()
+    print(f"Output video: {output_frames} frames, {output_fps} FPS, {output_duration:.2f} seconds")
+    print(f"Processing time: {time.time() - start_time:.2f} seconds")
     return output_path
 # Gradio interface
 iface = gr.Interface(
     fn=process_video,
+    inputs=[
+        gr.Video(label="Upload Video"),
+        gr.Slider(minimum=320, maximum=1280, value=640, label="Output Width", step=1),
+        gr.Slider(minimum=240, maximum=720, value=480, label="Output Height", step=1),
+        gr.Slider(minimum=1, maximum=5, value=1, label="Frame Skip (1 = process all frames)", step=1)
+    ],
     outputs=gr.Video(label="Processed Video"),
+    title="Crack and Pothole Detection with YOLO",
+    description="Upload a video to detect cracks and potholes. Adjust resolution and frame skip for faster processing."
 )
 if __name__ == "__main__":