tarinmodel10

Running

App Files Files Community

nagasurendra commited on Jun 16

Commit

5a2600a

verified ·

1 Parent(s): 77ce6a0

Update app.py

Browse files

Files changed (1) hide show

app.py +133 -45

app.py CHANGED Viewed

@@ -1,3 +1,5 @@
 import cv2
 import torch
 import gradio as gr
@@ -12,13 +14,15 @@ from typing import List, Dict, Any, Optional
 from ultralytics import YOLO
 import ultralytics
 import time
 # Set YOLO config directory
 os.environ["YOLO_CONFIG_DIR"] = "/tmp/Ultralytics"
 # Set up logging
 logging.basicConfig(
-    filename="app.log",
     level=logging.INFO,
     format="%(asctime)s - %(levelname)s - %(message)s"
 )
@@ -26,10 +30,13 @@ logging.basicConfig(
 # Directories
 CAPTURED_FRAMES_DIR = "captured_frames"
 OUTPUT_DIR = "outputs"
 os.makedirs(CAPTURED_FRAMES_DIR, exist_ok=True)
 os.makedirs(OUTPUT_DIR, exist_ok=True)
 os.chmod(CAPTURED_FRAMES_DIR, 0o777)
 os.chmod(OUTPUT_DIR, 0o777)
 # Global variables
 log_entries: List[str] = []
@@ -40,6 +47,24 @@ last_metrics: Dict[str, Any] = {}
 frame_count: int = 0
 SAVE_IMAGE_INTERVAL = 1  # Save every frame with detections
 # Debug: Check environment
 print(f"Torch version: {torch.__version__}")
 print(f"Gradio version: {gr.__version__}")
@@ -49,14 +74,13 @@ print(f"CUDA available: {torch.cuda.is_available()}")
 # Load custom YOLO model
 device = "cuda" if torch.cuda.is_available() else "cpu"
 print(f"Using device: {device}")
-model = YOLO('./data/best.pt').to(device)
 if device == "cuda":
     model.half()  # Use half-precision (FP16)
 print(f"Model classes: {model.names}")
-# Mock service functions
 def generate_map(gps_coords: List[List[float]], items: List[Dict[str, Any]]) -> str:
-    map_path = "map_temp.png"
     plt.figure(figsize=(4, 4))
     plt.scatter([x[1] for x in gps_coords], [x[0] for x in gps_coords], c='blue', label='GPS Points')
     plt.title("Issue Locations Map")
@@ -67,16 +91,56 @@ def generate_map(gps_coords: List[List[float]], items: List[Dict[str, Any]]) ->
     plt.close()
     return map_path
-def send_to_salesforce(data: Dict[str, Any]) -> None:
-    pass  # Minimal mock
 def update_metrics(detections: List[Dict[str, Any]]) -> Dict[str, Any]:
     counts = Counter([det["label"] for det in detections])
-    return {
         "items": [{"type": k, "count": v} for k, v in counts.items()],
         "total_detections": len(detections),
-        "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M:%S")
     }
 def generate_line_chart() -> Optional[str]:
     if not detected_counts:
@@ -88,13 +152,12 @@ def generate_line_chart() -> Optional[str]:
     plt.ylabel("Count")
     plt.grid(True)
     plt.tight_layout()
-    chart_path = "chart_temp.png"
     plt.savefig(chart_path)
     plt.close()
     return chart_path
-def process_video(video, resize_width=320, resize_height=240, frame_skip=5):
     global frame_count, last_metrics, detected_counts, detected_issues, gps_coordinates, log_entries
     frame_count = 0
     detected_counts.clear()
@@ -125,14 +188,15 @@ def process_video(video, resize_width=320, resize_height=240, frame_skip=5):
     print(f"Input video: {frame_width}x{frame_height}, {fps} FPS, {total_frames} frames, {expected_duration:.2f} seconds")
     out_width, out_height = resize_width, resize_height
-    output_path = "processed_output.mp4"
     codecs = [('mp4v', '.mp4'), ('MJPG', '.avi'), ('XVID', '.avi')]
     out = None
     for codec, ext in codecs:
         fourcc = cv2.VideoWriter_fourcc(*codec)
-        output_path = f"processed_output{ext}"
-        out = cv2.VideoWriter(output_path, fourcc, fps, (out_width, out_height))
         if out.isOpened():
             log_entries.append(f"Using codec: {codec}, output: {output_path}")
             logging.info(f"Using codec: {codec}, output: {output_path}")
             break
@@ -152,6 +216,11 @@ def process_video(video, resize_width=320, resize_height=240, frame_skip=5):
     detection_frame_count = 0
     output_frame_count = 0
     last_annotated_frame = None
     while True:
         ret, frame = cap.read()
@@ -167,19 +236,28 @@ def process_video(video, resize_width=320, resize_height=240, frame_skip=5):
         results = model(frame, verbose=False, conf=0.5, iou=0.7)
         annotated_frame = results[0].plot()
-        # Calculate timestamp for the current frame
         frame_timestamp = frame_count / fps if fps > 0 else 0
         timestamp_str = f"{int(frame_timestamp // 60)}:{int(frame_timestamp % 60):02d}"
         frame_detections = []
         for detection in results[0].boxes:
             cls = int(detection.cls)
             conf = float(detection.conf)
             box = detection.xyxy[0].cpu().numpy().astype(int).tolist()
             label = model.names[cls]
-            if label != 'Crocodile':  # Ignore irrelevant class
-                frame_detections.append({"label": label, "box": box, "conf": conf})
-                # Log detection with timestamp
                 log_message = f"Frame {frame_count} at {timestamp_str}: Detected {label} with confidence {conf:.2f}"
                 log_entries.append(log_message)
                 logging.info(log_message)
@@ -187,16 +265,30 @@ def process_video(video, resize_width=320, resize_height=240, frame_skip=5):
         if frame_detections:
             detection_frame_count += 1
             if detection_frame_count % SAVE_IMAGE_INTERVAL == 0:
-                captured_frame_path = os.path.join(CAPTURED_FRAMES_DIR, f"detected_{frame_count}.jpg")
                 if not cv2.imwrite(captured_frame_path, annotated_frame):
                     log_entries.append(f"Error: Failed to save {captured_frame_path}")
                     logging.error(f"Failed to save {captured_frame_path}")
                 else:
-                    detected_issues.append(captured_frame_path)
-                    if len(detected_issues) > 100:
-                        detected_issues.pop(0)
-        # Write frame and duplicates
         out.write(annotated_frame)
         output_frame_count += 1
         last_annotated_frame = annotated_frame
@@ -206,42 +298,34 @@ def process_video(video, resize_width=320, resize_height=240, frame_skip=5):
                 output_frame_count += 1
         detected_counts.append(len(frame_detections))
-        gps_coord = [17.385044 + (frame_count * 0.0001), 78.486671 + (frame_count * 0.0001)]
         gps_coordinates.append(gps_coord)
-        for det in frame_detections:
-            det["gps"] = gps_coord
-            det["timestamp"] = timestamp_str  # Add timestamp to detection data
         all_detections.extend(frame_detections)
-        frame_time = (time.time() - frame_start) * 1000
-        frame_times.append(frame_time)
         detection_summary = {
             "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M:%S"),
             "video_timestamp": timestamp_str,
             "frame": frame_count,
-            "longitudinal": sum(1 for det in frame_detections if det["label"] == "Longitudinal"),
-            "pothole": sum(1 for det in frame_detections if det["label"] == "Pothole"),
-            "transverse": sum(1 for det in frame_detections if det["label"] == "Transverse"),
             "gps": gps_coord,
-            "processing_time_ms": frame_time
         }
         log_entries.append(json.dumps(detection_summary, indent=2))
         if len(log_entries) > 50:
             log_entries.pop(0)
-    # Pad remaining frames
     while output_frame_count < total_frames and last_annotated_frame is not None:
         out.write(last_annotated_frame)
         output_frame_count += 1
     last_metrics = update_metrics(all_detections)
-    send_to_salesforce({
-        "detections": all_detections,
-        "metrics": last_metrics,
-        "timestamp": detection_summary["timestamp"] if all_detections else datetime.now().strftime("%Y-%m-%d %H:%M:%S"),
-        "frame_count": frame_count,
-        "gps_coordinates": gps_coordinates[-1] if gps_coordinates else [0, 0]
-    })
     cap.release()
     out.release()
@@ -272,12 +356,13 @@ def process_video(video, resize_width=320, resize_height=240, frame_skip=5):
         chart_path,
         map_path
     )
 # Gradio interface
 with gr.Blocks(theme=gr.themes.Soft(primary_hue="orange")) as iface:
-    gr.Markdown("# Road Defect Detection Dashboard")
     with gr.Row():
         with gr.Column(scale=3):
-            video_input = gr.Video(label="Upload Video")
             width_slider = gr.Slider(320, 640, value=320, label="Output Width", step=1)
             height_slider = gr.Slider(240, 480, value=240, label="Output Height", step=1)
             skip_slider = gr.Slider(1, 10, value=5, label="Frame Skip", step=1)
@@ -299,5 +384,8 @@ with gr.Blocks(theme=gr.themes.Soft(primary_hue="orange")) as iface:
         outputs=[video_output, metrics_output, logs_output, issue_gallery, chart_output, map_output]
     )
-if __name__ == "__main__":
-    iface.launch()

+import asyncio
+import platform
 import cv2
 import torch
 import gradio as gr
 from ultralytics import YOLO
 import ultralytics
 import time
+import exiftool
+import csv
 # Set YOLO config directory
 os.environ["YOLO_CONFIG_DIR"] = "/tmp/Ultralytics"
 # Set up logging
 logging.basicConfig(
+    filename="drone_app.log",
     level=logging.INFO,
     format="%(asctime)s - %(levelname)s - %(message)s"
 )
 # Directories
 CAPTURED_FRAMES_DIR = "captured_frames"
 OUTPUT_DIR = "outputs"
+FLIGHT_LOG_DIR = "flight_logs"
 os.makedirs(CAPTURED_FRAMES_DIR, exist_ok=True)
 os.makedirs(OUTPUT_DIR, exist_ok=True)
+os.makedirs(FLIGHT_LOG_DIR, exist_ok=True)
 os.chmod(CAPTURED_FRAMES_DIR, 0o777)
 os.chmod(OUTPUT_DIR, 0o777)
+os.chmod(FLIGHT_LOG_DIR, 0o777)
 # Global variables
 log_entries: List[str] = []
 frame_count: int = 0
 SAVE_IMAGE_INTERVAL = 1  # Save every frame with detections
+# SOP Parameters from Annexure-I
+DRONE_SPEED_MS = 5  # 5 m/s (18 km/hr)
+MIN_SATELLITES = 12
+IMAGE_OVERLAP = 0.85  # 85% front and side overlap
+MIN_RESOLUTION_MP = 12  # Minimum 12 MP
+RECORDING_ANGLE = 90  # Nadir (90 degrees)
+IMAGE_FORMAT = "JPEG"
+# Annexure-III Operations and Maintenance parameters
+DETECTION_CLASSES = [
+    "Potholes", "Edge Drops", "Crack", "Raveling", "Rain Cut Embankments",
+    "Authorized Median Opening", "Unauthorized Median Opening",
+    "Intersection/Crossroads", "Temporary Encroachments", "Permanent Encroachments",
+    "Missing Lane Markings", "Missing Boundary Wall", "Damaged Boundary Wall",
+    "Open Drain", "Covered Drain", "Blocked Drain", "Unclean Drain",
+    "Missing Dissipation Basin"
+]
 # Debug: Check environment
 print(f"Torch version: {torch.__version__}")
 print(f"Gradio version: {gr.__version__}")
 # Load custom YOLO model
 device = "cuda" if torch.cuda.is_available() else "cpu"
 print(f"Using device: {device}")
+model = YOLO('./data/best.pt').to(device)  # Assumes model is trained for all DETECTION_CLASSES
 if device == "cuda":
     model.half()  # Use half-precision (FP16)
 print(f"Model classes: {model.names}")
 def generate_map(gps_coords: List[List[float]], items: List[Dict[str, Any]]) -> str:
+    map_path = os.path.join(OUTPUT_DIR, "map_temp.png")
     plt.figure(figsize=(4, 4))
     plt.scatter([x[1] for x in gps_coords], [x[0] for x in gps_coords], c='blue', label='GPS Points')
     plt.title("Issue Locations Map")
     plt.close()
     return map_path
+def write_geotag(image_path: str, gps_coord: List[float]) -> bool:
+    try:
+        with exiftool.ExifToolHelper() as et:
+            et.set_tags(
+                [image_path],
+                {
+                    "EXIF:GPSLatitude": gps_coord[0],
+                    "EXIF:GPSLongitude": gps_coord[1],
+                    "EXIF:GPSLatitudeRef": "N" if gps_coord[0] >= 0 else "S",
+                    "EXIF:GPSLongitudeRef": "E" if gps_coord[1] >= 0 else "W"
+                }
+            )
+        return True
+    except Exception as e:
+        logging.error(f"Failed to geotag {image_path}: {str(e)}")
+        return False
+def write_flight_log(frame_count: int, gps_coord: List[float], timestamp: str) -> str:
+    log_path = os.path.join(FLIGHT_LOG_DIR, f"flight_log_{frame_count}.csv")
+    with open(log_path, 'w', newline='') as csvfile:
+        writer = csv.writer(csvfile)
+        writer.writerow(["Frame", "Timestamp", "Latitude", "Longitude", "Speed_ms", "Satellites", "Altitude_m"])
+        writer.writerow([frame_count, timestamp, gps_coord[0], gps_coord[1], DRONE_SPEED_MS, MIN_SATELLITES, 60])  # Example altitude
+    return log_path
+def check_sop_compliance(frame: np.ndarray, gps_coord: List[float], frame_count: int) -> bool:
+    height, width, _ = frame.shape
+    if width * height < MIN_RESOLUTION_MP * 1e6:  # Check resolution (12MP)
+        log_entries.append(f"Frame {frame_count}: Resolution below {MIN_RESOLUTION_MP}MP")
+        return False
+    if len(gps_coord) != 2 or not all(isinstance(x, float) for x in gps_coord):
+        log_entries.append(f"Frame {frame_count}: Invalid GPS coordinates")
+        return False
+    return True
 def update_metrics(detections: List[Dict[str, Any]]) -> Dict[str, Any]:
     counts = Counter([det["label"] for det in detections])
+    metrics = {
         "items": [{"type": k, "count": v} for k, v in counts.items()],
         "total_detections": len(detections),
+        "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M:%S"),
+        "sop_compliance": {
+            "drone_speed_ms": DRONE_SPEED_MS,
+            "image_overlap": IMAGE_OVERLAP,
+            "min_resolution_mp": MIN_RESOLUTION_MP,
+            "recording_angle_degrees": RECORDING_ANGLE,
+            "image_format": IMAGE_FORMAT
+        }
     }
+    return metrics
 def generate_line_chart() -> Optional[str]:
     if not detected_counts:
     plt.ylabel("Count")
     plt.grid(True)
     plt.tight_layout()
+    chart_path = os.path.join(OUTPUT_DIR, "chart_temp.png")
     plt.savefig(chart_path)
     plt.close()
     return chart_path
+async def process_video(video, resize_width=320, resize_height=240, frame_skip=5):
     global frame_count, last_metrics, detected_counts, detected_issues, gps_coordinates, log_entries
     frame_count = 0
     detected_counts.clear()
     print(f"Input video: {frame_width}x{frame_height}, {fps} FPS, {total_frames} frames, {expected_duration:.2f} seconds")
     out_width, out_height = resize_width, resize_height
+    output_path = os.path.join(OUTPUT_DIR, "processed_output.mp4")
     codecs = [('mp4v', '.mp4'), ('MJPG', '.avi'), ('XVID', '.avi')]
     out = None
     for codec, ext in codecs:
         fourcc = cv2.VideoWriter_fourcc(*codec)
+        temp_output_path = os.path.join(OUTPUT_DIR, f"processed_output{ext}")
+        out = cv2.VideoWriter(temp_output_path, fourcc, fps, (out_width, out_height))
         if out.isOpened():
+            output_path = temp_output_path
             log_entries.append(f"Using codec: {codec}, output: {output_path}")
             logging.info(f"Using codec: {codec}, output: {output_path}")
             break
     detection_frame_count = 0
     output_frame_count = 0
     last_annotated_frame = None
+    data_lake_submission = {
+        "images": [],
+        "flight_logs": [],
+        "analytics": []
+    }
     while True:
         ret, frame = cap.read()
         results = model(frame, verbose=False, conf=0.5, iou=0.7)
         annotated_frame = results[0].plot()
         frame_timestamp = frame_count / fps if fps > 0 else 0
         timestamp_str = f"{int(frame_timestamp // 60)}:{int(frame_timestamp % 60):02d}"
+        gps_coord = [17.385044 + (frame_count * 0.0001), 78.486671 + (frame_count * 0.0001)]
+        if not check_sop_compliance(frame, gps_coord, frame_count):
+            log_entries.append(f"Frame {frame_count}: SOP compliance check failed")
+            continue
         frame_detections = []
         for detection in results[0].boxes:
             cls = int(detection.cls)
             conf = float(detection.conf)
             box = detection.xyxy[0].cpu().numpy().astype(int).tolist()
             label = model.names[cls]
+            if label in DETECTION_CLASSES:
+                frame_detections.append({
+                    "label": label,
+                    "box": box,
+                    "conf": conf,
+                    "gps": gps_coord,
+                    "timestamp": timestamp_str
+                })
                 log_message = f"Frame {frame_count} at {timestamp_str}: Detected {label} with confidence {conf:.2f}"
                 log_entries.append(log_message)
                 logging.info(log_message)
         if frame_detections:
             detection_frame_count += 1
             if detection_frame_count % SAVE_IMAGE_INTERVAL == 0:
+                captured_frame_path = os.path.join(CAPTURED_FRAMES_DIR, f"detected_{frame_count:06d}.jpg")
                 if not cv2.imwrite(captured_frame_path, annotated_frame):
                     log_entries.append(f"Error: Failed to save {captured_frame_path}")
                     logging.error(f"Failed to save {captured_frame_path}")
                 else:
+                    if write_geotag(captured_frame_path, gps_coord):
+                        detected_issues.append(captured_frame_path)
+                        data_lake_submission["images"].append({
+                            "path": captured_frame_path,
+                            "frame": frame_count,
+                            "gps": gps_coord,
+                            "timestamp": timestamp_str
+                        })
+                        if len(detected_issues) > 100:
+                            detected_issues.pop(0)
+                    else:
+                        log_entries.append(f"Error: Failed to geotag {captured_frame_path}")
+        flight_log_path = write_flight_log(frame_count, gps_coord, timestamp_str)
+        data_lake_submission["flight_logs"].append({
+            "path": flight_log_path,
+            "frame": frame_count
+        })
         out.write(annotated_frame)
         output_frame_count += 1
         last_annotated_frame = annotated_frame
                 output_frame_count += 1
         detected_counts.append(len(frame_detections))
         gps_coordinates.append(gps_coord)
         all_detections.extend(frame_detections)
         detection_summary = {
             "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M:%S"),
             "video_timestamp": timestamp_str,
             "frame": frame_count,
             "gps": gps_coord,
+            "processing_time_ms": (time.time() - frame_start) * 1000,
+            "detections": {label: sum(1 for det in frame_detections if det["label"] == label) for label in DETECTION_CLASSES}
         }
+        data_lake_submission["analytics"].append(detection_summary)
         log_entries.append(json.dumps(detection_summary, indent=2))
         if len(log_entries) > 50:
             log_entries.pop(0)
     while output_frame_count < total_frames and last_annotated_frame is not None:
         out.write(last_annotated_frame)
         output_frame_count += 1
     last_metrics = update_metrics(all_detections)
+    data_lake_submission["metrics"] = last_metrics
+    data_lake_submission["frame_count"] = frame_count
+    data_lake_submission["gps_coordinates"] = gps_coordinates[-1] if gps_coordinates else [0, 0]
+    submission_json_path = os.path.join(OUTPUT_DIR, "data_lake_submission.json")
+    with open(submission_json_path, 'w') as f:
+        json.dump(data_lake_submission, f, indent=2)
     cap.release()
     out.release()
         chart_path,
         map_path
     )
 # Gradio interface
 with gr.Blocks(theme=gr.themes.Soft(primary_hue="orange")) as iface:
+    gr.Markdown("# NHAI Drone Analytics Dashboard")
     with gr.Row():
         with gr.Column(scale=3):
+            video_input = gr.Video(label="Upload Drone Video")
             width_slider = gr.Slider(320, 640, value=320, label="Output Width", step=1)
             height_slider = gr.Slider(240, 480, value=240, label="Output Height", step=1)
             skip_slider = gr.Slider(1, 10, value=5, label="Frame Skip", step=1)
         outputs=[video_output, metrics_output, logs_output, issue_gallery, chart_output, map_output]
     )
+if platform.system() == "Emscripten":
+    asyncio.ensure_future(process_video())
+else:
+    if __name__ == "__main__":
+        iface.launch()