Spaces:

Testys
/

drive-paddy

Sleeping

App Files Files Community

Testys commited on 23 days ago

Commit

a7ec466

verified ·

1 Parent(s): 8e7b22f

Update app.py

Browse files

Files changed (1) hide show

app.py +150 -72

app.py CHANGED Viewed

@@ -1,8 +1,3 @@
-# app_gradio.py
-# ──────────────────────────────────────────────────────────
-# Webcam → geometric detector → static WAV alert (with cooldown)
-# Live console logs of per-frame latency + status.
-# ──────────────────────────────────────────────────────────
 import time
 import os
 import yaml
@@ -10,9 +5,12 @@ import logging
 import numpy as np
 import gradio as gr
 import soundfile as sf
 from dotenv import load_dotenv
-from src.detection.factory import get_detector  # your existing factory
 # ───────────────────────────── logging
 logging.basicConfig(
@@ -28,88 +26,168 @@ with open("config.yaml") as f:
 detector = get_detector(CFG)
-# ───────────────────────────── alert sound (read once)
-wav_path = CFG["alerting"].get("alert_sound_path")
-logging.info(f"Processing {wav_path}")
-try:
-    ALERT_SR, ALERT_DATA = sf.read(wav_path, dtype="float32")
-    logging.info(f"Loaded alert sound: {wav_path}  ({len(ALERT_DATA)/ALERT_SR:.2f}s)")
-except Exception as e:
-    ALERT_SR, ALERT_DATA = None, None
-    logging.warning(f"Failed to load alert sound: {e}")
 # ───────────────────────────── frame processing
-def process_live_frame(frame, last_alert_ts):
     if frame is None:
         return (
             np.zeros((480, 640, 3), dtype=np.uint8),
             "Status: Inactive",
-            None,
-            last_alert_ts
         )
     t0 = time.perf_counter()
     try:
-        processed, indic, _ = detector.process_frame(frame)
     except Exception as e:
         logging.error(f"Error processing frame: {e}")
         processed = np.zeros_like(frame)
-        indic = {"drowsiness_level": "Error", "lighting": "Unknown", "details": {"Score": 0.0}}
     level = indic.get("drowsiness_level", "Awake")
     lighting = indic.get("lighting", "Good")
     score = indic.get("details", {}).get("Score", 0.0)
     dt_ms = (time.perf_counter() - t0) * 1000.0
     logging.info(f"{dt_ms:6.1f} ms │ {lighting:<4} │ {level:<14} │ score={score:.2f}")
-    status_txt = (
-        f"Lighting: {lighting}\n"
-        + ("Detection paused – low light." if lighting == "Low"
-           else f"Status: {level}\nScore: {score:.2f}")
-    )
     audio_out = None
-    new_last_alert_ts = last_alert_ts
-    ALERT_COOLDOWN = CFG["alerting"].get("alert_cooldown_seconds", 5)
-    if (
-        ALERT_DATA is not None
-        and level != "Awake"
-        and lighting != "Low"
-        and (time.monotonic() - last_alert_ts) > ALERT_COOLDOWN
-    ):
-        new_last_alert_ts = time.monotonic()
-        audio_out = (ALERT_SR, ALERT_DATA.copy())
-    return processed, status_txt, audio_out, new_last_alert_ts
-# ───────────────────────────── UI
-with gr.Blocks(title="Drive Paddy – Drowsiness Detection") as app:
-    gr.Markdown("# 🚗 **Drive Paddy** – Static-file Alert Demo")
-    gr.Markdown("Webcam-based drowsiness detection · console shows real-time logs.")
-    with gr.Row():
-        with gr.Column(scale=2):
-            cam = gr.Image(sources=["webcam"], streaming=True, label="Live Camera Feed")
-        with gr.Column(scale=1):
-            out_img = gr.Image(label="Processed Feed")
-            out_text = gr.Textbox(label="Live Status", lines=3, interactive=False)
-            out_audio = gr.Audio(
-                label="Alert",
-                autoplay=True,
-                type="numpy",
-                visible=True,
-            )
-            last_alert_state = gr.State(value=0.0)
-    cam.stream(
-        fn=process_live_frame,
-        inputs=[cam, last_alert_state],
-        outputs=[out_img, out_text, out_audio, last_alert_state]
-    )
 if __name__ == "__main__":
-    logging.info("Launching Gradio app …")
-    app.launch(debug=True)

 import time
 import os
 import yaml
 import numpy as np
 import gradio as gr
 import soundfile as sf
 from dotenv import load_dotenv
+from threading import Lock
+from queue import Queue
+import threading
+from src.detection.factory import get_detector
 # ───────────────────────────── logging
 logging.basicConfig(
 detector = get_detector(CFG)
+# ───────────────────────────── alert sound manager
+class AlertManager:
+    def __init__(self, wav_path, cooldown_seconds=5):
+        self.cooldown_seconds = cooldown_seconds
+        self.last_alert_time = 0
+        self.lock = Lock()
+        self.alert_queue = Queue(maxsize=1)
+        # Load alert sound
+        try:
+            self.sample_rate, self.audio_data = sf.read(wav_path, dtype="float32")
+            # Ensure stereo format for Gradio
+            if self.audio_data.ndim == 1:
+                self.audio_data = np.column_stack([self.audio_data, self.audio_data])
+            # Normalize to [-1, 1] range
+            max_val = np.abs(self.audio_data).max()
+            if max_val > 0:
+                self.audio_data = self.audio_data / max_val
+            logging.info(f"Loaded alert sound: {wav_path} "
+                        f"({len(self.audio_data)/self.sample_rate:.2f}s, "
+                        f"shape: {self.audio_data.shape})")
+            self.is_loaded = True
+        except Exception as e:
+            logging.error(f"Failed to load alert sound: {e}")
+            self.is_loaded = False
+            self.sample_rate = 44100
+            self.audio_data = None
+    def should_alert(self, drowsiness_level, lighting):
+        """Check if we should trigger an alert"""
+        if not self.is_loaded:
+            return False
+        with self.lock:
+            current_time = time.monotonic()
+            if (drowsiness_level != "Awake"
+                and lighting != "Low"
+                and (current_time - self.last_alert_time) > self.cooldown_seconds):
+                self.last_alert_time = current_time
+                return True
+        return False
+    def get_alert_audio(self):
+        """Get the alert audio data"""
+        if self.is_loaded:
+            return (int(self.sample_rate), self.audio_data.copy())
+        return None
+# Initialize alert manager
+alert_manager = AlertManager(
+    wav_path=CFG["alerting"].get("alert_sound_path"),
+    cooldown_seconds=CFG["alerting"].get("alert_cooldown_seconds", 5)
+)
 # ───────────────────────────── frame processing
+def process_live_frame(frame):
+    """Process frame for drowsiness detection"""
     if frame is None:
         return (
             np.zeros((480, 640, 3), dtype=np.uint8),
             "Status: Inactive",
+            None
         )
     t0 = time.perf_counter()
     try:
+        # Process frame through detector
+        processed, indic = detector.process_frame(frame)
     except Exception as e:
         logging.error(f"Error processing frame: {e}")
         processed = np.zeros_like(frame)
+        indic = {
+            "drowsiness_level": "Error",
+            "lighting": "Unknown",
+            "details": {"Score": 0.0}
+        }
+    # Extract detection results
     level = indic.get("drowsiness_level", "Awake")
     lighting = indic.get("lighting", "Good")
     score = indic.get("details", {}).get("Score", 0.0)
+    # Log performance
     dt_ms = (time.perf_counter() - t0) * 1000.0
     logging.info(f"{dt_ms:6.1f} ms │ {lighting:<4} │ {level:<14} │ score={score:.2f}")
+    # Create status text
+    status_txt = f"Lighting: {lighting}\n"
+    if lighting == "Low":
+        status_txt += "Detection paused – low light."
+    else:
+        status_txt += f"Status: {level}\nScore: {score:.2f}"
+    # Check if we should trigger alert
     audio_out = None
+    if alert_manager.should_alert(level, lighting):
+        audio_out = alert_manager.get_alert_audio()
+        if audio_out:
+            logging.info("🔊 Alert triggered!")
+    return processed, status_txt, audio_out
+# ───────────────────────────── UI with error handling
+def create_ui():
+    with gr.Blocks(title="Drive Paddy – Drowsiness Detection") as app:
+        gr.Markdown("# 🚗 **Drive Paddy** – Real-time Drowsiness Detection")
+        gr.Markdown("Webcam-based drowsiness detection with audio alerts.")
+        with gr.Row():
+            with gr.Column(scale=2):
+                cam = gr.Image(
+                    sources=["webcam"],
+                    streaming=True,
+                    label="Live Camera Feed"
+                )
+            with gr.Column(scale=1):
+                out_img = gr.Image(label="Processed Feed")
+                out_text = gr.Textbox(
+                    label="Live Status",
+                    lines=4,
+                    interactive=False
+                )
+                out_audio = gr.Audio(
+                    label="Alert Sound",
+                    autoplay=True,
+                    type="numpy",
+                    visible=True,
+                )
+        # Add system info
+        with gr.Row():
+            gr.Markdown(f"""
+            **System Info:**
+            - Alert cooldown: {CFG['alerting'].get('alert_cooldown_seconds', 5)}s
+            - Alert sound loaded: {'✓' if alert_manager.is_loaded else '✗'}
+            """)
+        # Connect the streaming
+        cam.stream(
+            fn=process_live_frame,
+            inputs=[cam],
+            outputs=[out_img, out_text, out_audio]
+        )
+    return app
+# ───────────────────────────── main
 if __name__ == "__main__":
+    logging.info("Initializing Drive Paddy...")
+    # Create and launch app
+    app = create_ui()
+    logging.info("Launching Gradio app...")
+    app.launch(
+        debug=True,
+        share=False,  # Set to True if you want a public link
+        server_name="0.0.0.0",  # Allow external connections
+        server_port=7860
+    )