Spaces:

Testys
/

drive-paddy

Sleeping

App Files Community

Testys committed 23 days ago

Commit

8ae9de4

verified ·

1 Parent(s): a7ec466

Update app.py

Browse files

Files changed (1) hide show

app.py +94 -138

app.py CHANGED Viewed

@@ -1,3 +1,11 @@
 import time
 import os
 import yaml
@@ -6,10 +14,9 @@ import numpy as np
 import gradio as gr
 import soundfile as sf
 from dotenv import load_dotenv
-from threading import Lock
-from queue import Queue
-import threading
 from src.detection.factory import get_detector
 # ───────────────────────────── logging
@@ -26,168 +33,117 @@ with open("config.yaml") as f:
 detector = get_detector(CFG)
-# ───────────────────────────── alert sound manager
 class AlertManager:
-    def __init__(self, wav_path, cooldown_seconds=5):
-        self.cooldown_seconds = cooldown_seconds
         self.last_alert_time = 0
-        self.lock = Lock()
-        self.alert_queue = Queue(maxsize=1)
-        # Load alert sound
         try:
-            self.sample_rate, self.audio_data = sf.read(wav_path, dtype="float32")
-            # Ensure stereo format for Gradio
-            if self.audio_data.ndim == 1:
-                self.audio_data = np.column_stack([self.audio_data, self.audio_data])
-            # Normalize to [-1, 1] range
-            max_val = np.abs(self.audio_data).max()
-            if max_val > 0:
-                self.audio_data = self.audio_data / max_val
-            logging.info(f"Loaded alert sound: {wav_path} "
-                        f"({len(self.audio_data)/self.sample_rate:.2f}s, "
-                        f"shape: {self.audio_data.shape})")
-            self.is_loaded = True
         except Exception as e:
             logging.error(f"Failed to load alert sound: {e}")
-            self.is_loaded = False
-            self.sample_rate = 44100
-            self.audio_data = None
-    def should_alert(self, drowsiness_level, lighting):
-        """Check if we should trigger an alert"""
-        if not self.is_loaded:
-            return False
-        with self.lock:
-            current_time = time.monotonic()
-            if (drowsiness_level != "Awake"
-                and lighting != "Low"
-                and (current_time - self.last_alert_time) > self.cooldown_seconds):
-                self.last_alert_time = current_time
-                return True
-        return False
-    def get_alert_audio(self):
-        """Get the alert audio data"""
-        if self.is_loaded:
-            return (int(self.sample_rate), self.audio_data.copy())
         return None
-# Initialize alert manager
-alert_manager = AlertManager(
-    wav_path=CFG["alerting"].get("alert_sound_path"),
-    cooldown_seconds=CFG["alerting"].get("alert_cooldown_seconds", 5)
-)
-# ───────────────────────────── frame processing
 def process_live_frame(frame):
-    """Process frame for drowsiness detection"""
     if frame is None:
         return (
             np.zeros((480, 640, 3), dtype=np.uint8),
             "Status: Inactive",
-            None
         )
     t0 = time.perf_counter()
     try:
-        # Process frame through detector
         processed, indic = detector.process_frame(frame)
     except Exception as e:
         logging.error(f"Error processing frame: {e}")
         processed = np.zeros_like(frame)
-        indic = {
-            "drowsiness_level": "Error",
-            "lighting": "Unknown",
-            "details": {"Score": 0.0}
-        }
-    # Extract detection results
     level = indic.get("drowsiness_level", "Awake")
     lighting = indic.get("lighting", "Good")
     score = indic.get("details", {}).get("Score", 0.0)
-    # Log performance
     dt_ms = (time.perf_counter() - t0) * 1000.0
     logging.info(f"{dt_ms:6.1f} ms │ {lighting:<4} │ {level:<14} │ score={score:.2f}")
-    # Create status text
-    status_txt = f"Lighting: {lighting}\n"
-    if lighting == "Low":
-        status_txt += "Detection paused – low light."
     else:
-        status_txt += f"Status: {level}\nScore: {score:.2f}"
-    # Check if we should trigger alert
-    audio_out = None
-    if alert_manager.should_alert(level, lighting):
-        audio_out = alert_manager.get_alert_audio()
-        if audio_out:
-            logging.info("🔊 Alert triggered!")
-    return processed, status_txt, audio_out
-# ───────────────────────────── UI with error handling
-def create_ui():
-    with gr.Blocks(title="Drive Paddy – Drowsiness Detection") as app:
-        gr.Markdown("# 🚗 **Drive Paddy** – Real-time Drowsiness Detection")
-        gr.Markdown("Webcam-based drowsiness detection with audio alerts.")
-        with gr.Row():
-            with gr.Column(scale=2):
-                cam = gr.Image(
-                    sources=["webcam"],
-                    streaming=True,
-                    label="Live Camera Feed"
-                )
-            with gr.Column(scale=1):
-                out_img = gr.Image(label="Processed Feed")
-                out_text = gr.Textbox(
-                    label="Live Status",
-                    lines=4,
-                    interactive=False
-                )
-                out_audio = gr.Audio(
-                    label="Alert Sound",
-                    autoplay=True,
-                    type="numpy",
-                    visible=True,
-                )
-        # Add system info
-        with gr.Row():
-            gr.Markdown(f"""
-            **System Info:**
-            - Alert cooldown: {CFG['alerting'].get('alert_cooldown_seconds', 5)}s
-            - Alert sound loaded: {'✓' if alert_manager.is_loaded else '✗'}
-            """)
-        # Connect the streaming
-        cam.stream(
-            fn=process_live_frame,
-            inputs=[cam],
-            outputs=[out_img, out_text, out_audio]
-        )
-    return app
-# ───────────────────────────── main
 if __name__ == "__main__":
-    logging.info("Initializing Drive Paddy...")
-    # Create and launch app
-    app = create_ui()
-    logging.info("Launching Gradio app...")
-    app.launch(
-        debug=True,
-        share=False,  # Set to True if you want a public link
-        server_name="0.0.0.0",  # Allow external connections
-        server_port=7860
-    )

+# app_gradio.py
+# ──────────────────────────────────────────────────────────
+# Webcam → geometric detector → static WAV alert (with cooldown)
+# Live console logs of per-frame latency + status.
+#
+# EDITED: This version uses a more robust method for audio playback
+# in Gradio by dynamically creating the Audio component.
+# ──────────────────────────────────────────────────────────
 import time
 import os
 import yaml
 import gradio as gr
 import soundfile as sf
 from dotenv import load_dotenv
+# This is a mock factory and detector for demonstration.
+# Replace with your actual import.
 from src.detection.factory import get_detector
 # ───────────────────────────── logging
 detector = get_detector(CFG)
+# ───────────────────────────── Alert Manager Class <--- CHANGE
+# Encapsulating the alert logic makes the code much cleaner.
+# It handles its own state (last alert time) internally.
 class AlertManager:
+    def __init__(self, config):
+        self.cooldown_seconds = config.get("alert_cooldown_seconds", 5)
         self.last_alert_time = 0
+        self.alert_data = None
+        self.sample_rate = None
+        self._load_sound(config.get("alert_sound_path"))
+    def _load_sound(self, wav_path):
+        if not wav_path:
+            logging.warning("No 'alert_sound_path' found in config.")
+            return
         try:
+            data, sr = sf.read(wav_path, dtype="float32")
+            self.alert_data = data
+            self.sample_rate = sr
+            logging.info(f"Loaded alert sound: {wav_path} ({len(self.alert_data)/self.sample_rate:.2f}s)")
         except Exception as e:
             logging.error(f"Failed to load alert sound: {e}")
+            self.alert_data = None
+    def trigger_alert(self, level, lighting):
+        """Checks conditions and returns audio payload if an alert should fire."""
+        is_drowsy = level != "Awake"
+        is_good_light = lighting != "Low"
+        is_ready = (time.monotonic() - self.last_alert_time) > self.cooldown_seconds
+        if self.alert_data is not None and is_drowsy and is_good_light and is_ready:
+            self.last_alert_time = time.monotonic()
+            logging.info("🔊 Alert conditions met! Triggering sound.")
+            return (self.sample_rate, self.alert_data.copy())
         return None
+# Initialize the alert manager
+alert_manager = AlertManager(CFG["alerting"])
+# ───────────────────────────── frame processing <--- MAJOR CHANGE
+# Simplified by the AlertManager. No longer needs to pass 'last_alert_ts' back and forth.
 def process_live_frame(frame):
     if frame is None:
         return (
             np.zeros((480, 640, 3), dtype=np.uint8),
             "Status: Inactive",
+            None # No audio output
         )
     t0 = time.perf_counter()
     try:
+        # Assuming your detector returns (processed_image, indicators_dict)
         processed, indic = detector.process_frame(frame)
     except Exception as e:
         logging.error(f"Error processing frame: {e}")
         processed = np.zeros_like(frame)
+        indic = {"drowsiness_level": "Error", "lighting": "Unknown", "details": {"Score": 0.0}}
     level = indic.get("drowsiness_level", "Awake")
     lighting = indic.get("lighting", "Good")
     score = indic.get("details", {}).get("Score", 0.0)
     dt_ms = (time.perf_counter() - t0) * 1000.0
     logging.info(f"{dt_ms:6.1f} ms │ {lighting:<4} │ {level:<14} │ score={score:.2f}")
+    status_txt = (
+        f"Lighting: {lighting}\n"
+        + ("Detection paused – low light." if lighting == "Low"
+           else f"Status: {level}\nScore: {score:.2f}")
+    )
+    # Check for an alert and get the audio payload if ready
+    audio_payload = alert_manager.trigger_alert(level, lighting)
+    # This is the key: return a new gr.Audio component when an alert fires.
+    # Otherwise, return None to clear the component on the frontend.
+    if audio_payload:
+        return processed, status_txt, gr.Audio(value=audio_payload, autoplay=True)
     else:
+        return processed, status_txt, None
+# ───────────────────────────── UI <--- CHANGE
+with gr.Blocks(title="Drive Paddy – Drowsiness Detection") as app:
+    gr.Markdown("# 🚗 **Drive Paddy** – Robust Alert Demo")
+    gr.Markdown("Webcam-based drowsiness detection · console shows real-time logs.")
+    with gr.Row():
+        with gr.Column(scale=2):
+            cam = gr.Image(sources=["webcam"], streaming=True, label="Live Camera Feed")
+        with gr.Column(scale=1):
+            out_img = gr.Image(label="Processed Feed")
+            out_text = gr.Textbox(label="Live Status", lines=3, interactive=False)
+            # This audio component now acts as a placeholder.
+            # We make it invisible because we don't need to show the player controls.
+            # The backend will dynamically send a new, playable component to it.
+            out_audio = gr.Audio(
+                label="Alert",
+                autoplay=True,
+                visible=False, # Hiding the component for a cleaner UX
+            )
+    # The gr.State for managing the timestamp is no longer needed, simplifying the stream call.
+    cam.stream(
+        fn=process_live_frame,
+        inputs=[cam],
+        outputs=[out_img, out_text, out_audio] # The output now targets the placeholder
+    )
 if __name__ == "__main__":
+    logging.info("Launching Gradio app…")
+    app.launch(debug=True)