# app_gradio.py
# ──────────────────────────────────────────────────────────
# Webcam → geometric detector → static WAV alert (with cooldown)
# Live console logs of per-frame latency + status.
#
# EDITED: This version uses a more robust method for audio playback
# in Gradio by dynamically creating the Audio component.
# ──────────────────────────────────────────────────────────
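# The imports below imply a handful of third-party packages. A minimal install,
# assuming the usual PyPI names for these imports (versions not pinned by this file):
#
#   pip install gradio numpy soundfile pyyaml python-dotenv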
import time
import os
import yaml
import logging
import numpy as np
import gradio as gr
import soundfile as sf
from dotenv import load_dotenv
# This is a mock factory and detector for demonstration.
# Replace with your actual import.
from src.detection.factory import get_detector
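# If src.detection.factory is not available locally, a stand-in with the same interface
# can be used for testing. The sketch below only illustrates the contract assumed by
# process_live_frame() further down: process_frame(frame) -> (processed_frame, indicators_dict);
# the class and its fixed values are hypothetical, not part of this repo.
#
#   class _EchoDetector:
#       """Hypothetical stub: echoes the frame and reports a fixed 'Awake' state."""
#       def process_frame(self, frame):
#           indicators = {
#               "drowsiness_level": "Awake",
#               "lighting": "Good",
#               "details": {"Score": 0.0},
#           }
#           return frame, indicators
#
#   def get_detector(cfg):
#       return _EchoDetector()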
# ───────────────────────────── logging
logging.basicConfig(
    level=logging.INFO,
    format="%(asctime)s | %(message)s",
    datefmt="%H:%M:%S",
)
# ───────────────────────────── config / detector
load_dotenv()
with open("config.yaml") as f:
    CFG = yaml.safe_load(f)
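# config.yaml is expected to provide at least the "alerting" keys read by AlertManager
# below; get_detector(CFG) may require additional, detector-specific keys not shown here.
# A minimal sketch (the values and the sound path are placeholders, not from this repo):
#
#   alerting:
#     alert_cooldown_seconds: 5
#     alert_sound_path: assets/alert.wav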
detector = get_detector(CFG)
# ───────────────────────────── Alert Manager Class <--- CHANGE
# Encapsulating the alert logic makes the code much cleaner.
# It handles its own state (last alert time) internally.
class AlertManager:
    def __init__(self, config):
        self.cooldown_seconds = config.get("alert_cooldown_seconds", 1)
        self.last_alert_time = 0
        self.alert_data = None
        self.sample_rate = None
        self._load_sound(config.get("alert_sound_path"))

    def _load_sound(self, wav_path):
        if not wav_path:
            logging.warning("No 'alert_sound_path' found in config.")
            return
        try:
            data, sr = sf.read(wav_path, dtype="int16")
            self.alert_data = data
            self.sample_rate = sr
            logging.info(f"Loaded alert sound: {wav_path} ({len(self.alert_data)/self.sample_rate:.2f}s)")
        except Exception as e:
            logging.error(f"Failed to load alert sound: {e}")
            self.alert_data = None

    def trigger_alert(self, level, lighting):
        """Checks conditions and returns audio payload if an alert should fire."""
        is_drowsy = level != "Awake"
        is_good_light = lighting != "Low"
        is_ready = (time.monotonic() - self.last_alert_time) > self.cooldown_seconds
        if self.alert_data is not None and is_drowsy and is_good_light and is_ready:
            self.last_alert_time = time.monotonic()
            logging.info("Alert conditions met! Triggering sound.")
            return (self.sample_rate, self.alert_data.copy())
        return None
# Initialize the alert manager
alert_manager = AlertManager(CFG["alerting"])
# ───────────────────────────── frame processing <--- MAJOR CHANGE
# Simplified by the AlertManager. No longer needs to pass 'last_alert_ts' back and forth.
def process_live_frame(frame):
    if frame is None:
        return (
            np.zeros((480, 640, 3), dtype=np.uint8),
            "Status: Inactive",
            None,  # No audio output
        )

    t0 = time.perf_counter()
    try:
        # Assuming your detector returns (processed_image, indicators_dict)
        processed, indic = detector.process_frame(frame)
    except Exception as e:
        logging.error(f"Error processing frame: {e}")
        processed = np.zeros_like(frame)
        indic = {"drowsiness_level": "Error", "lighting": "Unknown", "details": {"Score": 0.0}}

    level = indic.get("drowsiness_level", "Awake")
    lighting = indic.get("lighting", "Good")
    score = indic.get("details", {}).get("Score", 0.0)

    dt_ms = (time.perf_counter() - t0) * 1000.0
    logging.info(f"{dt_ms:6.1f} ms | {lighting:<4} | {level:<14} | score={score:.2f}")

    status_txt = (
        f"Lighting: {lighting}\n"
        + ("Detection paused - low light." if lighting == "Low"
           else f"Status: {level}\nScore: {score:.2f}")
    )

    # Check for an alert and get the audio payload if ready
    audio_payload = alert_manager.trigger_alert(level, lighting)

    # This is the key: return a new gr.Audio component when an alert fires.
    # Otherwise, return None to clear the component on the frontend.
    if audio_payload:
        return processed, status_txt, gr.Audio(value=audio_payload, autoplay=True)
    else:
        return processed, status_txt, None
# ───────────────────────────── UI <--- CHANGE
with gr.Blocks(title="Drive Paddy - Drowsiness Detection") as app:
    gr.Markdown("# **Drive Paddy** - Robust Alert Demo")
    gr.Markdown("Webcam-based drowsiness detection · console shows real-time logs.")

    with gr.Row():
        with gr.Column(scale=2):
            cam = gr.Image(sources=["webcam"], streaming=True, label="Live Camera Feed")
        with gr.Column(scale=1):
            out_img = gr.Image(label="Processed Feed")
            out_text = gr.Textbox(label="Live Status", lines=3, interactive=False)
            # This audio component now acts as a placeholder.
            # We make it invisible because we don't need to show the player controls.
            # The backend will dynamically send a new, playable component to it.
            out_audio = gr.Audio(
                label="Alert",
                autoplay=True,
                visible=False,  # Hiding the component for a cleaner UX
            )

    # The gr.State for managing the timestamp is no longer needed, simplifying the stream call.
    cam.stream(
        fn=process_live_frame,
        inputs=[cam],
        outputs=[out_img, out_text, out_audio],  # The output now targets the placeholder
    )
if __name__ == "__main__":
    logging.info("Launching Gradio app…")
    app.launch(debug=True)