Spaces:

Testys
/

drive-paddy

Sleeping

App Files Files Community

Testys committed 25 days ago

Commit

fcccf01

verified ·

1 Parent(s): 89d5f02

Update app.py

Browse files

Files changed (1) hide show

app.py +24 -3

app.py CHANGED Viewed

@@ -7,6 +7,8 @@ import os
 import yaml
 from dotenv import load_dotenv
 from threading import Thread
 # --- TTS & AI Imports ---
 from parler_tts import ParlerTTSForConditionalGeneration
@@ -32,6 +34,22 @@ detector = get_detector(config)
 alerter = get_alerter(config, secrets["gemini_api_key"])
 print("Initialization complete. Launching UI...")
 # --- Parler-TTS Model Setup (Requires GPU) ---
 print("Loading Parler-TTS model. This may take a moment...")
 device = "cuda:0" if torch.cuda.is_available() else "cpu"
@@ -48,6 +66,7 @@ feature_extractor = AutoFeatureExtractor.from_pretrained(repo_id)
 print("Parler-TTS model loaded.")
 # --- Audio Streaming Generator Function ---
 def stream_alert_audio(text_prompt):
     """
     A generator function that yields audio chunks for a given text prompt.
@@ -87,6 +106,7 @@ def stream_alert_audio(text_prompt):
         alerter.reset_alert()
 # --- Main Webcam Processing Function ---
 def process_live_frame(frame):
     """
     Processes each webcam frame, performs drowsiness detection, and
@@ -130,7 +150,7 @@ with gr.Blocks(theme=gr.themes.Default(primary_hue="blue")) as app:
     with gr.Row():
         with gr.Column(scale=2):
-            webcam_input = gr.Image(sources=["webcam"], streaming=True, label="Live Camera Feed")
         with gr.Column(scale=1):
             processed_output = gr.Image(label="Processed Feed")
             status_output = gr.Textbox(label="Live Status", lines=3, interactive=False)
@@ -139,14 +159,15 @@ with gr.Blocks(theme=gr.themes.Default(primary_hue="blue")) as app:
             audio_alert_output = gr.Audio(
                 label="Alert System",
                 autoplay=True,
-                visible=False, # Hide the player controls
                 streaming=True
             )
     webcam_input.stream(
         fn=process_live_frame,
         inputs=[webcam_input],
-        outputs=[processed_output, status_output, audio_alert_output]
     )

 import yaml
 from dotenv import load_dotenv
 from threading import Thread
+from gradio_webrtc import WebRTC
+from twilio.rest import Client
 # --- TTS & AI Imports ---
 from parler_tts import ParlerTTSForConditionalGeneration
 alerter = get_alerter(config, secrets["gemini_api_key"])
 print("Initialization complete. Launching UI...")
+account_sid = os.environ.get("TURN_USERNAME")
+auth_token = os.environ.get("TURN_CREDENTIAL")
+if account_sid and auth_token:
+    client = Client(account_sid, auth_token)
+    token = client.tokens.create()
+    rtc_configuration = {
+        "iceServers": token.ice_servers,
+        "iceTransportPolicy": "relay",
+    }
+else:
+    rtc_configuration = None
 # --- Parler-TTS Model Setup (Requires GPU) ---
 print("Loading Parler-TTS model. This may take a moment...")
 device = "cuda:0" if torch.cuda.is_available() else "cpu"
 print("Parler-TTS model loaded.")
 # --- Audio Streaming Generator Function ---
+@spaces.GPU
 def stream_alert_audio(text_prompt):
     """
     A generator function that yields audio chunks for a given text prompt.
         alerter.reset_alert()
 # --- Main Webcam Processing Function ---
+@spaces.GPU
 def process_live_frame(frame):
     """
     Processes each webcam frame, performs drowsiness detection, and
     with gr.Row():
         with gr.Column(scale=2):
+            webcam_input = WebRTC(label="Stream", rtc_configuration=rtc_configuration)
         with gr.Column(scale=1):
             processed_output = gr.Image(label="Processed Feed")
             status_output = gr.Textbox(label="Live Status", lines=3, interactive=False)
             audio_alert_output = gr.Audio(
                 label="Alert System",
                 autoplay=True,
+                visible=True, # Show the player controls
                 streaming=True
             )
     webcam_input.stream(
         fn=process_live_frame,
         inputs=[webcam_input],
+        outputs=[status_output, audio_alert_output],
+        time_limit=10
     )