Spaces:

MicroHealth
/

AV-to-transcripts

Paused

App Files Community

bluenevus committed on Apr 24

Commit

aed95f4

verified ·

1 Parent(s): 330af25

Update app.py

Browse files

Files changed (1) hide show

app.py +25 -23

app.py CHANGED Viewed

@@ -127,9 +127,9 @@ Now, please process the following transcribed text:
 def transcribe_video(url):
     try:
-        print(f"Attempting to download audio from URL: {url}")
         audio_bytes = download_audio_from_url(url)
-        print(f"Successfully downloaded {len(audio_bytes)} bytes of audio data")
         with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as temp_audio:
             AudioSegment.from_file(io.BytesIO(audio_bytes)).export(temp_audio.name, format="wav")
@@ -140,13 +140,21 @@ def transcribe_video(url):
         if len(transcript) < 10:
             raise ValueError("Transcription too short, possibly failed")
-        print("Separating speakers...")
-        separated_transcript = separate_speakers(transcript)
-        return separated_transcript
     except Exception as e:
         error_message = f"An error occurred: {str(e)}"
-        print(error_message)
         return error_message
 app = dash.Dash(__name__, external_stylesheets=[dbc.themes.BOOTSTRAP])
@@ -182,23 +190,17 @@ def update_transcription(n_clicks, url):
     if not url:
         raise PreventUpdate
-    def transcribe():
-        try:
-            transcript = transcribe_video(url)
-            return transcript
-        except Exception as e:
-            logger.exception("Error in transcription:")
-            return f"An error occurred: {str(e)}"
-    # Run transcription in a separate thread
-    thread = threading.Thread(target=transcribe)
-    thread.start()
-    thread.join(timeout=600)  # 10 minutes timeout
-    if thread.is_alive():
-        return "Transcription timed out after 10 minutes", {'display': 'none'}
-    transcript = getattr(thread, 'result', "Transcription failed")
     if transcript and not transcript.startswith("An error occurred"):
         return dbc.Card([

 def transcribe_video(url):
     try:
+        logger.info(f"Attempting to download audio from URL: {url}")
         audio_bytes = download_audio_from_url(url)
+        logger.info(f"Successfully downloaded {len(audio_bytes)} bytes of audio data")
         with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as temp_audio:
             AudioSegment.from_file(io.BytesIO(audio_bytes)).export(temp_audio.name, format="wav")
         if len(transcript) < 10:
             raise ValueError("Transcription too short, possibly failed")
+        logger.info("Separating speakers...")
+        try:
+            separated_transcript = separate_speakers(transcript)
+            logger.info(f"Speaker separation complete. Result length: {len(separated_transcript)} characters")
+            if len(separated_transcript) < 10:
+                logger.warning("Speaker separation result too short, using original transcript")
+                return transcript
+            return separated_transcript
+        except Exception as e:
+            logger.error(f"Error during speaker separation: {str(e)}")
+            logger.info("Returning original transcript without speaker separation")
+            return transcript
     except Exception as e:
         error_message = f"An error occurred: {str(e)}"
+        logger.error(error_message)
         return error_message
 app = dash.Dash(__name__, external_stylesheets=[dbc.themes.BOOTSTRAP])
     if not url:
         raise PreventUpdate
+    transcript = transcribe_video(url)
+    if transcript and not transcript.startswith("An error occurred"):
+        return dbc.Card([
+            dbc.CardBody([
+                html.H5("Transcription Result with Speaker Separation"),
+                html.Pre(transcript, style={"white-space": "pre-wrap", "word-wrap": "break-word"})
+            ])
+        ]), {'display': 'block'}
+    else:
+        return transcript, {'display': 'none'}
     if transcript and not transcript.startswith("An error occurred"):
         return dbc.Card([