whisper-tg

Paused

App Files Files Community

muhtasham committed on Mar 25

Commit

a231b66

1 Parent(s): 0900fc2

WIP

Browse files

Files changed (1) hide show

app.py +8 -18

app.py CHANGED Viewed

@@ -270,11 +270,6 @@ def transcribe_youtube(url, return_timestamps, generate_subs, chunk_length_s=15,
         logger.info(f"Transcription metadata: {metadata}")
         logger.info(f"Transcription completed in {metadata.get('timing', {}).get('total_time', 0):.2f} seconds")
-        # Format response with segments (without id)
-        logger.info("Formatting response...")
-        formatted_result = result["transcription"]
-        logger.info(f"Formatted result contains {len(formatted_result['segments'])} segments")
         # Generate subtitles if requested
         srt_file = None
         if generate_subs and return_timestamps and "segments" in result["transcription"]:
@@ -284,7 +279,7 @@ def transcribe_youtube(url, return_timestamps, generate_subs, chunk_length_s=15,
             logger.info(f"Generated SRT file: {srt_file}")
         logger.info("YouTube transcription process completed successfully")
-        return {"transcription": formatted_result, "metadata": result["metadata"]}, result, srt_file, ""
     except Exception as e:
         logger.exception(f"Error in YouTube transcription: {str(e)}")
@@ -331,11 +326,6 @@ def transcribe(inputs, return_timestamps, generate_subs, chunk_length_s=15, batc
             logger.info(f"Transcription metadata: {metadata}")
             logger.info(f"Transcription completed in {metadata.get('timing', {}).get('total_time', 0):.2f} seconds")
-            # Format response with segments (without id)
-            logger.info("Formatting response...")
-            formatted_result = result["transcription"]
-            logger.info(f"Formatted result contains {len(formatted_result['segments'])} segments")
             # Generate subtitles if requested
             srt_file = None
             if generate_subs and return_timestamps and "segments" in result["transcription"]:
@@ -345,7 +335,7 @@ def transcribe(inputs, return_timestamps, generate_subs, chunk_length_s=15, batc
                 logger.info(f"Generated SRT file: {srt_file}")
             logger.info("Transcription process completed successfully")
-            return {"transcription": formatted_result, "metadata": result["metadata"]}, result, srt_file, ""
     except requests.exceptions.RequestException as e:
         logger.exception(f"API request failed: {str(e)}")
@@ -368,9 +358,9 @@ youtube_transcribe = gr.Interface(
         gr.Slider(minimum=8, maximum=128, value=8, step=8, label="Batch Size")
     ],
     outputs=[
-        gr.JSON(label="Formatted Response", open=True),
-        gr.JSON(label="Raw API Response", open=True),
         gr.File(label="Subtitles (SRT)", visible=True),
     ],
     title="Tajik Speech Transcription",
     description=(
@@ -393,9 +383,9 @@ mf_transcribe = gr.Interface(
         gr.Slider(minimum=8, maximum=128, value=8, step=8, label="Batch Size")
     ],
     outputs=[
-        gr.JSON(label="Formatted Response", open=True),
-        gr.JSON(label="Raw API Response", open=True),
         gr.File(label="Subtitles (SRT)", visible=True),
     ],
     title="Tajik Speech Transcription",
     description=(
@@ -415,9 +405,9 @@ file_transcribe = gr.Interface(
         gr.Slider(minimum=8, maximum=128, value=8, step=8, label="Batch Size")
     ],
     outputs=[
-        gr.JSON(label="Formatted Response", open=True),
-        gr.JSON(label="Raw API Response", open=True),
         gr.File(label="Subtitles (SRT)", visible=True),
     ],
     title="Tajik Speech Transcription",
     description=(

         logger.info(f"Transcription metadata: {metadata}")
         logger.info(f"Transcription completed in {metadata.get('timing', {}).get('total_time', 0):.2f} seconds")
         # Generate subtitles if requested
         srt_file = None
         if generate_subs and return_timestamps and "segments" in result["transcription"]:
             logger.info(f"Generated SRT file: {srt_file}")
         logger.info("YouTube transcription process completed successfully")
+        return result, srt_file, ""
     except Exception as e:
         logger.exception(f"Error in YouTube transcription: {str(e)}")
             logger.info(f"Transcription metadata: {metadata}")
             logger.info(f"Transcription completed in {metadata.get('timing', {}).get('total_time', 0):.2f} seconds")
             # Generate subtitles if requested
             srt_file = None
             if generate_subs and return_timestamps and "segments" in result["transcription"]:
                 logger.info(f"Generated SRT file: {srt_file}")
             logger.info("Transcription process completed successfully")
+            return result, srt_file, ""
     except requests.exceptions.RequestException as e:
         logger.exception(f"API request failed: {str(e)}")
         gr.Slider(minimum=8, maximum=128, value=8, step=8, label="Batch Size")
     ],
     outputs=[
+        gr.JSON(label="API Response", open=True),
         gr.File(label="Subtitles (SRT)", visible=True),
+        gr.Textbox(label="Error", visible=False)
     ],
     title="Tajik Speech Transcription",
     description=(
         gr.Slider(minimum=8, maximum=128, value=8, step=8, label="Batch Size")
     ],
     outputs=[
+        gr.JSON(label="API Response", open=True),
         gr.File(label="Subtitles (SRT)", visible=True),
+        gr.Textbox(label="Error", visible=False)
     ],
     title="Tajik Speech Transcription",
     description=(
         gr.Slider(minimum=8, maximum=128, value=8, step=8, label="Batch Size")
     ],
     outputs=[
+        gr.JSON(label="API Response", open=True),
         gr.File(label="Subtitles (SRT)", visible=True),
+        gr.Textbox(label="Error", visible=False)
     ],
     title="Tajik Speech Transcription",
     description=(