Spaces:

Pushkar0655g
/

multilingual-subtitle-tool

Running

App Files Files Community

Pushkar0655g committed on Mar 19

Commit

07cf4bd

1 Parent(s): cf544a5

Update utils.py to fix openai-whisper compatibility and improve error handling

Browse files

Files changed (1) hide show

utils.py +23 -6

utils.py CHANGED Viewed

@@ -1,19 +1,32 @@
-import openai_whisper as whisper
 from transformers import MarianMTModel, MarianTokenizer, AutoTokenizer, AutoModelForSeq2SeqLM
 import os
 # Load Whisper model
-model = whisper.load_model("base")
 def process_video(video_file, language):
     # Save uploaded video locally
     video_path = "/tmp/video.mp4"
-    with open(video_path, "wb") as f:
-        f.write(video_file.read())
     try:
         print("Transcribing video to English...")
         result = model.transcribe(video_path, language="en")
         segments = []
         if language == "English":
@@ -42,7 +55,10 @@ def process_video(video_file, language):
                     "Arabic": "Helsinki-NLP/opus-mt-en-ar",
                     "Japanese": "Helsinki-NLP/opus-mt-en-jap"
                 }
-                model_name = model_map[language]
                 tokenizer = MarianTokenizer.from_pretrained(model_name)
                 translation_model = MarianMTModel.from_pretrained(model_name)
                 print(f"Translating to {language}...")
@@ -60,7 +76,8 @@ def process_video(video_file, language):
                 end = f"{segment['end']:.3f}".replace(".", ",")
                 text = segment["text"].strip()
                 f.write(f"{i}\n00:00:{start} --> 00:00:{end}\n{text}\n\n")
         return srt_path
     except Exception as e:
-        return f"Error: {str(e)}"

+import openai_whisper as whisper  # NOTE(review): the openai-whisper package normally exposes its module as `whisper`; confirm that `openai_whisper` actually resolves
 from transformers import MarianMTModel, MarianTokenizer, AutoTokenizer, AutoModelForSeq2SeqLM
 import os
 # Load Whisper model
+try:
+    print("Loading Whisper model...")
+    model = whisper.load_model("base")
+    print("Whisper model loaded successfully!")
+except Exception as e:
+    raise ImportError(f"Failed to load Whisper model: {e}")
 def process_video(video_file, language):
+    """
+    Process the uploaded video and generate subtitles in the specified language.
+    """
     # Save uploaded video locally
     video_path = "/tmp/video.mp4"
+    try:
+        with open(video_path, "wb") as f:
+            f.write(video_file.read())
+        print(f"Video saved to {video_path}")
+    except Exception as e:
+        return f"Error saving video file: {str(e)}"
     try:
         print("Transcribing video to English...")
         result = model.transcribe(video_path, language="en")
+        print("Transcription completed!")
         segments = []
         if language == "English":
                     "Arabic": "Helsinki-NLP/opus-mt-en-ar",
                     "Japanese": "Helsinki-NLP/opus-mt-en-jap"
                 }
+                model_name = model_map.get(language)
+                if not model_name:
+                    return f"Unsupported language: {language}"
                 tokenizer = MarianTokenizer.from_pretrained(model_name)
                 translation_model = MarianMTModel.from_pretrained(model_name)
                 print(f"Translating to {language}...")
                 end = f"{segment['end']:.3f}".replace(".", ",")
                 text = segment["text"].strip()
                 f.write(f"{i}\n00:00:{start} --> 00:00:{end}\n{text}\n\n")
+        print(f"SRT file created at {srt_path}")
         return srt_path
     except Exception as e:
+        return f"Error processing video: {str(e)}"