Spaces:

Pushkar0655g
/

multilingual-subtitle-tool

Running

App Files Community

Pushkar0655g committed on Mar 19

Commit

beae951

1 Parent(s): 67a18a1

Fix file type validation and improve UI

Browse files

Files changed (1) hide show

utils.py +21 -28

utils.py CHANGED Viewed

@@ -7,26 +7,23 @@ import subprocess
 # Load Whisper model
 model = whisper.load_model("base")
-def process_video(video_file, language):
-    # Save uploaded video to a temporary file
-    temp_dir = tempfile.gettempdir()
-    video_path = os.path.join(temp_dir, "input_video")  # No extension
-    output_video_path = os.path.join(temp_dir, "converted_video.mp4")  # Convert to MP4 for compatibility
     try:
-        # Save the uploaded file
-        print("Saving uploaded video...")
-        with open(video_path, "wb") as f:
-            f.write(video_file.read())
-        print(f"Video saved to {video_path}")
-        # Convert the video to MP4 using ffmpeg
         print("Converting video to MP4...")
-        subprocess.run(["ffmpeg", "-i", video_path, "-c:v", "libx264", "-preset", "fast", output_video_path], check=True)
-        print(f"Video converted and saved to {output_video_path}")
-        # Transcribe the video
-        print("Transcribing video to English...")
         result = model.transcribe(output_video_path, language="en")
         print("Transcription completed!")
@@ -35,7 +32,6 @@ def process_video(video_file, language):
         if language == "English":
             segments = result["segments"]
         else:
-            # Define translation models
             model_map = {
                 "Hindi": "Helsinki-NLP/opus-mt-en-hi",
                 "Spanish": "Helsinki-NLP/opus-mt-en-es",
@@ -52,12 +48,11 @@ def process_video(video_file, language):
             if not model_name:
                 return f"Unsupported language: {language}"
-            print(f"Loading translation model for {language}: {model_name}")
             if language == "Telugu":
                 tokenizer = AutoTokenizer.from_pretrained(model_name)
                 translation_model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
                 tgt_lang = "tel_Telu"
-                print(f"Translating to Telugu using NLLB-200 Distilled...")
                 for segment in result["segments"]:
                     inputs = tokenizer(segment["text"], return_tensors="pt", padding=True)
                     translated_tokens = translation_model.generate(
@@ -68,7 +63,6 @@ def process_video(video_file, language):
             else:
                 tokenizer = MarianTokenizer.from_pretrained(model_name)
                 translation_model = MarianMTModel.from_pretrained(model_name)
-                print(f"Translating to {language}...")
                 for segment in result["segments"]:
                     inputs = tokenizer(segment["text"], return_tensors="pt", padding=True)
                     translated = translation_model.generate(**inputs)
@@ -76,8 +70,6 @@ def process_video(video_file, language):
                     segments.append({"text": translated_text, "start": segment["start"], "end": segment["end"]})
         # Create SRT file
-        srt_path = os.path.join(tempfile.gettempdir(), "subtitles.srt")
-        print(f"Creating SRT file at {srt_path}")
         with open(srt_path, "w", encoding="utf-8") as f:
             for i, segment in enumerate(segments, 1):
                 start = f"{segment['start']:.3f}".replace(".", ",")
@@ -88,13 +80,14 @@ def process_video(video_file, language):
         return srt_path
     except subprocess.CalledProcessError as e:
-        return f"FFmpeg Error: {str(e)}"
     except Exception as e:
-        return f"Unexpected Error: {str(e)}"
     finally:
         # Clean up temporary files
-        print("Cleaning up temporary files...")
-        if os.path.exists(video_path):
-            os.remove(video_path)
         if os.path.exists(output_video_path):
-            os.remove(output_video_path)

 # Load Whisper model
 model = whisper.load_model("base")
+def process_video(video_path, language):  # Accept file path, not file object
+    output_video_path = os.path.join(tempfile.gettempdir(), "converted_video.mp4")
+    srt_path = os.path.join(tempfile.gettempdir(), "subtitles.srt")
     try:
+        # Convert video to MP4 using ffmpeg
         print("Converting video to MP4...")
+        subprocess.run(
+            ["ffmpeg", "-i", video_path, "-c:v", "libx264", "-preset", "fast", output_video_path],
+            check=True,  # Raise error if ffmpeg fails
+            stdout=subprocess.PIPE,
+            stderr=subprocess.PIPE
+        )
+        print("Video converted successfully!")
+        # Transcribe video
+        print("Transcribing video...")
         result = model.transcribe(output_video_path, language="en")
         print("Transcription completed!")
         if language == "English":
             segments = result["segments"]
         else:
             model_map = {
                 "Hindi": "Helsinki-NLP/opus-mt-en-hi",
                 "Spanish": "Helsinki-NLP/opus-mt-en-es",
             if not model_name:
                 return f"Unsupported language: {language}"
+            print(f"Loading translation model: {model_name}")
             if language == "Telugu":
                 tokenizer = AutoTokenizer.from_pretrained(model_name)
                 translation_model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
                 tgt_lang = "tel_Telu"
                 for segment in result["segments"]:
                     inputs = tokenizer(segment["text"], return_tensors="pt", padding=True)
                     translated_tokens = translation_model.generate(
             else:
                 tokenizer = MarianTokenizer.from_pretrained(model_name)
                 translation_model = MarianMTModel.from_pretrained(model_name)
                 for segment in result["segments"]:
                     inputs = tokenizer(segment["text"], return_tensors="pt", padding=True)
                     translated = translation_model.generate(**inputs)
                     segments.append({"text": translated_text, "start": segment["start"], "end": segment["end"]})
         # Create SRT file
         with open(srt_path, "w", encoding="utf-8") as f:
             for i, segment in enumerate(segments, 1):
                 start = f"{segment['start']:.3f}".replace(".", ",")
         return srt_path
     except subprocess.CalledProcessError as e:
+        print(f"FFmpeg Error: {e.stderr.decode()}")
+        return None
     except Exception as e:
+        print(f"Unexpected Error: {str(e)}")
+        return None
     finally:
         # Clean up temporary files
         if os.path.exists(output_video_path):
+            os.remove(output_video_path)
+        if os.path.exists(video_path):
+            os.remove(video_path)