Spaces:

greg0rs
/

fonetik-fast

Running

App Files Community

greg0rs committed 23 days ago

Commit

a02bc29

verified ·

1 Parent(s): 8f2f9cb

Update app.py

Browse files

Files changed (1) hide show

app.py +30 -3

app.py CHANGED Viewed

@@ -306,7 +306,7 @@ def load_whisperx_models():
     if whisperx_model is None:
         log("Loading WhisperX models for English-only processing...")
         try:
-            # Load WhisperX model with English-only configuration
             whisperx_model = whisperx.load_model("base.en", device="cpu", compute_type="float32", language="en")
             log("WhisperX base.en model loaded successfully")
@@ -314,17 +314,44 @@ def load_whisperx_models():
             whisperx_align_model, whisperx_metadata = whisperx.load_align_model(language_code="en", device="cpu")
             log("WhisperX English alignment model loaded successfully")
         except Exception as e:
             log(f"Error loading WhisperX models: {e}")
             # Fallback: try with smaller English-only model
             try:
                 log("Trying fallback with tiny.en model...")
-                whisperx_model = whisperx.load_model("tiny.en", device="cpu", compute_type="float32", language="en")
                 whisperx_align_model, whisperx_metadata = whisperx.load_align_model(language_code="en", device="cpu")
                 log("WhisperX models loaded with fallback (tiny.en model)")
             except Exception as fallback_error:
                 log(f"Fallback also failed: {fallback_error}")
-                raise
 def convert_webm_to_wav(bts):
     p = subprocess.run(["ffmpeg", "-i", "pipe:0", "-f", "wav", "-ar", "16000", "-ac", "1", "pipe:1"],

     if whisperx_model is None:
         log("Loading WhisperX models for English-only processing...")
         try:
+            # Try loading with base.en first
             whisperx_model = whisperx.load_model("base.en", device="cpu", compute_type="float32", language="en")
             log("WhisperX base.en model loaded successfully")
             whisperx_align_model, whisperx_metadata = whisperx.load_align_model(language_code="en", device="cpu")
             log("WhisperX English alignment model loaded successfully")
+        except ImportError as ie:
+            log(f"Import error loading WhisperX models: {ie}")
+            # Try without ctranslate2 by using int8 compute type
+            try:
+                log("Trying fallback with int8 compute type...")
+                whisperx_model = whisperx.load_model("base.en", device="cpu", compute_type="int8", language="en")
+                whisperx_align_model, whisperx_metadata = whisperx.load_align_model(language_code="en", device="cpu")
+                log("WhisperX models loaded with int8 compute type")
+            except Exception as fallback_error:
+                log(f"Int8 fallback also failed: {fallback_error}")
+                # Last resort: try tiny model with default compute
+                try:
+                    log("Trying final fallback with tiny.en model and default compute...")
+                    whisperx_model = whisperx.load_model("tiny.en", device="cpu", language="en")
+                    whisperx_align_model, whisperx_metadata = whisperx.load_align_model(language_code="en", device="cpu")
+                    log("WhisperX models loaded with tiny.en and default compute")
+                except Exception as final_error:
+                    log(f"All WhisperX loading attempts failed: {final_error}")
+                    raise RuntimeError("Unable to load WhisperX models. Please check environment setup.")
         except Exception as e:
             log(f"Error loading WhisperX models: {e}")
             # Fallback: try with smaller English-only model
             try:
                 log("Trying fallback with tiny.en model...")
+                whisperx_model = whisperx.load_model("tiny.en", device="cpu", compute_type="int8", language="en")
                 whisperx_align_model, whisperx_metadata = whisperx.load_align_model(language_code="en", device="cpu")
                 log("WhisperX models loaded with fallback (tiny.en model)")
             except Exception as fallback_error:
                 log(f"Fallback also failed: {fallback_error}")
+                # Final attempt without compute_type specification
+                try:
+                    log("Final attempt with default settings...")
+                    whisperx_model = whisperx.load_model("tiny.en", device="cpu", language="en")
+                    whisperx_align_model, whisperx_metadata = whisperx.load_align_model(language_code="en", device="cpu")
+                    log("WhisperX models loaded with default settings")
+                except Exception as final_error:
+                    log(f"All attempts failed: {final_error}")
+                    raise RuntimeError("Unable to load WhisperX models in this environment")
 def convert_webm_to_wav(bts):
     p = subprocess.run(["ffmpeg", "-i", "pipe:0", "-f", "wav", "-ar", "16000", "-ac", "1", "pipe:1"],