Spaces:

MothersTongue
/

voice-matcher-api

Running on T4

App Files Community

arnabg95 committed on Jun 21, 2024

Commit

b4a191d

1 Parent(s): fcbfe77

model updated

Browse files

Files changed (5) hide show

app/__pycache__/passing.cpython-310.pyc +0 -0
app/__pycache__/transcriber.cpython-310.pyc +0 -0
app/routers/V1/voice/__pycache__/voice_router.cpython-310.pyc +0 -0
app/routers/V1/voice/voice_router.py +17 -17
app/transcriber.py +2 -1

app/__pycache__/passing.cpython-310.pyc CHANGED Viewed

Binary files a/app/__pycache__/passing.cpython-310.pyc and b/app/__pycache__/passing.cpython-310.pyc differ

app/__pycache__/transcriber.cpython-310.pyc CHANGED Viewed

Binary files a/app/__pycache__/transcriber.cpython-310.pyc and b/app/__pycache__/transcriber.cpython-310.pyc differ

app/routers/V1/voice/__pycache__/voice_router.cpython-310.pyc CHANGED Viewed

Binary files a/app/routers/V1/voice/__pycache__/voice_router.cpython-310.pyc and b/app/routers/V1/voice/__pycache__/voice_router.cpython-310.pyc differ

app/routers/V1/voice/voice_router.py CHANGED Viewed

@@ -23,25 +23,25 @@ async def transcribe_audio(
 ):
     try:
         # Validate URL
-        if not original_url.endswith(".wav"):
-            raise HTTPException(
-                status_code=status.HTTP_400_BAD_REQUEST,
-                detail="Invalid URL. Please provide a URL pointing to a wav file.",
-            )
-        # Download the audio file from the URL
-        response = requests.get(original_url)
-        if response.status_code != 200:
-            raise HTTPException(
-                status_code=status.HTTP_400_BAD_REQUEST,
-                detail="Unable to download the audio file from the URL.",
-            )
-        filename_original = f"audio_{int(time.time())}_original.wav"
-        # Save the downloaded file temporarily
-        with open(filename_original, "wb") as buffer:
-            buffer.write(response.content)
         # Read file bytes
         recorded_bytes = await recorded.read()
@@ -65,7 +65,7 @@ async def transcribe_audio(
             )
         finally:
             # Clean up the temporary file
-            os.remove(filename_original)
             os.remove(filename_recorded)
     except Exception as e:

 ):
     try:
         # Validate URL
+        # if not original_url.endswith(".wav"):
+        #     raise HTTPException(
+        #         status_code=status.HTTP_400_BAD_REQUEST,
+        #         detail="Invalid URL. Please provide a URL pointing to a wav file.",
+        #     )
+        # # Download the audio file from the URL
+        # response = requests.get(original_url)
+        # if response.status_code != 200:
+        #     raise HTTPException(
+        #         status_code=status.HTTP_400_BAD_REQUEST,
+        #         detail="Unable to download the audio file from the URL.",
+        #     )
+        # filename_original = f"audio_{int(time.time())}_original.wav"
+        # # Save the downloaded file temporarily
+        # with open(filename_original, "wb") as buffer:
+        #     buffer.write(response.content)
         # Read file bytes
         recorded_bytes = await recorded.read()
             )
         finally:
             # Clean up the temporary file
+            # os.remove(filename_original)
             os.remove(filename_recorded)
     except Exception as e:

app/transcriber.py CHANGED Viewed

@@ -6,8 +6,9 @@ from datasets import load_dataset
 device = "cuda:0" if torch.cuda.is_available() else "cpu"
 torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
-model_id = "openai/whisper-large-v3"
 # model_id = "MothersTongue/mother_tongue_model"
 model = AutoModelForSpeechSeq2Seq.from_pretrained(
     model_id, torch_dtype=torch_dtype, low_cpu_mem_usage=True, use_safetensors=True

 device = "cuda:0" if torch.cuda.is_available() else "cpu"
 torch_dtype = torch.float16 if torch.cuda.is_available() else torch.float32
+# model_id = "openai/whisper-large-v3"
 # model_id = "MothersTongue/mother_tongue_model"
+model_id = "MothersTongue/mother_tongue_model_v3"
 model = AutoModelForSpeechSeq2Seq.from_pretrained(
     model_id, torch_dtype=torch_dtype, low_cpu_mem_usage=True, use_safetensors=True