Spaces:

omarxadel
/

egyptian-arabic-speech-to-text

Running

omarxadel committed on Oct 13, 2023

Commit

6249202

1 Parent(s): 9562dfe

feat: created gradio app with model

Files changed (2) hide show

.gitignore ADDED Viewed

	@@ -0,0 +1 @@


1	+ .idea

app.py ADDED Viewed

+import os
+import time
+import gradio as gr
+import requests
+import soundfile as sf
+import torch
+from transformers import HubertForCTC, Wav2Vec2Processor
+API_URL = "https://api-inference.huggingface.co/models/omarxadel/hubert-large-arabic-egyptian"
+token = os.environ['apikey']
+headers = {"Authorization": token}
+def transcribe(audio, state=""):
+    time.sleep(2)
+    # Load model from HuggingFace Hub
+    with open(audio, "rb") as f:
+        data = f.read()
+    response = requests.post(API_URL, headers=headers, data=data)
+    output = response.json()["text"]
+    state += output + " "
+    return state, state
+gr.Interface(
+    fn=transcribe,
+    inputs=[
+        gr.Audio(source="microphone", type="filepath", streaming=True),
+        "state"
+    ],
+    outputs=[
+        "textbox",
+        "state"
+    ],
+    live=True).launch(share=True)