Spaces:

mehdi364
/

Speech_to_text

Sleeping

mehdi364 committed 24 days ago

Commit

2b4320d

verified ·

1 Parent(s): 0b41553

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,19 +1,12 @@
 import gradio as gr
-from transformers import pipeline
-def transcribe_audio(audio):
-    transcriber = pipeline("automatic-speech-recognition", model="openai/whisper-base")
-    result = transcriber(audio)
-    return result['text']
-interface = gr.Interface(
-    fn=transcribe_audio,
-    inputs=gr.Audio(source="microphone", type="filepath", label="Input Audio"),
-    outputs="text",
-    live=True,
-    title="Speech to Text - Persian",
-    description="Record your voice in Persian and see the transcription here."
-)
-if __name__ == "__main__":
-    interface.launch()

 import gradio as gr
+import torchaudio
+def transcribe(audio):
+    recognizer = sr.Recognizer()
+    with sr.AudioFile(audio) as source:
+        audio_data = recognizer.record(source)
+        text = recognizer.recognize_google(audio_data, language="fa-IR")
+        return text
+interface = gr.Interface(fn=transcribe, inputs="microphone", outputs="text")
+interface.launch()