Spaces:

RakanAlsheraiwi
/

Pronunciation_feedback

App Files Files Community

RakanAlsheraiwi committed on Aug 14

Commit

938d676

•

1 Parent(s): 2551a01

Update app.py

Browse files

Files changed (1) hide show

app.py +32 -12

app.py CHANGED Viewed

@@ -1,16 +1,35 @@
 import gradio as gr
 import difflib
-# Function to simulate pronunciation feedback
-def pronunciation_feedback(user_audio, sentence):
-    # Simulate a correct pronunciation for the given sentence
-    correct_text = sentence.lower()
-    # Convert audio to text using speech recognition (mocking this part for the example)
-    user_text = "This is a sample text."  # Replace with actual speech recognition result
     # Compare the user's text with the correct text
-    ratio = difflib.SequenceMatcher(None, correct_text, user_text.lower()).ratio()
     # Generate feedback based on similarity
     if ratio > 0.9:
@@ -19,19 +38,20 @@ def pronunciation_feedback(user_audio, sentence):
         feedback = "Good job! But you can improve your pronunciation on some words."
     else:
         feedback = "Keep practicing! Try to mimic the pronunciation more closely."
-    return feedback
 # Gradio Interface
 interface = gr.Interface(
     fn=pronunciation_feedback,
     inputs=[
         gr.Audio(type="filepath", label="Record your pronunciation"),
-        gr.Textbox(lines=2, label="Sentence to pronounce", value="This is a sample text.")
     ],
     outputs="text",
-    title="Pronunciation Trainer",
-    description="Record yourself pronouncing the given sentence and receive feedback on your pronunciation."
 )
 interface.launch()

 import gradio as gr
 import difflib
+import speech_recognition as sr
+import random
+# Function to perform speech recognition and provide feedback
+def pronunciation_feedback(user_audio, language):
+    # Initialize recognizer
+    recognizer = sr.Recognizer()
+    # Load the audio file
+    with sr.AudioFile(user_audio) as source:
+        audio_data = recognizer.record(source)
+    # Convert audio to text
+    try:
+        user_text = recognizer.recognize_google(audio_data, language=language)
+    except sr.UnknownValueError:
+        return "Sorry, I couldn't understand the audio. Please try again."
+    except sr.RequestError:
+        return "There was an error with the speech recognition service. Please try again later."
+    # Pick the target sentence to score against. NOTE: it is chosen at random only after the recording has been transcribed, so the speaker is never shown it beforehand.
+    sentence = random.choice([
+        "This is a simple test sentence.",
+        "I would like to improve my pronunciation.",
+        "Artificial intelligence is transforming the world.",
+        "Gradio is a fantastic tool for machine learning applications."
+    ]).lower()
     # Compare the user's text with the correct text
+    ratio = difflib.SequenceMatcher(None, sentence, user_text.lower()).ratio()
     # Generate feedback based on similarity
     if ratio > 0.9:
         feedback = "Good job! But you can improve your pronunciation on some words."
     else:
         feedback = "Keep practicing! Try to mimic the pronunciation more closely."
+    # Return feedback and the correct sentence for comparison
+    return f"Recognized Text: {user_text}\n\nTarget Sentence: {sentence}\n\nFeedback: {feedback}"
 # Gradio Interface
 interface = gr.Interface(
     fn=pronunciation_feedback,
     inputs=[
         gr.Audio(type="filepath", label="Record your pronunciation"),
+        gr.Dropdown(["en-US", "en-GB", "fr-FR", "es-ES"], label="Select Language", value="en-US")
     ],
     outputs="text",
+    title="Smart Pronunciation Trainer",
+    description="Record yourself pronouncing the given sentence in your selected language and receive AI-powered feedback."
 )
 interface.launch()