Spaces:

ar08
/

Voice-assitant

Paused

App Files Community

ar08 committed on Oct 15, 2024

Commit

8d734b4

verified ·

1 Parent(s): a96339a

Update app.py

Browse files

Files changed (1) hide show

app.py +29 -58

app.py CHANGED Viewed

@@ -104,78 +104,42 @@ def transcribe_and_chat(audio):
     return response, audio_path
 def create_demo():
-    with gr.Blocks(theme=gr.themes.Soft()) as demo:
         gr.Markdown(
             """
-            # 🎙️ AI Voice Assistant
-            Welcome to your personal voice assistant! Have a natural conversation with an AI-powered assistant.
-            Simply record your voice, and I'll respond with both text and speech.
             """
         )
         with gr.Row():
             with gr.Column(scale=1):
-                audio_input = gr.Audio(
-                    type="filepath",
-                    label="🎤 Speak your message",
-                    elem_id="audio-input"
-                )
-                voice_volume = gr.Slider(
-                    minimum=0,
-                    maximum=2,
-                    value=1,
-                    step=0.1,
-                    label="🔊 Assistant Voice Volume",
-                    elem_id="voice-volume"
-                )
             with gr.Column(scale=1):
-                chat_output = gr.Chatbot(
-                    label="Conversation",
-                    elem_id="chat-output",
-                    height=400
-                )
-                audio_output = gr.Audio(
-                    label="🔈 AI Voice Response",
-                    autoplay=True,
-                    elem_id="audio-output"
-                )
-        with gr.Row():
-            clear_button = gr.Button("🗑️ Clear Chat", variant="secondary", elem_id="clear-button")
-            submit_button = gr.Button("🚀 Submit", variant="primary", elem_id="submit-button")
         # Processing the audio input
-        def process_audio(audio, volume, history):
             logging.info(f"Received audio: {audio}")
             if audio is None:
-                return history + [("No audio detected. Please try recording again.", None)], None
-            transcribed_text = whisper_speech_to_text(audio)
-            if not transcribed_text:
-                return history + [("Sorry, I couldn't understand the audio. Please try again.", None)], None
-            response, audio_path = asyncio.run(chat_with_ai(transcribed_text))
             # Adjust volume for the response audio
             adjusted_audio_path = asyncio.run(text_to_speech_stream(response, volume))
             logging.info(f"Response: {response}, Audio path: {adjusted_audio_path}")
-            new_history = history + [(transcribed_text, response)]
-            return new_history, adjusted_audio_path
-        submit_button.click(
-            process_audio,
-            inputs=[audio_input, voice_volume, chat_output],
-            outputs=[chat_output, audio_output]
-        )
-        clear_button.click(
-            lambda: ([], None),
-            outputs=[chat_output, audio_output]
-        )
-        # JavaScript to handle autoplay and auto-listen
         demo.load(None, js="""
             function() {
                 var recordButton;
@@ -199,17 +163,24 @@ def create_demo():
                     }
                 }
-                document.querySelector("#audio-output").addEventListener("ended", function() {
                     setTimeout(startListening, 500);
                 });
                 function playAssistantAudio() {
-                    var audioElement = document.querySelector('#audio-output audio');
-                    if (audioElement) {
-                        audioElement.play();
                     }
                 }
                 document.addEventListener('gradioUpdated', function(event) {
                     setTimeout(playAssistantAudio, 100);
                 });

     return response, audio_path
 def create_demo():
+    with gr.Blocks() as demo:
         gr.Markdown(
             """
+            # 🗣️ AI Voice Assistant
+            Welcome to your personal voice assistant! Simply record your voice, and I will respond with both text and speech. The assistant will automatically start listening after playing its response. Powered by advanced AI models.
             """
         )
         with gr.Row():
             with gr.Column(scale=1):
+                audio_input = gr.Audio(type="filepath", label="🎤 Record your voice", elem_id="audio-input")
+                clear_button = gr.Button("Clear", variant="secondary", elem_id="clear-button")
+                voice_volume = gr.Slider(minimum=0, maximum=2, value=1, step=0.1, label="Voice Volume", elem_id="voice-volume")
             with gr.Column(scale=1):
+                chat_output = gr.Textbox(label="💬 AI Response", elem_id="chat-output", lines=5, interactive=False)
+                audio_output = gr.Audio(label="🔊 AI Voice Response", autoplay=True, elem_id="audio-output")
+        # Add some spacing and a divider
+        gr.Markdown("---")
         # Processing the audio input
+        def process_audio(audio, volume):
             logging.info(f"Received audio: {audio}")
             if audio is None:
+                return "No audio detected. Please try recording again.", None
+            response, audio_path = transcribe_and_chat(audio)
             # Adjust volume for the response audio
             adjusted_audio_path = asyncio.run(text_to_speech_stream(response, volume))
             logging.info(f"Response: {response}, Audio path: {adjusted_audio_path}")
+            return response, adjusted_audio_path
+        audio_input.change(process_audio, inputs=[audio_input, voice_volume], outputs=[chat_output, audio_output])
+        clear_button.click(lambda: (None, None), None, [chat_output, audio_output])
+        # JavaScript to handle autoplay, automatic submission, and auto-listen
         demo.load(None, js="""
             function() {
                 var recordButton;
                     }
                 }
+                document.querySelector("audio").addEventListener("ended", function() {
                     setTimeout(startListening, 500);
                 });
                 function playAssistantAudio() {
+                    var audioElements = document.querySelectorAll('audio');
+                    if (audioElements.length > 1) {
+                        var assistantAudio = audioElements[1];
+                        if (assistantAudio) {
+                            assistantAudio.play();
+                        }
                     }
                 }
+                document.addEventListener('gradioAudioLoaded', function(event) {
+                    playAssistantAudio();
+                });
                 document.addEventListener('gradioUpdated', function(event) {
                     setTimeout(playAssistantAudio, 100);
                 });