Update app.py
app.py CHANGED
@@ -8,41 +8,32 @@ from gtts import gTTS
 import io
 from groq import Groq
 
-# Initialize the Groq client
 client = Groq(api_key=os.environ.get("GROQ_API_KEY"))
 
-
-model = whisper.load_model("base")  # You can choose other models like "small", "medium", "large"
+model = whisper.load_model("base")
 
 def process_audio(file_path):
     try:
-        # Load the audio file
         audio = whisper.load_audio(file_path)
 
-        # Transcribe the audio using Whisper
         result = model.transcribe(audio)
         text = result["text"]
 
-        # Generate a response using Groq
         chat_completion = client.chat.completions.create(
             messages=[{"role": "user", "content": text}],
-            model="llama3-8b-8192",
+            model="llama3-8b-8192",
         )
 
-        # Access the response using dot notation
         response_message = chat_completion.choices[0].message.content.strip()
 
-        # Convert the response text to speech
         tts = gTTS(response_message)
         response_audio_io = io.BytesIO()
         tts.write_to_fp(response_audio_io)  # Save the audio to the BytesIO object
         response_audio_io.seek(0)
 
-        # Save audio to a file to ensure it's generated correctly
         with open("response.mp3", "wb") as audio_file:
             audio_file.write(response_audio_io.getvalue())
 
-        # Return the response text and the path to the saved audio file
         return response_message, "response.mp3"
 
     except Exception as e:
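For context, a minimal usage sketch of the unchanged process_audio flow (transcribe with Whisper, reply via Groq, speak with gTTS). This is not part of the commit; "sample.wav" is a hypothetical input file, and GROQ_API_KEY must be set in the environment for the Groq client to initialize.

# Hypothetical driver, assuming process_audio is defined as in the diff above.
if __name__ == "__main__":
    # Transcribes sample.wav, asks the llama3-8b-8192 model for a reply,
    # and writes the spoken reply to response.mp3.
    reply_text, reply_audio_path = process_audio("sample.wav")
    print("Assistant reply:", reply_text)
    print("Spoken reply saved to:", reply_audio_path)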