# Hugging Face Space: adnaan05/VoiceToVoice_ChatBot (status: Running)
# File size: 1,703 Bytes

import os

# SECURITY: GROQ_API_KEY must be supplied through the process environment
# (for example as a secret configured on the hosting platform). Credentials
# must never be hard-coded in source; any key that was ever committed to this
# file should be treated as compromised and revoked.

import os
import gradio as gr
import whisper
from gtts import gTTS
import io
from groq import Groq

# Groq chat client; the API key is read from the GROQ_API_KEY environment
# variable.
client = Groq(api_key=os.getenv("GROQ_API_KEY"))

# Whisper speech-to-text model ("base" checkpoint), loaded once at module
# import.
model = whisper.load_model("base")

def process_audio(file_path):
    """Transcribe a spoken prompt, get a chat reply, and synthesize it as speech.

    Args:
        file_path: Path to the input audio file, or ``None``/empty when no
            audio has been provided.

    Returns:
        A ``(text, audio_path)`` tuple. On success ``text`` is the chatbot
        reply and ``audio_path`` is the path of an MP3 file containing the
        spoken reply. When there is nothing to process, or any step fails,
        ``text`` is a user-facing message and ``audio_path`` is ``None``.
    """
    import tempfile  # local import keeps this block self-contained

    # Nothing to do without input; answer directly instead of surfacing a
    # low-level error from the audio loader.
    if not file_path:
        return "No audio input received. Please record or upload an audio file.", None

    try:
        audio = whisper.load_audio(file_path)
        result = model.transcribe(audio)
        text = result["text"].strip()

        # An empty prompt gives the chat model nothing to answer.
        if not text:
            return "No speech was detected in the audio. Please try again.", None

        chat_completion = client.chat.completions.create(
            messages=[{"role": "user", "content": text}],
            model="llama3-8b-8192",
        )
        response_message = chat_completion.choices[0].message.content.strip()

        tts = gTTS(response_message)
        # Use a unique file per request so concurrent requests cannot overwrite
        # each other's audio. delete=False because the file has to outlive
        # this function: the caller receives its path.
        with tempfile.NamedTemporaryFile(suffix=".mp3", delete=False) as audio_file:
            tts.write_to_fp(audio_file)

        return response_message, audio_file.name

    except Exception as e:
        # UI boundary: report the failure as text rather than raising.
        return f"An error occurred: {e}", None

# Text shown on the page around the interface.
title = " Voice-to-Voice Chatbot Application"
description = "Developed by [Adnan Tariq](https://www.linkedin.com/in/adnaantariq/) with ❤️"
article = (
    "### Instructions\n"
    "1. Upload an audio file.\n"
    "2. Wait for the transcription.\n"
    "3. Listen to the chatbot's response."
)


# Gradio UI: one audio input (passed to process_audio as a file path) and two
# outputs matching the (text, audio path) pair that process_audio returns.
# NOTE(review): newer Gradio releases may not recognize "dark" as a built-in
# theme name — confirm against the Gradio version this app is deployed with.
iface = gr.Interface(
    title=title,
    description=description,
    article=article,
    theme="dark",
    fn=process_audio,
    inputs=gr.Audio(type="filepath"),
    outputs=[
        gr.Textbox(label="Response Text"),
        gr.Audio(label="Response Audio"),
    ],
    live=True,
)

# Start the web server for the interface.
iface.launch()