Spaces:

aiegoo
/

whisper-chatbot-ko

Runtime error

App Files Files Community

aiegoo commited on Jun 15, 2023

Commit

2264c63

1 Parent(s): 048c1a1

add app.py

Browse files

Files changed (1) hide show

app.py +129 -0

app.py ADDED Viewed

	@@ -0,0 +1,129 @@

+import gradio as gr
+import base64
+import requests
+import secrets
+import os
+from io import BytesIO
+from pydub import AudioSegment
+def create_chat_session():
+    r = requests.post("http://121.176.153.117:5000/create")
+    if (r.status_code != 201):
+        raise Exception("Failed to create chat session")
+    # create temp audio folder
+    session_id = r.json()["id"]
+    os.makedirs(f"./temp_audio/{session_id}")
+    return session_id
+session_id = create_chat_session()
+chat_history = []
+def add_text(history, text):
+    history = history + [(text, None)]
+    return history, gr.update(value="", interactive=False)
+def add_audio(history, audio):
+    audio_bytes = base64.b64decode(audio['data'].split(',')[-1].encode('utf-8'))
+    audio_file = BytesIO(audio_bytes)
+    AudioSegment.from_file(audio_file).export(audio_file, format="mp3")
+    # save audio file temporary to disk
+    audio_id = secrets.token_hex(8)
+    AudioSegment.from_file(audio_file).export(f"temp_audio/{session_id}/audio_input_{audio_id}.mp3", format="mp3")
+    history = history + [((f"temp_audio/{session_id}/audio_input_{audio_id}.mp3",), None)]
+    response = requests.post(
+        "http://121.176.153.117:5000/transcribe",
+        files={'audio': audio_file.getvalue()}
+    )
+    if (response.status_code != 200):
+        raise Exception(response.text)
+    text = response.json()['text']
+    history = history + [(text, None)]
+    return history, gr.update(value="", interactive=False)
+def bot(history):
+    if type(history[-1][0]) == str:
+        message = history[-1][0]
+    else:
+        message = history[-2][0]
+    response = requests.post(
+        f"http://121.176.153.117:5000/send/text/{session_id}",
+        headers={'Content-type': 'application/json'},
+        json={
+            'message': message,
+            'role': 'user'
+        }
+    )
+    if (response.status_code != 200):
+        raise Exception(f"Failed to send message, {response.text}")
+    response = response.json()
+    text, audio = response['text'], response['audio']
+    audio_bytes = base64.b64decode(audio.encode('utf-8'))
+    audio_file = BytesIO(audio_bytes)
+    audio_id = secrets.token_hex(8)
+    AudioSegment.from_file(audio_file).export(f"temp_audio/{session_id}/audio_input_{audio_id}.mp3", format="mp3")
+    history = history + [(None, (f"temp_audio/{session_id}/audio_input_{audio_id}.mp3",))]
+    history = history + [(None, text)]
+    global chat_history
+    chat_history = history.copy()
+    return history
+def load_chat_history(history):
+    global chat_history
+    if len(chat_history) > len(history):
+        history = chat_history
+    return history
+with gr.Blocks() as demo:
+    chatbot = gr.Chatbot([], elem_id="chatbot").style(height=750)
+    demo.load(load_chat_history, [chatbot], [chatbot], queue=False)
+    with gr.Row():
+        with gr.Column(scale=0.85):
+            txt = gr.Textbox(
+                show_label=False,
+                placeholder="Enter text and press enter, or record audio",
+            ).style(container=False)
+        with gr.Column(scale=0.15, min_width=0):
+            audio = gr.Audio(
+                source="microphone", type="numpy", show_label=False, format="mp3"
+            ).style(container=False)
+    txt_msg = txt.submit(add_text, [chatbot, txt], [chatbot, txt], queue=False).then(
+        bot, chatbot, chatbot
+    )
+    txt_msg.then(lambda: gr.update(interactive=True), None, [txt], queue=False)
+    audio_msg = audio.change(add_audio, [chatbot, audio], [chatbot, audio], queue=False, preprocess=False, postprocess=False).then(
+        bot, chatbot, chatbot
+    )
+    audio_msg.then(lambda: gr.update(interactive=True, value=None), None, [audio], queue=False)
+demo.launch(show_error=True, server_name='172.30.1.18', share=True)