Sreekumar1608 committed on
Commit
979e0e9
·
1 Parent(s): 9fe3975

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +11 -11
app.py CHANGED
@@ -1,17 +1,18 @@
1
  import gradio as gr
2
  import openai
 
3
  from elevenlabslib import *
4
  from pydub import AudioSegment
5
- from elevenlabs import play
6
  import io
7
- #import winsound
8
 
9
- openai.api_key = "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"
10
- api_key = "929b67c6e533e94018a438d70c960b60"
11
  from elevenlabslib import ElevenLabsUser
12
  user = ElevenLabsUser(api_key)
13
 
14
- messages = ["Respond with voice"]
15
 
16
  def transcribe(audio):
17
  global messages
@@ -33,24 +34,23 @@ def transcribe(audio):
33
  system_message = response["choices"][0]["text"]
34
  messages.append(f"{system_message}")
35
 
36
- voice = user.get_voices_by_name("Bella")[0]
37
  audio = voice.generate_audio_bytes(system_message)
38
 
39
  audio = AudioSegment.from_file(io.BytesIO(audio), format="mp3")
40
  audio.export("output.wav", format="wav")
41
 
42
- #winsound.PlaySound("output.wav", winsound.SND_FILENAME)
43
- audio = generate(text = system_message, voice = voice)
44
- play(audio)
45
 
46
  chat_transcript = "\n".join(messages)
47
  return chat_transcript
48
 
49
  iface = gr.Interface(
50
  fn=transcribe,
51
- inputs=gr.Audio(source="microphone", type="filepath"),
52
  outputs="text",
53
- title="Voice Assistant",
 
54
  )
55
 
56
  iface.launch()
 
1
  import gradio as gr
2
  import openai
3
+ import winsound
4
  from elevenlabslib import *
5
  from pydub import AudioSegment
6
+ from pydub.playback import play
7
  import io
8
+ import config
9
 
10
+ openai.api_key = config.OPENAI_API_KEY
11
+ api_key = config.ELEVENLABS_API_KEY
12
  from elevenlabslib import ElevenLabsUser
13
  user = ElevenLabsUser(api_key)
14
 
15
+ messages = ["Respond in less than 60 words"]
16
 
17
  def transcribe(audio):
18
  global messages
 
34
  system_message = response["choices"][0]["text"]
35
  messages.append(f"{system_message}")
36
 
37
+ voice = user.get_voices_by_name("Antoni")[0]
38
  audio = voice.generate_audio_bytes(system_message)
39
 
40
  audio = AudioSegment.from_file(io.BytesIO(audio), format="mp3")
41
  audio.export("output.wav", format="wav")
42
 
43
+ winsound.PlaySound("output.wav", winsound.SND_FILENAME)
 
 
44
 
45
  chat_transcript = "\n".join(messages)
46
  return chat_transcript
47
 
48
  iface = gr.Interface(
49
  fn=transcribe,
50
+ inputs=gr.Audio(source="microphone", type="filepath", placeholder="Please start speaking..."),
51
  outputs="text",
52
+ title="Voice Assistant ",
53
+ description="Please ask me your question",
54
  )
55
 
56
  iface.launch()