Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -45,6 +45,8 @@ import onnxruntime
|
|
45 |
|
46 |
import glob
|
47 |
import ipywidgets as widgets
|
|
|
|
|
48 |
from IPython.display import display, Audio, Markdown, clear_output
|
49 |
from piper_phonemize import phonemize_codepoints, phonemize_espeak, tashkeel_run
|
50 |
|
@@ -133,6 +135,19 @@ async def main(
|
|
133 |
onnx_model = onnx_models
|
134 |
model, config = load_onnx(onnx_model, sess_options, providers)
|
135 |
print("nuber of speakers = ", config["num_speakers"])
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
136 |
if config["num_speakers"] > 1:
|
137 |
speaker_selection.options = config["speaker_id_map"].values()
|
138 |
speaker_selection.layout.visibility = 'visible'
|
@@ -190,19 +205,7 @@ async def main(
|
|
190 |
else:
|
191 |
sid = None
|
192 |
|
193 |
-
print("hello2")
|
194 |
-
rate = speed_slider.value
|
195 |
-
noise_scale = noise_scale_slider.value
|
196 |
-
noise_scale_w = noise_scale_w_slider.value
|
197 |
-
auto_play = play.value
|
198 |
-
audio = inferencing(model, config, sid, text_input.value, speed_slider.value, noise_scale_slider.value, noise_scale_w_slider, auto_play)
|
199 |
-
temp_audio_file = tempfile.NamedTemporaryFile(delete=False, suffix=".mp3")
|
200 |
-
audio.export(temp_audio_file.name, format="mp3")
|
201 |
|
202 |
-
# Rename the temporary audio file based on the text input
|
203 |
-
global renamed_audio_file
|
204 |
-
renamed_audio_file = os.path.join(tempfile.gettempdir(), f"{text_input}.mp3")
|
205 |
-
os.rename(temp_audio_file.name, renamed_audio_file)
|
206 |
|
207 |
# Save the audio as a temporary WAV file
|
208 |
return templates.TemplateResponse("interface.html", {"request": request, "audio_file": renamed_audio_file, "data": data})
|
|
|
45 |
|
46 |
import glob
|
47 |
import ipywidgets as widgets
|
48 |
+
from pydub import AudioSegment
|
49 |
+
import tempfile
|
50 |
from IPython.display import display, Audio, Markdown, clear_output
|
51 |
from piper_phonemize import phonemize_codepoints, phonemize_espeak, tashkeel_run
|
52 |
|
|
|
135 |
onnx_model = onnx_models
|
136 |
model, config = load_onnx(onnx_model, sess_options, providers)
|
137 |
print("nuber of speakers = ", config["num_speakers"])
|
138 |
+
print("hello2")
|
139 |
+
rate = speed_slider.value
|
140 |
+
noise_scale = noise_scale_slider.value
|
141 |
+
noise_scale_w = noise_scale_w_slider.value
|
142 |
+
auto_play = play.value
|
143 |
+
audio = inferencing(model, config, sid, text_input.value, speed_slider.value, noise_scale_slider.value, noise_scale_w_slider, auto_play)
|
144 |
+
temp_audio_file = tempfile.NamedTemporaryFile(delete=False, suffix=".mp3")
|
145 |
+
audio.export(temp_audio_file.name, format="mp3")
|
146 |
+
|
147 |
+
# Rename the temporary audio file based on the text input
|
148 |
+
global renamed_audio_file
|
149 |
+
renamed_audio_file = os.path.join(tempfile.gettempdir(), f"{text_input}.mp3")
|
150 |
+
os.rename(temp_audio_file.name, renamed_audio_file)
|
151 |
if config["num_speakers"] > 1:
|
152 |
speaker_selection.options = config["speaker_id_map"].values()
|
153 |
speaker_selection.layout.visibility = 'visible'
|
|
|
205 |
else:
|
206 |
sid = None
|
207 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
208 |
|
|
|
|
|
|
|
|
|
209 |
|
210 |
# Save the audio as a temporary WAV file
|
211 |
return templates.TemplateResponse("interface.html", {"request": request, "audio_file": renamed_audio_file, "data": data})
|