Spaces:
Running
Running
Commit
·
f2f284e
1
Parent(s):
7316731
feat: add speed control
Browse files
app.py
CHANGED
@@ -68,6 +68,7 @@ def text_to_speech(
|
|
68 |
speaker_wav,
|
69 |
speaker: str,
|
70 |
dialect,
|
|
|
71 |
text: str,
|
72 |
):
|
73 |
if len(text) == 0:
|
@@ -80,6 +81,7 @@ def text_to_speech(
|
|
80 |
parsed_ipa = parse_ipa(ipa)
|
81 |
if dialect == "nansixian":
|
82 |
dialect = "sixian"
|
|
|
83 |
if use_default_emb_or_custom == "預設語者":
|
84 |
wav = _do_tts(
|
85 |
model_id,
|
@@ -220,6 +222,8 @@ with demo:
|
|
220 |
value="",
|
221 |
)
|
222 |
|
|
|
|
|
223 |
gr.Markdown(
|
224 |
"""
|
225 |
# 臺灣客語語音合成系統
|
@@ -239,6 +243,7 @@ with demo:
|
|
239 |
speaker_wav,
|
240 |
speaker_drop_down,
|
241 |
dialect_radio,
|
|
|
242 |
input_text,
|
243 |
],
|
244 |
outputs=[
|
|
|
68 |
speaker_wav,
|
69 |
speaker: str,
|
70 |
dialect,
|
71 |
+
speed: float,
|
72 |
text: str,
|
73 |
):
|
74 |
if len(text) == 0:
|
|
|
81 |
parsed_ipa = parse_ipa(ipa)
|
82 |
if dialect == "nansixian":
|
83 |
dialect = "sixian"
|
84 |
+
models_config[model_id]["model"].tts_model.length_scale = speed
|
85 |
if use_default_emb_or_custom == "預設語者":
|
86 |
wav = _do_tts(
|
87 |
model_id,
|
|
|
222 |
value="",
|
223 |
)
|
224 |
|
225 |
+
speed = gr.Slider(maximum=1.5, minimum=0.5, value=1, label="語速")
|
226 |
+
|
227 |
gr.Markdown(
|
228 |
"""
|
229 |
# 臺灣客語語音合成系統
|
|
|
243 |
speaker_wav,
|
244 |
speaker_drop_down,
|
245 |
dialect_radio,
|
246 |
+
speed,
|
247 |
input_text,
|
248 |
],
|
249 |
outputs=[
|