pikto isaakkamau committed on
Commit
b691fad
·
0 Parent(s):

Duplicate from isaakkamau/Text-To-Speech

Browse files

Co-authored-by: isaak <[email protected]>

Files changed (6) hide show
  1. .gitattributes +31 -0
  2. .gitignore +1 -0
  3. README.md +13 -0
  4. app.py +94 -0
  5. requirements.txt +5 -0
  6. setup.cfg +12 -0
.gitattributes ADDED
@@ -0,0 +1,31 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ *.7z filter=lfs diff=lfs merge=lfs -text
2
+ *.arrow filter=lfs diff=lfs merge=lfs -text
3
+ *.bin filter=lfs diff=lfs merge=lfs -text
4
+ *.bz2 filter=lfs diff=lfs merge=lfs -text
5
+ *.ftz filter=lfs diff=lfs merge=lfs -text
6
+ *.gz filter=lfs diff=lfs merge=lfs -text
7
+ *.h5 filter=lfs diff=lfs merge=lfs -text
8
+ *.joblib filter=lfs diff=lfs merge=lfs -text
9
+ *.lfs.* filter=lfs diff=lfs merge=lfs -text
10
+ *.model filter=lfs diff=lfs merge=lfs -text
11
+ *.msgpack filter=lfs diff=lfs merge=lfs -text
12
+ *.npy filter=lfs diff=lfs merge=lfs -text
13
+ *.npz filter=lfs diff=lfs merge=lfs -text
14
+ *.onnx filter=lfs diff=lfs merge=lfs -text
15
+ *.ot filter=lfs diff=lfs merge=lfs -text
16
+ *.parquet filter=lfs diff=lfs merge=lfs -text
17
+ *.pickle filter=lfs diff=lfs merge=lfs -text
18
+ *.pkl filter=lfs diff=lfs merge=lfs -text
19
+ *.pb filter=lfs diff=lfs merge=lfs -text
20
+ *.pt filter=lfs diff=lfs merge=lfs -text
21
+ *.pth filter=lfs diff=lfs merge=lfs -text
22
+ *.rar filter=lfs diff=lfs merge=lfs -text
23
+ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
24
+ *.tar.* filter=lfs diff=lfs merge=lfs -text
25
+ *.tflite filter=lfs diff=lfs merge=lfs -text
26
+ *.tgz filter=lfs diff=lfs merge=lfs -text
27
+ *.wasm filter=lfs diff=lfs merge=lfs -text
28
+ *.xz filter=lfs diff=lfs merge=lfs -text
29
+ *.zip filter=lfs diff=lfs merge=lfs -text
30
+ *.zst filter=lfs diff=lfs merge=lfs -text
31
+ *tfevents* filter=lfs diff=lfs merge=lfs -text
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ .idea
README.md ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ title: Text-to-Speech
3
+ emoji: 💬
4
+ colorFrom: blue
5
+ colorTo: yellow
6
+ sdk: gradio
7
+ sdk_version: 3.4
8
+ app_file: app.py
9
+ pinned: false
10
+ duplicated_from: isaakkamau/Text-To-Speech
11
+ ---
12
+
13
+ Text-to-Speech interactive demo, using [balacoon_tts](https://balacoon.com).
app.py ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+
3
+ TTS interactive demo
4
+ """
5
+
6
+ import logging
7
+ from typing import cast
8
+
9
+ import gradio as gr
10
+ from balacoon_tts import TTS
11
+ from huggingface_hub import hf_hub_download, list_repo_files
12
+
13
+ # global tts module, initialized from a model selected
14
+ tts = None
15
+
16
+
17
def main():
    """
    Build the Gradio Blocks UI of the TTS demo and launch it.

    The page holds a text box, a model dropdown filled with the
    `*_cpu.addon` files listed in the `balacoon/tts` hub repo, a speaker
    dropdown that is filled once a model is loaded, and a "Generate"
    button that writes the synthesized waveform into an audio widget.
    """
    logging.basicConfig(level=logging.INFO)

    # hub repo hosting the models; used both to list and to download them
    repo_id = "balacoon/tts"
    # longer utterances are cut to this many characters before synthesis
    max_text_len = 1024

    with gr.Blocks() as demo:
        gr.Markdown(
            """
            <h1 align="center">Text-to-Speech</h1>

            1. Write an utterance to generate,
            2. Select the model to synthesize with
            3. Select the speaker
            4. Hit "Generate" and listen to the result!

            When you select a Model for the first time,
            it will take a little time to download it.
            """
        )
        with gr.Row(variant="panel"):
            text = gr.Textbox(label="Text", placeholder="Insert your article here...")

        with gr.Row():
            with gr.Column(variant="panel"):
                repo_files = list_repo_files(repo_id=repo_id)
                model_files = [x for x in repo_files if x.endswith("_cpu.addon")]
                model_name = gr.Dropdown(
                    label="Model",
                    choices=model_files,
                )
            with gr.Column(variant="panel"):
                speaker = gr.Dropdown(label="Speaker", choices=[])

        def set_model(model_name_str: str):
            """
            gets value from `model_name`, downloads the model,
            re-initializes the global tts object, gets list of
            speakers that model supports and sets them to `speaker`.
            The last speaker in the list is pre-selected; when the model
            reports no speakers, the dropdown is left without a value.
            """
            global tts
            if not model_name_str:
                # nothing selected (e.g. dropdown cleared): there is no file
                # to download, so just empty the speaker list
                return gr.Dropdown.update(choices=[], value=None, visible=True)
            model_path = hf_hub_download(repo_id=repo_id, filename=model_name_str)
            tts = TTS(model_path)
            speakers = tts.get_speakers()
            # guard the index: `speakers[-1]` raises IndexError on an empty list
            value = speakers[-1] if len(speakers) > 0 else None
            return gr.Dropdown.update(choices=speakers, value=value, visible=True)

        model_name.change(set_model, inputs=model_name, outputs=speaker)

        with gr.Row(variant="panel"):
            generate = gr.Button("Generate")
        with gr.Row(variant="panel"):
            audio = gr.Audio()

        def synthesize_audio(text_str: str, speaker_str: str = ""):
            """
            gets utterance to synthesize from `text` Textbox
            and speaker name from `speaker` dropdown list.
            speaker name might be empty for single-speaker models.
            Synthesizes the waveform and updates `audio` with it.
            Returns None (no audio update) when the text is empty or
            no model has been loaded yet.
            """
            if not text_str:
                logging.info("text is not provided")
                return None
            if tts is None:
                # "Generate" was hit before any model was selected
                logging.info("model is not selected")
                return None
            # `tts` is declared as None at module level; cast for type checkers
            engine = cast(TTS, tts)
            # slicing is a no-op for texts that are already short enough
            text_str = text_str[:max_text_len]
            # an unset dropdown may hand over None; fall back to the
            # empty speaker name that is the declared default
            samples = engine.synthesize(text_str, speaker_str or "")
            return gr.Audio.update(value=(engine.get_sampling_rate(), samples))

        generate.click(synthesize_audio, inputs=[text, speaker], outputs=audio)

    demo.launch()
91
+
92
+
93
+ if __name__ == "__main__":
94
+ main()
requirements.txt ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ --index-url https://pypi.fury.io/balacoon/
2
+ --extra-index-url https://pypi.org/simple/
3
+ balacoon-tts==0.1.1
4
+ huggingface_hub
5
+ numpy
setup.cfg ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [flake8]
2
+ max_complexity=10
3
+ per-file-ignores=__init__.py:F401,F403
4
+ ignore = E203,W503
5
+ max-line-length=119
6
+
7
+ [isort]
8
+ profile=black
9
+ line_length=119
10
+
11
+ [mypy]
12
+ ignore_missing_imports = True