Spaces:
Running
on
Zero
Running
on
Zero
no message
Browse files- README.md +2 -4
- deploy.sh +9 -7
- requirements_.txt → requirements.txt +0 -0
- webui.py +22 -16
README.md
CHANGED
@@ -1,11 +1,9 @@
|
|
1 |
---
|
2 |
-
license: apache-2.0
|
3 |
title: CosyVoice
|
4 |
sdk: gradio
|
5 |
emoji: 🏃
|
6 |
colorFrom: yellow
|
7 |
colorTo: green
|
8 |
-
python_version: 3.8.
|
9 |
-
|
10 |
-
app_file: deploy.py
|
11 |
---
|
|
|
1 |
---
|
|
|
2 |
title: CosyVoice
|
3 |
sdk: gradio
|
4 |
emoji: 🏃
|
5 |
colorFrom: yellow
|
6 |
colorTo: green
|
7 |
+
python_version: 3.8.9
|
8 |
+
app_file: webui.py
|
|
|
9 |
---
|
deploy.sh
CHANGED
@@ -3,23 +3,23 @@ wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh
|
|
3 |
sh Miniconda3-latest-Linux-x86_64.sh -b
|
4 |
source ~/miniconda3/bin/activate
|
5 |
|
6 |
-
conda create -n cosyvoice python=3.8
|
7 |
-
conda activate cosyvoice
|
8 |
-
conda install -y -c conda-forge pynini==2.1.5
|
9 |
# pynini is required by WeTextProcessing; use conda to install it, as that works on all platforms.
|
10 |
pip install -r requirements_.txt
|
11 |
|
12 |
# If you encounter sox compatibility issues
|
13 |
# ubuntu
|
14 |
apt-get -y update
|
15 |
-
apt-get install sox libsox-dev
|
16 |
|
17 |
mkdir -p pretrained_models
|
18 |
-
git clone https://www.modelscope.cn/iic/CosyVoice-300M.git pretrained_models/CosyVoice-300M
|
19 |
#git clone https://www.modelscope.cn/iic/CosyVoice-300M-25Hz.git pretrained_models/CosyVoice-300M-25Hz
|
20 |
#git clone https://www.modelscope.cn/iic/CosyVoice-300M-SFT.git pretrained_models/CosyVoice-300M-SFT
|
21 |
#git clone https://www.modelscope.cn/iic/CosyVoice-300M-Instruct.git pretrained_models/CosyVoice-300M-Instruct
|
22 |
-
git clone https://www.modelscope.cn/iic/CosyVoice-ttsfrd.git pretrained_models/CosyVoice-ttsfrd
|
23 |
#huggingface-cli download model-scope/CosyVoice-300M --local-dir pretrained_models/CosyVoice-300M --token=$hf_token
|
24 |
#huggingface-cli download model-scope/CosyVoice-300M-SFT --local-dir pretrained_models/CosyVoice-300M-SFT --token=$hf_token
|
25 |
#huggingface-cli download FunAudioLLM/CosyVoice-ttsfrd --local-dir pretrained_models/CosyVoice-ttsfrd --token=$hf_token
|
@@ -30,4 +30,6 @@ cd pretrained_models/CosyVoice-ttsfrd/
|
|
30 |
unzip resource.zip -d .
|
31 |
pip install ttsfrd-0.3.6-cp38-cp38-linux_x86_64.whl
|
32 |
|
33 |
-
export PYTHONPATH=third_party/Matcha-TTS
|
|
|
|
|
|
3 |
sh Miniconda3-latest-Linux-x86_64.sh -b
|
4 |
source ~/miniconda3/bin/activate
|
5 |
|
6 |
+
#conda create -n cosyvoice python=3.8
|
7 |
+
#conda activate cosyvoice
|
8 |
+
#conda install -y -c conda-forge pynini==2.1.5
|
9 |
# pynini is required by WeTextProcessing; use conda to install it, as that works on all platforms.
|
10 |
pip install -r requirements_.txt
|
11 |
|
12 |
# If you encounter sox compatibility issues
|
13 |
# ubuntu
|
14 |
apt-get -y update
|
15 |
+
apt-get -y install sox libsox-dev
|
16 |
|
17 |
mkdir -p pretrained_models
|
18 |
+
#git clone https://www.modelscope.cn/iic/CosyVoice-300M.git pretrained_models/CosyVoice-300M
|
19 |
#git clone https://www.modelscope.cn/iic/CosyVoice-300M-25Hz.git pretrained_models/CosyVoice-300M-25Hz
|
20 |
#git clone https://www.modelscope.cn/iic/CosyVoice-300M-SFT.git pretrained_models/CosyVoice-300M-SFT
|
21 |
#git clone https://www.modelscope.cn/iic/CosyVoice-300M-Instruct.git pretrained_models/CosyVoice-300M-Instruct
|
22 |
+
#git clone https://www.modelscope.cn/iic/CosyVoice-ttsfrd.git pretrained_models/CosyVoice-ttsfrd
|
23 |
#huggingface-cli download model-scope/CosyVoice-300M --local-dir pretrained_models/CosyVoice-300M --token=$hf_token
|
24 |
#huggingface-cli download model-scope/CosyVoice-300M-SFT --local-dir pretrained_models/CosyVoice-300M-SFT --token=$hf_token
|
25 |
#huggingface-cli download FunAudioLLM/CosyVoice-ttsfrd --local-dir pretrained_models/CosyVoice-ttsfrd --token=$hf_token
|
|
|
30 |
unzip resource.zip -d .
|
31 |
pip install ttsfrd-0.3.6-cp38-cp38-linux_x86_64.whl
|
32 |
|
33 |
+
export PYTHONPATH=third_party/Matcha-TTS
|
34 |
+
|
35 |
+
python3 webui.py
|
requirements_.txt → requirements.txt
RENAMED
File without changes
|
webui.py
CHANGED
@@ -132,7 +132,7 @@ def generate_audio(tts_text, mode_checkbox_group, sft_dropdown, prompt_text, pro
|
|
132 |
yield (target_sr, i['tts_speech'].numpy().flatten())
|
133 |
|
134 |
|
135 |
-
def main(
|
136 |
with gr.Blocks() as demo:
|
137 |
gr.Markdown("### 代码库 [CosyVoice](https://github.com/FunAudioLLM/CosyVoice) \
|
138 |
预训练模型 [CosyVoice-300M](https://www.modelscope.cn/models/iic/CosyVoice-300M) \
|
@@ -171,18 +171,24 @@ def main(args,sft_spk):
|
|
171 |
demo.launch(server_name='0.0.0.0', server_port=args.port)
|
172 |
|
173 |
|
174 |
-
|
175 |
-
|
176 |
-
|
177 |
-
|
178 |
-
|
179 |
-
|
180 |
-
|
181 |
-
|
182 |
-
|
183 |
-
|
184 |
-
|
185 |
-
|
186 |
-
|
187 |
-
|
188 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
132 |
yield (target_sr, i['tts_speech'].numpy().flatten())
|
133 |
|
134 |
|
135 |
+
def main():
|
136 |
with gr.Blocks() as demo:
|
137 |
gr.Markdown("### 代码库 [CosyVoice](https://github.com/FunAudioLLM/CosyVoice) \
|
138 |
预训练模型 [CosyVoice-300M](https://www.modelscope.cn/models/iic/CosyVoice-300M) \
|
|
|
171 |
demo.launch(server_name='0.0.0.0', server_port=args.port)
|
172 |
|
173 |
|
174 |
+
|
175 |
+
# SDK模型下载
|
176 |
+
from modelscope import snapshot_download
|
177 |
+
snapshot_download('iic/CosyVoice-300M', local_dir='pretrained_models/CosyVoice-300M')
|
178 |
+
|
179 |
+
os.system('apt-get -y update && apt-get -y install sox libsox-dev')
|
180 |
+
|
181 |
+
parser = argparse.ArgumentParser()
|
182 |
+
parser.add_argument('--port',
|
183 |
+
type=int,
|
184 |
+
default=8000)
|
185 |
+
parser.add_argument('--model_dir',
|
186 |
+
type=str,
|
187 |
+
default='pretrained_models/CosyVoice-300M',
|
188 |
+
help='local path or modelscope repo id')
|
189 |
+
args = parser.parse_args()
|
190 |
+
cosyvoice = CosyVoice(args.model_dir)
|
191 |
+
sft_spk = cosyvoice.list_avaliable_spks()
|
192 |
+
prompt_sr, target_sr = 16000, 22050
|
193 |
+
default_data = np.zeros(target_sr)
|
194 |
+
main()
|