Spaces:
Running
on
Zero
Running
on
Zero
update readme
Browse files
README.md
CHANGED
@@ -22,12 +22,9 @@ For `SenseVoice`, visit [SenseVoice repo](https://github.com/FunAudioLLM/SenseVo
|
|
22 |
- [ ] 25hz cosyvoice base model
|
23 |
- [ ] 25hz cosyvoice voice conversion model
|
24 |
|
25 |
-
- [ ] 2024/10
|
26 |
-
|
27 |
-
- [ ] 50hz llama based llm model which supports lora finetune
|
28 |
-
|
29 |
- [ ] TBD
|
30 |
|
|
|
31 |
- [ ] Support more instruction mode
|
32 |
- [ ] Voice conversion
|
33 |
- [ ] Music generation
|
@@ -121,7 +118,7 @@ print(cosyvoice.list_avaliable_spks())
|
|
121 |
for i, j in enumerate(cosyvoice.inference_sft('你好,我是通义生成式语音大模型,请问有什么可以帮您的吗?', '中文女', stream=False)):
|
122 |
torchaudio.save('sft_{}.wav'.format(i), j['tts_speech'], 22050)
|
123 |
|
124 |
-
cosyvoice = CosyVoice('pretrained_models/CosyVoice-300M')
|
125 |
# zero_shot usage, <|zh|><|en|><|jp|><|yue|><|ko|> for Chinese/English/Japanese/Cantonese/Korean
|
126 |
prompt_speech_16k = load_wav('zero_shot_prompt.wav', 16000)
|
127 |
for i, j in enumerate(cosyvoice.inference_zero_shot('收到好友从远方寄来的生日礼物,那份意外的惊喜与深深的祝福让我心中充满了甜蜜的快乐,笑容如花儿般绽放。', '希望你以后能够做的比我还好呦。', prompt_speech_16k, stream=False)):
|
@@ -135,6 +132,13 @@ cosyvoice = CosyVoice('pretrained_models/CosyVoice-300M-Instruct')
|
|
135 |
# instruct usage, support <laughter></laughter><strong></strong>[laughter][breath]
|
136 |
for i, j in enumerate(cosyvoice.inference_instruct('在面对挑战时,他展现了非凡的<strong>勇气</strong>与<strong>智慧</strong>。', '中文男', 'Theo \'Crimson\', is a fiery, passionate rebel leader. Fights with fervor for justice, but struggles with impulsiveness.', stream=False)):
|
137 |
torchaudio.save('instruct_{}.wav'.format(i), j['tts_speech'], 22050)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
138 |
```
|
139 |
|
140 |
**Start web demo**
|
|
|
22 |
- [ ] 25hz cosyvoice base model
|
23 |
- [ ] 25hz cosyvoice voice conversion model
|
24 |
|
|
|
|
|
|
|
|
|
25 |
- [ ] TBD
|
26 |
|
27 |
+
- [ ] 25Hz LLaMA-based LLM model which supports LoRA fine-tuning
|
28 |
- [ ] Support more instruction mode
|
29 |
- [ ] Voice conversion
|
30 |
- [ ] Music generation
|
|
|
118 |
for i, j in enumerate(cosyvoice.inference_sft('你好,我是通义生成式语音大模型,请问有什么可以帮您的吗?', '中文女', stream=False)):
|
119 |
torchaudio.save('sft_{}.wav'.format(i), j['tts_speech'], 22050)
|
120 |
|
121 |
+
cosyvoice = CosyVoice('pretrained_models/CosyVoice-300M-25Hz')
|
122 |
# zero_shot usage, <|zh|><|en|><|jp|><|yue|><|ko|> for Chinese/English/Japanese/Cantonese/Korean
|
123 |
prompt_speech_16k = load_wav('zero_shot_prompt.wav', 16000)
|
124 |
for i, j in enumerate(cosyvoice.inference_zero_shot('收到好友从远方寄来的生日礼物,那份意外的惊喜与深深的祝福让我心中充满了甜蜜的快乐,笑容如花儿般绽放。', '希望你以后能够做的比我还好呦。', prompt_speech_16k, stream=False)):
|
|
|
132 |
# instruct usage, support <laughter></laughter><strong></strong>[laughter][breath]
|
133 |
for i, j in enumerate(cosyvoice.inference_instruct('在面对挑战时,他展现了非凡的<strong>勇气</strong>与<strong>智慧</strong>。', '中文男', 'Theo \'Crimson\', is a fiery, passionate rebel leader. Fights with fervor for justice, but struggles with impulsiveness.', stream=False)):
|
134 |
torchaudio.save('instruct_{}.wav'.format(i), j['tts_speech'], 22050)
|
135 |
+
|
136 |
+
cosyvoice = CosyVoice('pretrained_models/CosyVoice-VC')
|
137 |
+
# vc (voice conversion) usage
|
138 |
+
prompt_speech_16k = load_wav('zero_shot_prompt.wav', 16000)
|
139 |
+
source_speech_16k = load_wav('cross_lingual_prompt.wav', 16000)
|
140 |
+
for i, j in enumerate(cosyvoice.inference_vc(source_speech_16k, prompt_speech_16k, stream=False)):
|
141 |
+
torchaudio.save('vc_{}.wav'.format(i), j['tts_speech'], 22050)
|
142 |
```
|
143 |
|
144 |
**Start web demo**
|