CosyVoice committed on
Commit
d52358f
1 Parent(s): 72b89a5

update readme

Browse files
Files changed (1) hide show
  1. README.md +9 -5
README.md CHANGED
@@ -22,12 +22,9 @@ For `SenseVoice`, visit [SenseVoice repo](https://github.com/FunAudioLLM/SenseVo
22
  - [ ] 25hz cosyvoice base model
23
  - [ ] 25hz cosyvoice voice conversion model
24
 
25
- - [ ] 2024/10
26
-
27
- - [ ] 50hz llama based llm model which supports lora finetune
28
-
29
  - [ ] TBD
30
 
 
31
  - [ ] Support more instruction mode
32
  - [ ] Voice conversion
33
  - [ ] Music generation
@@ -121,7 +118,7 @@ print(cosyvoice.list_avaliable_spks())
121
  for i, j in enumerate(cosyvoice.inference_sft('你好,我是通义生成式语音大模型,请问有什么可以帮您的吗?', '中文女', stream=False)):
122
  torchaudio.save('sft_{}.wav'.format(i), j['tts_speech'], 22050)
123
 
124
- cosyvoice = CosyVoice('pretrained_models/CosyVoice-300M')
125
  # zero_shot usage, <|zh|><|en|><|jp|><|yue|><|ko|> for Chinese/English/Japanese/Cantonese/Korean
126
  prompt_speech_16k = load_wav('zero_shot_prompt.wav', 16000)
127
  for i, j in enumerate(cosyvoice.inference_zero_shot('收到好友从远方寄来的生日礼物,那份意外的惊喜与深深的祝福让我心中充满了甜蜜的快乐,笑容如花儿般绽放。', '希望你以后能够做的比我还好呦。', prompt_speech_16k, stream=False)):
@@ -135,6 +132,13 @@ cosyvoice = CosyVoice('pretrained_models/CosyVoice-300M-Instruct')
135
  # instruct usage, support <laughter></laughter><strong></strong>[laughter][breath]
136
  for i, j in enumerate(cosyvoice.inference_instruct('在面对挑战时,他展现了非凡的<strong>勇气</strong>与<strong>智慧</strong>。', '中文男', 'Theo \'Crimson\', is a fiery, passionate rebel leader. Fights with fervor for justice, but struggles with impulsiveness.', stream=False)):
137
  torchaudio.save('instruct_{}.wav'.format(i), j['tts_speech'], 22050)
 
 
 
 
 
 
 
138
  ```
139
 
140
  **Start web demo**
 
22
  - [ ] 25hz cosyvoice base model
23
  - [ ] 25hz cosyvoice voice conversion model
24
 
 
 
 
 
25
  - [ ] TBD
26
 
27
+ - [ ] 25hz llama based llm model which supports lora finetune
28
  - [ ] Support more instruction mode
29
  - [ ] Voice conversion
30
  - [ ] Music generation
 
118
  for i, j in enumerate(cosyvoice.inference_sft('你好,我是通义生成式语音大模型,请问有什么可以帮您的吗?', '中文女', stream=False)):
119
  torchaudio.save('sft_{}.wav'.format(i), j['tts_speech'], 22050)
120
 
121
+ cosyvoice = CosyVoice('pretrained_models/CosyVoice-300M-25Hz')
122
  # zero_shot usage, <|zh|><|en|><|jp|><|yue|><|ko|> for Chinese/English/Japanese/Cantonese/Korean
123
  prompt_speech_16k = load_wav('zero_shot_prompt.wav', 16000)
124
  for i, j in enumerate(cosyvoice.inference_zero_shot('收到好友从远方寄来的生日礼物,那份意外的惊喜与深深的祝福让我心中充满了甜蜜的快乐,笑容如花儿般绽放。', '希望你以后能够做的比我还好呦。', prompt_speech_16k, stream=False)):
 
132
  # instruct usage, support <laughter></laughter><strong></strong>[laughter][breath]
133
  for i, j in enumerate(cosyvoice.inference_instruct('在面对挑战时,他展现了非凡的<strong>勇气</strong>与<strong>智慧</strong>。', '中文男', 'Theo \'Crimson\', is a fiery, passionate rebel leader. Fights with fervor for justice, but struggles with impulsiveness.', stream=False)):
134
  torchaudio.save('instruct_{}.wav'.format(i), j['tts_speech'], 22050)
135
+
136
+ cosyvoice = CosyVoice('pretrained_models/CosyVoice-VC')
137
+ # vc usage
138
+ prompt_speech_16k = load_wav('zero_shot_prompt.wav', 16000)
139
+ source_speech_16k = load_wav('cross_lingual_prompt.wav', 16000)
140
+ for i, j in enumerate(cosyvoice.inference_vc(source_speech_16k, prompt_speech_16k, stream=False)):
141
+ torchaudio.save('vc_{}.wav'.format(i), j['tts_speech'], 22050)
142
  ```
143
 
144
  **Start web demo**