Spaces:
Runtime error
Runtime error
Upload app.py
Browse files
app.py
CHANGED
@@ -18,7 +18,7 @@ sid_map = {
|
|
18 |
}
|
19 |
def vc_fn(sid, input_audio, vc_transform):
|
20 |
if input_audio is None:
|
21 |
-
return "
|
22 |
sampling_rate, audio = input_audio
|
23 |
# print(audio.shape,sampling_rate)
|
24 |
duration = audio.shape[0] / sampling_rate
|
@@ -34,14 +34,14 @@ def vc_fn(sid, input_audio, vc_transform):
|
|
34 |
sid = sid_map[sid]
|
35 |
out_audio, out_sr = svc_model.infer(sid, vc_transform, out_wav_path)
|
36 |
_audio = out_audio.cpu().numpy()
|
37 |
-
return "
|
38 |
|
39 |
app = gr.Blocks()
|
40 |
with app:
|
41 |
with gr.Tabs():
|
42 |
-
with gr.TabItem("
|
43 |
gr.Markdown(value="""
|
44 |
-
|
45 |
|
46 |
#### 目前模型训练状态:700000steps / 640epochs
|
47 |
|
@@ -52,6 +52,14 @@ with app:
|
|
52 |
#### 更建议参考仓库[README.md上的推理部分](https://github.com/innnky/so-vits-svc#%E6%8E%A8%E7%90%86),在本地使用 inference_main.py 处理
|
53 |
|
54 |
#### 3060Ti 8G可推理一条20(建议) - 30s的音频,过长音频可分割后批量处理
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
55 |
""")
|
56 |
sid = gr.Dropdown(label="音色", choices=["岁己(本音)"], value="岁己(本音)")
|
57 |
vc_input3 = gr.Audio(label="输入音频(长度请控制在25s左右,过长可能会爆内存)")
|
|
|
18 |
}
|
19 |
def vc_fn(sid, input_audio, vc_transform):
|
20 |
if input_audio is None:
|
21 |
+
return "请选择或拖入一段音频", None
|
22 |
sampling_rate, audio = input_audio
|
23 |
# print(audio.shape,sampling_rate)
|
24 |
duration = audio.shape[0] / sampling_rate
|
|
|
34 |
sid = sid_map[sid]
|
35 |
out_audio, out_sr = svc_model.infer(sid, vc_transform, out_wav_path)
|
36 |
_audio = out_audio.cpu().numpy()
|
37 |
+
return "成功", (48000, _audio)
|
38 |
|
39 |
app = gr.Blocks()
|
40 |
with app:
|
41 |
with gr.Tabs():
|
42 |
+
with gr.TabItem("岁己SUI"):
|
43 |
gr.Markdown(value="""
|
44 |
+
## 这是 sovits 3.0 48kHz AI岁己(本音)“歌声(划重点)”音色转换的在线demo
|
45 |
|
46 |
#### 目前模型训练状态:700000steps / 640epochs
|
47 |
|
|
|
52 |
#### 更建议参考仓库[README.md上的推理部分](https://github.com/innnky/so-vits-svc#%E6%8E%A8%E7%90%86),在本地使用 inference_main.py 处理
|
53 |
|
54 |
#### 3060Ti 8G可推理一条20(建议) - 30s的音频,过长音频可分割后批量处理
|
55 |
+
|
56 |
+
### 一点点注意事项:
|
57 |
+
|
58 |
+
#### 输入的音频一定要是纯净的干音,不要把歌曲直接扔进来
|
59 |
+
|
60 |
+
#### 对陈述语气没多大作用,你可以自己唱然后升十几个调慢慢试效果
|
61 |
+
|
62 |
+
#### 因为训练集来自于录播,所以音色偏本音,前期变调用于匹配音域,后期可以升一个调匹配一下岁己的歌音
|
63 |
""")
|
64 |
sid = gr.Dropdown(label="音色", choices=["岁己(本音)"], value="岁己(本音)")
|
65 |
vc_input3 = gr.Audio(label="输入音频(长度请控制在25s左右,过长可能会爆内存)")
|