Spaces:
Runtime error
Runtime error
add cell to generate audios
Browse files- notebooks/test-model.ipynb +35 -3
notebooks/test-model.ipynb
CHANGED
@@ -72,14 +72,23 @@
|
|
72 |
},
|
73 |
{
|
74 |
"cell_type": "code",
|
75 |
-
"execution_count":
|
76 |
-
"id": "
|
77 |
"metadata": {},
|
78 |
"outputs": [],
|
79 |
"source": [
|
80 |
"model_id = \"teticio/audio-diffusion-256\"\n",
|
81 |
"ddpm = DDPMPipeline.from_pretrained(model_id) # you can replace DDPMPipeline with DDIMPipeline or PNDMPipeline for faster inference\n",
|
82 |
-
"ddpm.to(\"cuda\")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
83 |
"images = ddpm(output_type=\"numpy\")[\"sample\"]\n",
|
84 |
"images = (images * 255).round().astype(\"uint8\").transpose(0, 3, 1, 2)"
|
85 |
]
|
@@ -145,6 +154,29 @@
|
|
145 |
"Audio(data=audio, rate=mel.get_sample_rate())"
|
146 |
]
|
147 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
148 |
{
|
149 |
"cell_type": "markdown",
|
150 |
"id": "ef54cef3",
|
|
|
72 |
},
|
73 |
{
|
74 |
"cell_type": "code",
|
75 |
+
"execution_count": null,
|
76 |
+
"id": "e0f6e8fd",
|
77 |
"metadata": {},
|
78 |
"outputs": [],
|
79 |
"source": [
|
80 |
"model_id = \"teticio/audio-diffusion-256\"\n",
|
81 |
"ddpm = DDPMPipeline.from_pretrained(model_id) # you can replace DDPMPipeline with DDIMPipeline or PNDMPipeline for faster inference\n",
|
82 |
+
"ddpm.to(\"cuda\")"
|
83 |
+
]
|
84 |
+
},
|
85 |
+
{
|
86 |
+
"cell_type": "code",
|
87 |
+
"execution_count": 7,
|
88 |
+
"id": "b809fed5",
|
89 |
+
"metadata": {},
|
90 |
+
"outputs": [],
|
91 |
+
"source": [
|
92 |
"images = ddpm(output_type=\"numpy\")[\"sample\"]\n",
|
93 |
"images = (images * 255).round().astype(\"uint8\").transpose(0, 3, 1, 2)"
|
94 |
]
|
|
|
154 |
"Audio(data=audio, rate=mel.get_sample_rate())"
|
155 |
]
|
156 |
},
|
157 |
+
{
|
158 |
+
"cell_type": "markdown",
|
159 |
+
"id": "ba4ccac5",
|
160 |
+
"metadata": {},
|
161 |
+
"source": [
|
162 |
+
"### Generate audios"
|
163 |
+
]
|
164 |
+
},
|
165 |
+
{
|
166 |
+
"cell_type": "code",
|
167 |
+
"execution_count": null,
|
168 |
+
"id": "300a6a8d",
|
169 |
+
"metadata": {},
|
170 |
+
"outputs": [],
|
171 |
+
"source": [
|
172 |
+
"while True:\n",
|
173 |
+
" images = ddpm(output_type=\"numpy\")[\"sample\"]\n",
|
174 |
+
" images = (images * 255).round().astype(\"uint8\").transpose(0, 3, 1, 2)\n",
|
175 |
+
" image = Image.fromarray(images[0][0])\n",
|
176 |
+
" audio = mel.image_to_audio(image)\n",
|
177 |
+
" display(Audio(data=audio, rate=mel.get_sample_rate()))"
|
178 |
+
]
|
179 |
+
},
|
180 |
{
|
181 |
"cell_type": "markdown",
|
182 |
"id": "ef54cef3",
|