End of training
Browse files- README.md +6 -0
- checkpoint-1000/controlnet/config.json +19 -13
- checkpoint-1000/controlnet/diffusion_pytorch_model.safetensors +2 -2
- checkpoint-1000/optimizer.bin +2 -2
- checkpoint-1000/random_states_0.pkl +1 -1
- checkpoint-2000/controlnet/config.json +19 -13
- checkpoint-2000/controlnet/diffusion_pytorch_model.safetensors +2 -2
- checkpoint-2000/optimizer.bin +2 -2
- checkpoint-2000/random_states_0.pkl +2 -2
- checkpoint-3000/controlnet/config.json +19 -13
- checkpoint-3000/controlnet/diffusion_pytorch_model.safetensors +2 -2
- checkpoint-3000/optimizer.bin +2 -2
- checkpoint-3000/random_states_0.pkl +1 -1
- checkpoint-4000/controlnet/config.json +19 -13
- checkpoint-4000/controlnet/diffusion_pytorch_model.safetensors +2 -2
- checkpoint-4000/optimizer.bin +2 -2
- checkpoint-4000/random_states_0.pkl +2 -2
- checkpoint-5000/controlnet/config.json +19 -13
- checkpoint-5000/controlnet/diffusion_pytorch_model.safetensors +2 -2
- checkpoint-5000/optimizer.bin +2 -2
- checkpoint-5000/random_states_0.pkl +1 -1
- config.json +19 -13
- diffusion_pytorch_model.safetensors +2 -2
README.md
CHANGED
@@ -9,6 +9,12 @@ tags:
|
|
9 |
- diffusers
|
10 |
- controlnet
|
11 |
- diffusers-training
|
|
|
|
|
|
|
|
|
|
|
|
|
12 |
inference: true
|
13 |
---
|
14 |
|
|
|
9 |
- diffusers
|
10 |
- controlnet
|
11 |
- diffusers-training
|
12 |
+
- stable-diffusion-xl
|
13 |
+
- stable-diffusion-xl-diffusers
|
14 |
+
- text-to-image
|
15 |
+
- diffusers
|
16 |
+
- controlnet
|
17 |
+
- diffusers-training
|
18 |
inference: true
|
19 |
---
|
20 |
|
checkpoint-1000/controlnet/config.json
CHANGED
@@ -1,15 +1,18 @@
|
|
1 |
{
|
2 |
"_class_name": "ControlNetModel",
|
3 |
-
"_diffusers_version": "0.
|
4 |
"act_fn": "silu",
|
5 |
-
"addition_embed_type":
|
6 |
"addition_embed_type_num_heads": 64,
|
7 |
-
"addition_time_embed_dim":
|
8 |
-
"attention_head_dim":
|
|
|
|
|
|
|
|
|
9 |
"block_out_channels": [
|
10 |
320,
|
11 |
640,
|
12 |
-
1280,
|
13 |
1280
|
14 |
],
|
15 |
"class_embed_type": null,
|
@@ -21,12 +24,11 @@
|
|
21 |
256
|
22 |
],
|
23 |
"controlnet_conditioning_channel_order": "rgb",
|
24 |
-
"cross_attention_dim":
|
25 |
"down_block_types": [
|
|
|
26 |
"CrossAttnDownBlock2D",
|
27 |
-
"CrossAttnDownBlock2D"
|
28 |
-
"CrossAttnDownBlock2D",
|
29 |
-
"DownBlock2D"
|
30 |
],
|
31 |
"downsample_padding": 1,
|
32 |
"encoder_hid_dim": null,
|
@@ -43,9 +45,13 @@
|
|
43 |
"num_attention_heads": null,
|
44 |
"num_class_embeds": null,
|
45 |
"only_cross_attention": false,
|
46 |
-
"projection_class_embeddings_input_dim":
|
47 |
"resnet_time_scale_shift": "default",
|
48 |
-
"transformer_layers_per_block":
|
49 |
-
|
50 |
-
|
|
|
|
|
|
|
|
|
51 |
}
|
|
|
1 |
{
|
2 |
"_class_name": "ControlNetModel",
|
3 |
+
"_diffusers_version": "0.35.0.dev0",
|
4 |
"act_fn": "silu",
|
5 |
+
"addition_embed_type": "text_time",
|
6 |
"addition_embed_type_num_heads": 64,
|
7 |
+
"addition_time_embed_dim": 256,
|
8 |
+
"attention_head_dim": [
|
9 |
+
5,
|
10 |
+
10,
|
11 |
+
20
|
12 |
+
],
|
13 |
"block_out_channels": [
|
14 |
320,
|
15 |
640,
|
|
|
16 |
1280
|
17 |
],
|
18 |
"class_embed_type": null,
|
|
|
24 |
256
|
25 |
],
|
26 |
"controlnet_conditioning_channel_order": "rgb",
|
27 |
+
"cross_attention_dim": 2048,
|
28 |
"down_block_types": [
|
29 |
+
"DownBlock2D",
|
30 |
"CrossAttnDownBlock2D",
|
31 |
+
"CrossAttnDownBlock2D"
|
|
|
|
|
32 |
],
|
33 |
"downsample_padding": 1,
|
34 |
"encoder_hid_dim": null,
|
|
|
45 |
"num_attention_heads": null,
|
46 |
"num_class_embeds": null,
|
47 |
"only_cross_attention": false,
|
48 |
+
"projection_class_embeddings_input_dim": 2816,
|
49 |
"resnet_time_scale_shift": "default",
|
50 |
+
"transformer_layers_per_block": [
|
51 |
+
1,
|
52 |
+
2,
|
53 |
+
10
|
54 |
+
],
|
55 |
+
"upcast_attention": null,
|
56 |
+
"use_linear_projection": true
|
57 |
}
|
checkpoint-1000/controlnet/diffusion_pytorch_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0734204635cfe55040059aa58cea0c732ab50620b61ca44ca8ac5597b371206c
|
3 |
+
size 5004167864
|
checkpoint-1000/optimizer.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d08d48073aef84329905df4bf609f2dfa9d07ac9360b24ada2b3037d496f6b02
|
3 |
+
size 2510393614
|
checkpoint-1000/random_states_0.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14408
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:196e4fcfd0dc67028502faaa92729774ca4a68325575f7b3553a6484afb49ac3
|
3 |
size 14408
|
checkpoint-2000/controlnet/config.json
CHANGED
@@ -1,15 +1,18 @@
|
|
1 |
{
|
2 |
"_class_name": "ControlNetModel",
|
3 |
-
"_diffusers_version": "0.
|
4 |
"act_fn": "silu",
|
5 |
-
"addition_embed_type":
|
6 |
"addition_embed_type_num_heads": 64,
|
7 |
-
"addition_time_embed_dim":
|
8 |
-
"attention_head_dim":
|
|
|
|
|
|
|
|
|
9 |
"block_out_channels": [
|
10 |
320,
|
11 |
640,
|
12 |
-
1280,
|
13 |
1280
|
14 |
],
|
15 |
"class_embed_type": null,
|
@@ -21,12 +24,11 @@
|
|
21 |
256
|
22 |
],
|
23 |
"controlnet_conditioning_channel_order": "rgb",
|
24 |
-
"cross_attention_dim":
|
25 |
"down_block_types": [
|
|
|
26 |
"CrossAttnDownBlock2D",
|
27 |
-
"CrossAttnDownBlock2D"
|
28 |
-
"CrossAttnDownBlock2D",
|
29 |
-
"DownBlock2D"
|
30 |
],
|
31 |
"downsample_padding": 1,
|
32 |
"encoder_hid_dim": null,
|
@@ -43,9 +45,13 @@
|
|
43 |
"num_attention_heads": null,
|
44 |
"num_class_embeds": null,
|
45 |
"only_cross_attention": false,
|
46 |
-
"projection_class_embeddings_input_dim":
|
47 |
"resnet_time_scale_shift": "default",
|
48 |
-
"transformer_layers_per_block":
|
49 |
-
|
50 |
-
|
|
|
|
|
|
|
|
|
51 |
}
|
|
|
1 |
{
|
2 |
"_class_name": "ControlNetModel",
|
3 |
+
"_diffusers_version": "0.35.0.dev0",
|
4 |
"act_fn": "silu",
|
5 |
+
"addition_embed_type": "text_time",
|
6 |
"addition_embed_type_num_heads": 64,
|
7 |
+
"addition_time_embed_dim": 256,
|
8 |
+
"attention_head_dim": [
|
9 |
+
5,
|
10 |
+
10,
|
11 |
+
20
|
12 |
+
],
|
13 |
"block_out_channels": [
|
14 |
320,
|
15 |
640,
|
|
|
16 |
1280
|
17 |
],
|
18 |
"class_embed_type": null,
|
|
|
24 |
256
|
25 |
],
|
26 |
"controlnet_conditioning_channel_order": "rgb",
|
27 |
+
"cross_attention_dim": 2048,
|
28 |
"down_block_types": [
|
29 |
+
"DownBlock2D",
|
30 |
"CrossAttnDownBlock2D",
|
31 |
+
"CrossAttnDownBlock2D"
|
|
|
|
|
32 |
],
|
33 |
"downsample_padding": 1,
|
34 |
"encoder_hid_dim": null,
|
|
|
45 |
"num_attention_heads": null,
|
46 |
"num_class_embeds": null,
|
47 |
"only_cross_attention": false,
|
48 |
+
"projection_class_embeddings_input_dim": 2816,
|
49 |
"resnet_time_scale_shift": "default",
|
50 |
+
"transformer_layers_per_block": [
|
51 |
+
1,
|
52 |
+
2,
|
53 |
+
10
|
54 |
+
],
|
55 |
+
"upcast_attention": null,
|
56 |
+
"use_linear_projection": true
|
57 |
}
|
checkpoint-2000/controlnet/diffusion_pytorch_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:022c2c7e62360ea64552fe0a7e9075bf27c95e849b3eef271b67188fb7027f00
|
3 |
+
size 5004167864
|
checkpoint-2000/optimizer.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:915d2aaccf8beff3d8274ebc0529c858e40ab86373e5ec24ee60e0cdd75044ba
|
3 |
+
size 2510393614
|
checkpoint-2000/random_states_0.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b74b7db71964a1040fda20a42d565a3dd95b465980105cae6faf3860b55158b8
|
3 |
+
size 14408
|
checkpoint-3000/controlnet/config.json
CHANGED
@@ -1,15 +1,18 @@
|
|
1 |
{
|
2 |
"_class_name": "ControlNetModel",
|
3 |
-
"_diffusers_version": "0.
|
4 |
"act_fn": "silu",
|
5 |
-
"addition_embed_type":
|
6 |
"addition_embed_type_num_heads": 64,
|
7 |
-
"addition_time_embed_dim":
|
8 |
-
"attention_head_dim":
|
|
|
|
|
|
|
|
|
9 |
"block_out_channels": [
|
10 |
320,
|
11 |
640,
|
12 |
-
1280,
|
13 |
1280
|
14 |
],
|
15 |
"class_embed_type": null,
|
@@ -21,12 +24,11 @@
|
|
21 |
256
|
22 |
],
|
23 |
"controlnet_conditioning_channel_order": "rgb",
|
24 |
-
"cross_attention_dim":
|
25 |
"down_block_types": [
|
|
|
26 |
"CrossAttnDownBlock2D",
|
27 |
-
"CrossAttnDownBlock2D"
|
28 |
-
"CrossAttnDownBlock2D",
|
29 |
-
"DownBlock2D"
|
30 |
],
|
31 |
"downsample_padding": 1,
|
32 |
"encoder_hid_dim": null,
|
@@ -43,9 +45,13 @@
|
|
43 |
"num_attention_heads": null,
|
44 |
"num_class_embeds": null,
|
45 |
"only_cross_attention": false,
|
46 |
-
"projection_class_embeddings_input_dim":
|
47 |
"resnet_time_scale_shift": "default",
|
48 |
-
"transformer_layers_per_block":
|
49 |
-
|
50 |
-
|
|
|
|
|
|
|
|
|
51 |
}
|
|
|
1 |
{
|
2 |
"_class_name": "ControlNetModel",
|
3 |
+
"_diffusers_version": "0.35.0.dev0",
|
4 |
"act_fn": "silu",
|
5 |
+
"addition_embed_type": "text_time",
|
6 |
"addition_embed_type_num_heads": 64,
|
7 |
+
"addition_time_embed_dim": 256,
|
8 |
+
"attention_head_dim": [
|
9 |
+
5,
|
10 |
+
10,
|
11 |
+
20
|
12 |
+
],
|
13 |
"block_out_channels": [
|
14 |
320,
|
15 |
640,
|
|
|
16 |
1280
|
17 |
],
|
18 |
"class_embed_type": null,
|
|
|
24 |
256
|
25 |
],
|
26 |
"controlnet_conditioning_channel_order": "rgb",
|
27 |
+
"cross_attention_dim": 2048,
|
28 |
"down_block_types": [
|
29 |
+
"DownBlock2D",
|
30 |
"CrossAttnDownBlock2D",
|
31 |
+
"CrossAttnDownBlock2D"
|
|
|
|
|
32 |
],
|
33 |
"downsample_padding": 1,
|
34 |
"encoder_hid_dim": null,
|
|
|
45 |
"num_attention_heads": null,
|
46 |
"num_class_embeds": null,
|
47 |
"only_cross_attention": false,
|
48 |
+
"projection_class_embeddings_input_dim": 2816,
|
49 |
"resnet_time_scale_shift": "default",
|
50 |
+
"transformer_layers_per_block": [
|
51 |
+
1,
|
52 |
+
2,
|
53 |
+
10
|
54 |
+
],
|
55 |
+
"upcast_attention": null,
|
56 |
+
"use_linear_projection": true
|
57 |
}
|
checkpoint-3000/controlnet/diffusion_pytorch_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c01d53f8299ada75eea82872941c4b0d936788a2598d3f9e09b5a6b0f9586e22
|
3 |
+
size 5004167864
|
checkpoint-3000/optimizer.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5227e59e6e9688b1619cef0381488200a24052c39b9334cd95c87d73fbca884e
|
3 |
+
size 2510393614
|
checkpoint-3000/random_states_0.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14408
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30db01d6364583d05e85e8326c408d47d042b5b3f1c56142e1735750a03017a0
|
3 |
size 14408
|
checkpoint-4000/controlnet/config.json
CHANGED
@@ -1,15 +1,18 @@
|
|
1 |
{
|
2 |
"_class_name": "ControlNetModel",
|
3 |
-
"_diffusers_version": "0.
|
4 |
"act_fn": "silu",
|
5 |
-
"addition_embed_type":
|
6 |
"addition_embed_type_num_heads": 64,
|
7 |
-
"addition_time_embed_dim":
|
8 |
-
"attention_head_dim":
|
|
|
|
|
|
|
|
|
9 |
"block_out_channels": [
|
10 |
320,
|
11 |
640,
|
12 |
-
1280,
|
13 |
1280
|
14 |
],
|
15 |
"class_embed_type": null,
|
@@ -21,12 +24,11 @@
|
|
21 |
256
|
22 |
],
|
23 |
"controlnet_conditioning_channel_order": "rgb",
|
24 |
-
"cross_attention_dim":
|
25 |
"down_block_types": [
|
|
|
26 |
"CrossAttnDownBlock2D",
|
27 |
-
"CrossAttnDownBlock2D"
|
28 |
-
"CrossAttnDownBlock2D",
|
29 |
-
"DownBlock2D"
|
30 |
],
|
31 |
"downsample_padding": 1,
|
32 |
"encoder_hid_dim": null,
|
@@ -43,9 +45,13 @@
|
|
43 |
"num_attention_heads": null,
|
44 |
"num_class_embeds": null,
|
45 |
"only_cross_attention": false,
|
46 |
-
"projection_class_embeddings_input_dim":
|
47 |
"resnet_time_scale_shift": "default",
|
48 |
-
"transformer_layers_per_block":
|
49 |
-
|
50 |
-
|
|
|
|
|
|
|
|
|
51 |
}
|
|
|
1 |
{
|
2 |
"_class_name": "ControlNetModel",
|
3 |
+
"_diffusers_version": "0.35.0.dev0",
|
4 |
"act_fn": "silu",
|
5 |
+
"addition_embed_type": "text_time",
|
6 |
"addition_embed_type_num_heads": 64,
|
7 |
+
"addition_time_embed_dim": 256,
|
8 |
+
"attention_head_dim": [
|
9 |
+
5,
|
10 |
+
10,
|
11 |
+
20
|
12 |
+
],
|
13 |
"block_out_channels": [
|
14 |
320,
|
15 |
640,
|
|
|
16 |
1280
|
17 |
],
|
18 |
"class_embed_type": null,
|
|
|
24 |
256
|
25 |
],
|
26 |
"controlnet_conditioning_channel_order": "rgb",
|
27 |
+
"cross_attention_dim": 2048,
|
28 |
"down_block_types": [
|
29 |
+
"DownBlock2D",
|
30 |
"CrossAttnDownBlock2D",
|
31 |
+
"CrossAttnDownBlock2D"
|
|
|
|
|
32 |
],
|
33 |
"downsample_padding": 1,
|
34 |
"encoder_hid_dim": null,
|
|
|
45 |
"num_attention_heads": null,
|
46 |
"num_class_embeds": null,
|
47 |
"only_cross_attention": false,
|
48 |
+
"projection_class_embeddings_input_dim": 2816,
|
49 |
"resnet_time_scale_shift": "default",
|
50 |
+
"transformer_layers_per_block": [
|
51 |
+
1,
|
52 |
+
2,
|
53 |
+
10
|
54 |
+
],
|
55 |
+
"upcast_attention": null,
|
56 |
+
"use_linear_projection": true
|
57 |
}
|
checkpoint-4000/controlnet/diffusion_pytorch_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c61efd37ff8816d8de1db8cd76cf3a92b0b8542f8b81368cdbcac10b26ddca3c
|
3 |
+
size 5004167864
|
checkpoint-4000/optimizer.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11f1019905254b71867d7b7160f0bb0bd8bc80daa971ec709c7c7d4e047e9372
|
3 |
+
size 2510393614
|
checkpoint-4000/random_states_0.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d31cd70c2ba15a4cf4655b2bd65670965992b23da3e91e09a7257c900537bcfd
|
3 |
+
size 14408
|
checkpoint-5000/controlnet/config.json
CHANGED
@@ -1,15 +1,18 @@
|
|
1 |
{
|
2 |
"_class_name": "ControlNetModel",
|
3 |
-
"_diffusers_version": "0.
|
4 |
"act_fn": "silu",
|
5 |
-
"addition_embed_type":
|
6 |
"addition_embed_type_num_heads": 64,
|
7 |
-
"addition_time_embed_dim":
|
8 |
-
"attention_head_dim":
|
|
|
|
|
|
|
|
|
9 |
"block_out_channels": [
|
10 |
320,
|
11 |
640,
|
12 |
-
1280,
|
13 |
1280
|
14 |
],
|
15 |
"class_embed_type": null,
|
@@ -21,12 +24,11 @@
|
|
21 |
256
|
22 |
],
|
23 |
"controlnet_conditioning_channel_order": "rgb",
|
24 |
-
"cross_attention_dim":
|
25 |
"down_block_types": [
|
|
|
26 |
"CrossAttnDownBlock2D",
|
27 |
-
"CrossAttnDownBlock2D"
|
28 |
-
"CrossAttnDownBlock2D",
|
29 |
-
"DownBlock2D"
|
30 |
],
|
31 |
"downsample_padding": 1,
|
32 |
"encoder_hid_dim": null,
|
@@ -43,9 +45,13 @@
|
|
43 |
"num_attention_heads": null,
|
44 |
"num_class_embeds": null,
|
45 |
"only_cross_attention": false,
|
46 |
-
"projection_class_embeddings_input_dim":
|
47 |
"resnet_time_scale_shift": "default",
|
48 |
-
"transformer_layers_per_block":
|
49 |
-
|
50 |
-
|
|
|
|
|
|
|
|
|
51 |
}
|
|
|
1 |
{
|
2 |
"_class_name": "ControlNetModel",
|
3 |
+
"_diffusers_version": "0.35.0.dev0",
|
4 |
"act_fn": "silu",
|
5 |
+
"addition_embed_type": "text_time",
|
6 |
"addition_embed_type_num_heads": 64,
|
7 |
+
"addition_time_embed_dim": 256,
|
8 |
+
"attention_head_dim": [
|
9 |
+
5,
|
10 |
+
10,
|
11 |
+
20
|
12 |
+
],
|
13 |
"block_out_channels": [
|
14 |
320,
|
15 |
640,
|
|
|
16 |
1280
|
17 |
],
|
18 |
"class_embed_type": null,
|
|
|
24 |
256
|
25 |
],
|
26 |
"controlnet_conditioning_channel_order": "rgb",
|
27 |
+
"cross_attention_dim": 2048,
|
28 |
"down_block_types": [
|
29 |
+
"DownBlock2D",
|
30 |
"CrossAttnDownBlock2D",
|
31 |
+
"CrossAttnDownBlock2D"
|
|
|
|
|
32 |
],
|
33 |
"downsample_padding": 1,
|
34 |
"encoder_hid_dim": null,
|
|
|
45 |
"num_attention_heads": null,
|
46 |
"num_class_embeds": null,
|
47 |
"only_cross_attention": false,
|
48 |
+
"projection_class_embeddings_input_dim": 2816,
|
49 |
"resnet_time_scale_shift": "default",
|
50 |
+
"transformer_layers_per_block": [
|
51 |
+
1,
|
52 |
+
2,
|
53 |
+
10
|
54 |
+
],
|
55 |
+
"upcast_attention": null,
|
56 |
+
"use_linear_projection": true
|
57 |
}
|
checkpoint-5000/controlnet/diffusion_pytorch_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0124f2e083b565fd6f304bf709528f7b4d4ad94d71734384bc9b073d2ff266d0
|
3 |
+
size 5004167864
|
checkpoint-5000/optimizer.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed1591a442222e0390b55fd07ddcac5c93be31c180649d36921031845303aa1c
|
3 |
+
size 2510393614
|
checkpoint-5000/random_states_0.pkl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14408
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d9880959925c08f7cff7f53206eda7aedf0ee3cacfdee243598699a2f876dd0
|
3 |
size 14408
|
config.json
CHANGED
@@ -1,15 +1,18 @@
|
|
1 |
{
|
2 |
"_class_name": "ControlNetModel",
|
3 |
-
"_diffusers_version": "0.
|
4 |
"act_fn": "silu",
|
5 |
-
"addition_embed_type":
|
6 |
"addition_embed_type_num_heads": 64,
|
7 |
-
"addition_time_embed_dim":
|
8 |
-
"attention_head_dim":
|
|
|
|
|
|
|
|
|
9 |
"block_out_channels": [
|
10 |
320,
|
11 |
640,
|
12 |
-
1280,
|
13 |
1280
|
14 |
],
|
15 |
"class_embed_type": null,
|
@@ -21,12 +24,11 @@
|
|
21 |
256
|
22 |
],
|
23 |
"controlnet_conditioning_channel_order": "rgb",
|
24 |
-
"cross_attention_dim":
|
25 |
"down_block_types": [
|
|
|
26 |
"CrossAttnDownBlock2D",
|
27 |
-
"CrossAttnDownBlock2D"
|
28 |
-
"CrossAttnDownBlock2D",
|
29 |
-
"DownBlock2D"
|
30 |
],
|
31 |
"downsample_padding": 1,
|
32 |
"encoder_hid_dim": null,
|
@@ -43,9 +45,13 @@
|
|
43 |
"num_attention_heads": null,
|
44 |
"num_class_embeds": null,
|
45 |
"only_cross_attention": false,
|
46 |
-
"projection_class_embeddings_input_dim":
|
47 |
"resnet_time_scale_shift": "default",
|
48 |
-
"transformer_layers_per_block":
|
49 |
-
|
50 |
-
|
|
|
|
|
|
|
|
|
51 |
}
|
|
|
1 |
{
|
2 |
"_class_name": "ControlNetModel",
|
3 |
+
"_diffusers_version": "0.35.0.dev0",
|
4 |
"act_fn": "silu",
|
5 |
+
"addition_embed_type": "text_time",
|
6 |
"addition_embed_type_num_heads": 64,
|
7 |
+
"addition_time_embed_dim": 256,
|
8 |
+
"attention_head_dim": [
|
9 |
+
5,
|
10 |
+
10,
|
11 |
+
20
|
12 |
+
],
|
13 |
"block_out_channels": [
|
14 |
320,
|
15 |
640,
|
|
|
16 |
1280
|
17 |
],
|
18 |
"class_embed_type": null,
|
|
|
24 |
256
|
25 |
],
|
26 |
"controlnet_conditioning_channel_order": "rgb",
|
27 |
+
"cross_attention_dim": 2048,
|
28 |
"down_block_types": [
|
29 |
+
"DownBlock2D",
|
30 |
"CrossAttnDownBlock2D",
|
31 |
+
"CrossAttnDownBlock2D"
|
|
|
|
|
32 |
],
|
33 |
"downsample_padding": 1,
|
34 |
"encoder_hid_dim": null,
|
|
|
45 |
"num_attention_heads": null,
|
46 |
"num_class_embeds": null,
|
47 |
"only_cross_attention": false,
|
48 |
+
"projection_class_embeddings_input_dim": 2816,
|
49 |
"resnet_time_scale_shift": "default",
|
50 |
+
"transformer_layers_per_block": [
|
51 |
+
1,
|
52 |
+
2,
|
53 |
+
10
|
54 |
+
],
|
55 |
+
"upcast_attention": null,
|
56 |
+
"use_linear_projection": true
|
57 |
}
|
diffusion_pytorch_model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0124f2e083b565fd6f304bf709528f7b4d4ad94d71734384bc9b073d2ff266d0
|
3 |
+
size 5004167864
|