End of training
Browse files- README.md +39 -0
- checkpoint-3000/optimizer.bin +3 -0
- checkpoint-3000/random_states_0.pkl +3 -0
- checkpoint-3000/scaler.pt +3 -0
- checkpoint-3000/scheduler.bin +3 -0
- checkpoint-4000/controlnet/config.json +56 -0
- checkpoint-4000/controlnet/diffusion_pytorch_model.bin +3 -0
- checkpoint-4000/optimizer.bin +3 -0
- checkpoint-4000/random_states_0.pkl +3 -0
- checkpoint-4000/scaler.pt +3 -0
- checkpoint-4000/scheduler.bin +3 -0
- checkpoint-5000/controlnet/config.json +56 -0
- checkpoint-5000/controlnet/diffusion_pytorch_model.bin +3 -0
- checkpoint-5000/optimizer.bin +3 -0
- checkpoint-5000/random_states_0.pkl +3 -0
- checkpoint-5000/scaler.pt +3 -0
- checkpoint-5000/scheduler.bin +3 -0
- config.json +56 -0
- diffusion_pytorch_model.bin +3 -0
- image_control.png +0 -0
- images_0.png +0 -0
- images_1.png +0 -0
- images_2.png +0 -0
- images_3.png +0 -0
- images_4.png +0 -0
- images_5.png +0 -0
- images_6.png +0 -0
- images_7.png +0 -0
README.md
ADDED
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
---
|
3 |
+
license: creativeml-openrail-m
|
4 |
+
base_model: stabilityai/stable-diffusion-xl-base-1.0
|
5 |
+
tags:
|
6 |
+
- stable-diffusion-xl
|
7 |
+
- stable-diffusion-xl-diffusers
|
8 |
+
- text-to-image
|
9 |
+
- diffusers
|
10 |
+
- controlnet
|
11 |
+
inference: true
|
12 |
+
---
|
13 |
+
|
14 |
+
# controlnet-SargeZT/controlnet-sd-xl-1.0-depth-16bit-zoe
|
15 |
+
|
16 |
+
These are ControlNet weights trained on stabilityai/stable-diffusion-xl-base-1.0 with a new type of conditioning.
|
17 |
+
You can find some example images below.
|
18 |
+
prompt: a black and white cat laying on top of a keyboard
|
19 |
+
![images_0](./images_0.png)
|
20 |
+
prompt: a wooden bench sitting in the middle of a forest
|
21 |
+
![images_1](./images_1.png)
|
22 |
+
prompt: a ripe banana sitting on top of a wooden table
|
23 |
+
![images_2](./images_2.png)
|
24 |
+
prompt: a large jetliner sitting on top of an airport tarmac
|
25 |
+
![images_3](./images_3.png)
|
26 |
+
prompt: two girls are playing soccer on a field
|
27 |
+
![images_4](./images_4.png)
|
28 |
+
prompt: a laptop computer sitting on top of a desk
|
29 |
+
![images_5](./images_5.png)
|
30 |
+
prompt: a man riding skis on top of a body of water
|
31 |
+
![images_6](./images_6.png)
|
32 |
+
prompt: a small plane is flying through the air
|
33 |
+
![images_7](./images_7.png)
|
34 |
+
|
35 |
+
|
36 |
+
|
37 |
+
## License
|
38 |
+
|
39 |
+
[SDXL 1.0 License](https://huggingface.co/stabilityai/stable-diffusion-xl-base-1.0/blob/main/LICENSE.md)
|
checkpoint-3000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ad657580563cd47a6d01fad4dbbbd94718abfc2147c2401659726e0fe215e91
|
3 |
+
size 20017245213
|
checkpoint-3000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b10a64b8ec4ab1ee81407f331b71f59e737c3472e62148fa3f3491eda1460d58
|
3 |
+
size 14727
|
checkpoint-3000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fb1f9398b77268202e8e1465734a63d123b1ef11c27f20f2473677e9883a6869
|
3 |
+
size 557
|
checkpoint-3000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aa5239ab2381305ae3898ff682944f2f2d00b994d0812b456736063d20ca7a10
|
3 |
+
size 563
|
checkpoint-4000/controlnet/config.json
ADDED
@@ -0,0 +1,56 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "ControlNetModel",
|
3 |
+
"_diffusers_version": "0.19.3",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": "text_time",
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"addition_time_embed_dim": 256,
|
8 |
+
"attention_head_dim": [
|
9 |
+
5,
|
10 |
+
10,
|
11 |
+
20
|
12 |
+
],
|
13 |
+
"block_out_channels": [
|
14 |
+
320,
|
15 |
+
640,
|
16 |
+
1280
|
17 |
+
],
|
18 |
+
"class_embed_type": null,
|
19 |
+
"conditioning_channels": 3,
|
20 |
+
"conditioning_embedding_out_channels": [
|
21 |
+
16,
|
22 |
+
32,
|
23 |
+
96,
|
24 |
+
256
|
25 |
+
],
|
26 |
+
"controlnet_conditioning_channel_order": "rgb",
|
27 |
+
"cross_attention_dim": 2048,
|
28 |
+
"down_block_types": [
|
29 |
+
"DownBlock2D",
|
30 |
+
"CrossAttnDownBlock2D",
|
31 |
+
"CrossAttnDownBlock2D"
|
32 |
+
],
|
33 |
+
"downsample_padding": 1,
|
34 |
+
"encoder_hid_dim": null,
|
35 |
+
"encoder_hid_dim_type": null,
|
36 |
+
"flip_sin_to_cos": true,
|
37 |
+
"freq_shift": 0,
|
38 |
+
"global_pool_conditions": false,
|
39 |
+
"in_channels": 4,
|
40 |
+
"layers_per_block": 2,
|
41 |
+
"mid_block_scale_factor": 1,
|
42 |
+
"norm_eps": 1e-05,
|
43 |
+
"norm_num_groups": 32,
|
44 |
+
"num_attention_heads": null,
|
45 |
+
"num_class_embeds": null,
|
46 |
+
"only_cross_attention": false,
|
47 |
+
"projection_class_embeddings_input_dim": 2816,
|
48 |
+
"resnet_time_scale_shift": "default",
|
49 |
+
"transformer_layers_per_block": [
|
50 |
+
1,
|
51 |
+
2,
|
52 |
+
10
|
53 |
+
],
|
54 |
+
"upcast_attention": null,
|
55 |
+
"use_linear_projection": true
|
56 |
+
}
|
checkpoint-4000/controlnet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2594d899512bd4c7f815cdb406489aa361027d3c36951a3d6ac31ed1b6e54c96
|
3 |
+
size 5004438321
|
checkpoint-4000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af91808b8221f30880be6ed96f5dba336ec210d224bb255f6c70d3f5124963f5
|
3 |
+
size 20017245213
|
checkpoint-4000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d927d8aa94b6725fc2a7b48150b6b54a375bb9cd96f83ab1b5298628de9ed43
|
3 |
+
size 14727
|
checkpoint-4000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09a61ecdaa4a69ba865e0b9e19169660549c34c60a83537ab5ece413678520ab
|
3 |
+
size 557
|
checkpoint-4000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:105d6580de739d529fa465e32f1833e2248ffd7e0f899527364081ef0bdb1475
|
3 |
+
size 563
|
checkpoint-5000/controlnet/config.json
ADDED
@@ -0,0 +1,56 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "ControlNetModel",
|
3 |
+
"_diffusers_version": "0.19.3",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": "text_time",
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"addition_time_embed_dim": 256,
|
8 |
+
"attention_head_dim": [
|
9 |
+
5,
|
10 |
+
10,
|
11 |
+
20
|
12 |
+
],
|
13 |
+
"block_out_channels": [
|
14 |
+
320,
|
15 |
+
640,
|
16 |
+
1280
|
17 |
+
],
|
18 |
+
"class_embed_type": null,
|
19 |
+
"conditioning_channels": 3,
|
20 |
+
"conditioning_embedding_out_channels": [
|
21 |
+
16,
|
22 |
+
32,
|
23 |
+
96,
|
24 |
+
256
|
25 |
+
],
|
26 |
+
"controlnet_conditioning_channel_order": "rgb",
|
27 |
+
"cross_attention_dim": 2048,
|
28 |
+
"down_block_types": [
|
29 |
+
"DownBlock2D",
|
30 |
+
"CrossAttnDownBlock2D",
|
31 |
+
"CrossAttnDownBlock2D"
|
32 |
+
],
|
33 |
+
"downsample_padding": 1,
|
34 |
+
"encoder_hid_dim": null,
|
35 |
+
"encoder_hid_dim_type": null,
|
36 |
+
"flip_sin_to_cos": true,
|
37 |
+
"freq_shift": 0,
|
38 |
+
"global_pool_conditions": false,
|
39 |
+
"in_channels": 4,
|
40 |
+
"layers_per_block": 2,
|
41 |
+
"mid_block_scale_factor": 1,
|
42 |
+
"norm_eps": 1e-05,
|
43 |
+
"norm_num_groups": 32,
|
44 |
+
"num_attention_heads": null,
|
45 |
+
"num_class_embeds": null,
|
46 |
+
"only_cross_attention": false,
|
47 |
+
"projection_class_embeddings_input_dim": 2816,
|
48 |
+
"resnet_time_scale_shift": "default",
|
49 |
+
"transformer_layers_per_block": [
|
50 |
+
1,
|
51 |
+
2,
|
52 |
+
10
|
53 |
+
],
|
54 |
+
"upcast_attention": null,
|
55 |
+
"use_linear_projection": true
|
56 |
+
}
|
checkpoint-5000/controlnet/diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05b5555c93a67a621d021a8fbd5ca1e1b2078d1c20a45f2d786cb59ece16da74
|
3 |
+
size 5004438321
|
checkpoint-5000/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26854861fa554476886918017e6ce2d50ec50b0fe928a9cd6cfb1e4e7d33dee5
|
3 |
+
size 20017245213
|
checkpoint-5000/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c09f3525a2133cee4c46a75b89306446311c2b3db230b63acabcbe77696baf7c
|
3 |
+
size 14727
|
checkpoint-5000/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a41313b6733b65c1acca917a7c2ced06503c11b898e6cd5de1e6a9f13bfb54ef
|
3 |
+
size 557
|
checkpoint-5000/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a36607a976be36244ad46bcfa4be6fb5bea011d713149f3a57643bfc07960ced
|
3 |
+
size 563
|
config.json
ADDED
@@ -0,0 +1,56 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "ControlNetModel",
|
3 |
+
"_diffusers_version": "0.19.3",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"addition_embed_type": "text_time",
|
6 |
+
"addition_embed_type_num_heads": 64,
|
7 |
+
"addition_time_embed_dim": 256,
|
8 |
+
"attention_head_dim": [
|
9 |
+
5,
|
10 |
+
10,
|
11 |
+
20
|
12 |
+
],
|
13 |
+
"block_out_channels": [
|
14 |
+
320,
|
15 |
+
640,
|
16 |
+
1280
|
17 |
+
],
|
18 |
+
"class_embed_type": null,
|
19 |
+
"conditioning_channels": 3,
|
20 |
+
"conditioning_embedding_out_channels": [
|
21 |
+
16,
|
22 |
+
32,
|
23 |
+
96,
|
24 |
+
256
|
25 |
+
],
|
26 |
+
"controlnet_conditioning_channel_order": "rgb",
|
27 |
+
"cross_attention_dim": 2048,
|
28 |
+
"down_block_types": [
|
29 |
+
"DownBlock2D",
|
30 |
+
"CrossAttnDownBlock2D",
|
31 |
+
"CrossAttnDownBlock2D"
|
32 |
+
],
|
33 |
+
"downsample_padding": 1,
|
34 |
+
"encoder_hid_dim": null,
|
35 |
+
"encoder_hid_dim_type": null,
|
36 |
+
"flip_sin_to_cos": true,
|
37 |
+
"freq_shift": 0,
|
38 |
+
"global_pool_conditions": false,
|
39 |
+
"in_channels": 4,
|
40 |
+
"layers_per_block": 2,
|
41 |
+
"mid_block_scale_factor": 1,
|
42 |
+
"norm_eps": 1e-05,
|
43 |
+
"norm_num_groups": 32,
|
44 |
+
"num_attention_heads": null,
|
45 |
+
"num_class_embeds": null,
|
46 |
+
"only_cross_attention": false,
|
47 |
+
"projection_class_embeddings_input_dim": 2816,
|
48 |
+
"resnet_time_scale_shift": "default",
|
49 |
+
"transformer_layers_per_block": [
|
50 |
+
1,
|
51 |
+
2,
|
52 |
+
10
|
53 |
+
],
|
54 |
+
"upcast_attention": null,
|
55 |
+
"use_linear_projection": true
|
56 |
+
}
|
diffusion_pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7045e46da30684d8df4b08490d02f81881be146fe9d175559e393800a0353e61
|
3 |
+
size 5004438321
|
image_control.png
ADDED
images_0.png
ADDED
images_1.png
ADDED
images_2.png
ADDED
images_3.png
ADDED
images_4.png
ADDED
images_5.png
ADDED
images_6.png
ADDED
images_7.png
ADDED