rcannizzaro
committed on
Commit
•
17ed67a
1
Parent(s):
d6de8bb
End of training
Browse files
- README.md +54 -0
- checkpoint-10/optimizer.bin +3 -0
- checkpoint-10/random_states_0.pkl +3 -0
- checkpoint-10/scaler.pt +3 -0
- checkpoint-10/scheduler.bin +3 -0
- checkpoint-10/vae/config.json +36 -0
- checkpoint-10/vae/diffusion_pytorch_model.safetensors +3 -0
- checkpoint-5/optimizer.bin +3 -0
- checkpoint-5/random_states_0.pkl +3 -0
- checkpoint-5/scaler.pt +3 -0
- checkpoint-5/scheduler.bin +3 -0
- checkpoint-5/vae/config.json +36 -0
- checkpoint-5/vae/diffusion_pytorch_model.safetensors +3 -0
- config.json +36 -0
- diffusion_pytorch_model.safetensors +3 -0
- val_imgs_grid.png +0 -0
README.md
ADDED
@@ -0,0 +1,54 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: creativeml-openrail-m
|
3 |
+
library_name: diffusers
|
4 |
+
tags:
|
5 |
+
- stable-diffusion
|
6 |
+
- stable-diffusion-diffusers
|
7 |
+
- text-to-image
|
8 |
+
- diffusers
|
9 |
+
- diffusers-training
|
10 |
+
inference: true
|
11 |
+
---
|
12 |
+
|
13 |
+
<!-- This model card has been generated automatically according to the information the training script had access to. You
|
14 |
+
should probably proofread and complete it, then remove this comment. -->
|
15 |
+
|
16 |
+
|
17 |
+
# Text-to-image finetuning - rcannizzaro/vae-dsprites-counterfactual
|
18 |
+
|
19 |
+
This model was trained on the **osazuwa/dsprite-counterfactual** dataset; the training script recorded no base model (base model: **None**). Below is a grid of example validation images produced with the trained model:
|
20 |
+
|
21 |
+
![val_imgs_grid](./val_imgs_grid.png)
|
22 |
+
|
23 |
+
|
24 |
+
|
25 |
+
## Training info
|
26 |
+
|
27 |
+
These are the key hyperparameters used during training:
|
28 |
+
|
29 |
+
* Epochs: 1
|
30 |
+
* Learning rate: 1e-05
|
31 |
+
* Batch size: 250
|
32 |
+
* Gradient accumulation steps: 1
|
33 |
+
* Image resolution: 64
|
34 |
+
* Mixed-precision: fp16
|
35 |
+
|
36 |
+
|
37 |
+
More information on all the CLI arguments and the environment is available on your [`wandb` run page](https://microsoft-research.wandb.io/t-ricardoc/vae-dsprites-counterfactual/runs/ju56tobe).
|
38 |
+
|
39 |
+
|
40 |
+
## Intended uses & limitations
|
41 |
+
|
42 |
+
#### How to use
|
43 |
+
|
44 |
+
```python
|
45 |
+
# TODO: add an example code snippet for running this diffusion pipeline
|
46 |
+
```
|
47 |
+
|
48 |
+
#### Limitations and bias
|
49 |
+
|
50 |
+
[TODO: provide examples of latent issues and potential remediations]
|
51 |
+
|
52 |
+
## Training details
|
53 |
+
|
54 |
+
[TODO: describe the data used to train the model]
|
checkpoint-10/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d340d62245ed3691226236c66b1b89a4694a5814dec2e77a42512479b3e7796
|
3 |
+
size 1640
|
checkpoint-10/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecfa6f85341e8e319b00c22dd3828c39c4bfc92734d5b06a42a9147e27a53941
|
3 |
+
size 14344
|
checkpoint-10/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9da5697df775cfff0a9ff85d168c3edb6195eebc2da426dd4afe6b731480e7a7
|
3 |
+
size 988
|
checkpoint-10/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d844ae8442bf0a85e668fb349e07cdc6c2d015de122d8d84e559ff95250e2a6c
|
3 |
+
size 1000
|
checkpoint-10/vae/config.json
ADDED
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "AutoencoderKL",
|
3 |
+
"_diffusers_version": "0.30.0.dev0",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"block_out_channels": [
|
6 |
+
128,
|
7 |
+
256,
|
8 |
+
512,
|
9 |
+
512
|
10 |
+
],
|
11 |
+
"down_block_types": [
|
12 |
+
"DownEncoderBlock2D",
|
13 |
+
"DownEncoderBlock2D",
|
14 |
+
"DownEncoderBlock2D",
|
15 |
+
"DownEncoderBlock2D"
|
16 |
+
],
|
17 |
+
"force_upcast": true,
|
18 |
+
"in_channels": 1,
|
19 |
+
"latent_channels": 4,
|
20 |
+
"latents_mean": null,
|
21 |
+
"latents_std": null,
|
22 |
+
"layers_per_block": 2,
|
23 |
+
"norm_num_groups": 32,
|
24 |
+
"out_channels": 1,
|
25 |
+
"sample_size": 64,
|
26 |
+
"scaling_factor": 0.18215,
|
27 |
+
"shift_factor": null,
|
28 |
+
"up_block_types": [
|
29 |
+
"UpDecoderBlock2D",
|
30 |
+
"UpDecoderBlock2D",
|
31 |
+
"UpDecoderBlock2D",
|
32 |
+
"UpDecoderBlock2D"
|
33 |
+
],
|
34 |
+
"use_post_quant_conv": true,
|
35 |
+
"use_quant_conv": true
|
36 |
+
}
|
checkpoint-10/vae/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d38d5589837d83fd5e7cc02743dd47d487a678f6c0a67e4e6c352f8d528c61e1
|
3 |
+
size 334624828
|
checkpoint-5/optimizer.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d340d62245ed3691226236c66b1b89a4694a5814dec2e77a42512479b3e7796
|
3 |
+
size 1640
|
checkpoint-5/random_states_0.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6104ee28a6a4352b7b51eb0ac6939d120b3a9305536eba8b822fbe1ab221d3b8
|
3 |
+
size 14344
|
checkpoint-5/scaler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11c2ec697a3b8b5a4895af88c59dbba480386a7d5b8df6ae55e6659177ce0be4
|
3 |
+
size 988
|
checkpoint-5/scheduler.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d844ae8442bf0a85e668fb349e07cdc6c2d015de122d8d84e559ff95250e2a6c
|
3 |
+
size 1000
|
checkpoint-5/vae/config.json
ADDED
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "AutoencoderKL",
|
3 |
+
"_diffusers_version": "0.30.0.dev0",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"block_out_channels": [
|
6 |
+
128,
|
7 |
+
256,
|
8 |
+
512,
|
9 |
+
512
|
10 |
+
],
|
11 |
+
"down_block_types": [
|
12 |
+
"DownEncoderBlock2D",
|
13 |
+
"DownEncoderBlock2D",
|
14 |
+
"DownEncoderBlock2D",
|
15 |
+
"DownEncoderBlock2D"
|
16 |
+
],
|
17 |
+
"force_upcast": true,
|
18 |
+
"in_channels": 1,
|
19 |
+
"latent_channels": 4,
|
20 |
+
"latents_mean": null,
|
21 |
+
"latents_std": null,
|
22 |
+
"layers_per_block": 2,
|
23 |
+
"norm_num_groups": 32,
|
24 |
+
"out_channels": 1,
|
25 |
+
"sample_size": 64,
|
26 |
+
"scaling_factor": 0.18215,
|
27 |
+
"shift_factor": null,
|
28 |
+
"up_block_types": [
|
29 |
+
"UpDecoderBlock2D",
|
30 |
+
"UpDecoderBlock2D",
|
31 |
+
"UpDecoderBlock2D",
|
32 |
+
"UpDecoderBlock2D"
|
33 |
+
],
|
34 |
+
"use_post_quant_conv": true,
|
35 |
+
"use_quant_conv": true
|
36 |
+
}
|
checkpoint-5/vae/diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d38d5589837d83fd5e7cc02743dd47d487a678f6c0a67e4e6c352f8d528c61e1
|
3 |
+
size 334624828
|
config.json
ADDED
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_class_name": "AutoencoderKL",
|
3 |
+
"_diffusers_version": "0.30.0.dev0",
|
4 |
+
"act_fn": "silu",
|
5 |
+
"block_out_channels": [
|
6 |
+
128,
|
7 |
+
256,
|
8 |
+
512,
|
9 |
+
512
|
10 |
+
],
|
11 |
+
"down_block_types": [
|
12 |
+
"DownEncoderBlock2D",
|
13 |
+
"DownEncoderBlock2D",
|
14 |
+
"DownEncoderBlock2D",
|
15 |
+
"DownEncoderBlock2D"
|
16 |
+
],
|
17 |
+
"force_upcast": true,
|
18 |
+
"in_channels": 1,
|
19 |
+
"latent_channels": 4,
|
20 |
+
"latents_mean": null,
|
21 |
+
"latents_std": null,
|
22 |
+
"layers_per_block": 2,
|
23 |
+
"norm_num_groups": 32,
|
24 |
+
"out_channels": 1,
|
25 |
+
"sample_size": 64,
|
26 |
+
"scaling_factor": 0.18215,
|
27 |
+
"shift_factor": null,
|
28 |
+
"up_block_types": [
|
29 |
+
"UpDecoderBlock2D",
|
30 |
+
"UpDecoderBlock2D",
|
31 |
+
"UpDecoderBlock2D",
|
32 |
+
"UpDecoderBlock2D"
|
33 |
+
],
|
34 |
+
"use_post_quant_conv": true,
|
35 |
+
"use_quant_conv": true
|
36 |
+
}
|
diffusion_pytorch_model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d38d5589837d83fd5e7cc02743dd47d487a678f6c0a67e4e6c352f8d528c61e1
|
3 |
+
size 334624828
|
val_imgs_grid.png
ADDED