juliajoanna committed on
Commit
c89dc3d
1 Parent(s): 3c81b81

End of training

Browse files
Files changed (44) hide show
  1. checkpoint-30000/optimizer.bin +3 -0
  2. checkpoint-30000/random_states_0.pkl +3 -0
  3. checkpoint-30000/scheduler.bin +3 -0
  4. checkpoint-30000/unet/config.json +73 -0
  5. checkpoint-30000/unet/diffusion_pytorch_model.safetensors +3 -0
  6. checkpoint-35000/optimizer.bin +3 -0
  7. checkpoint-35000/random_states_0.pkl +3 -0
  8. checkpoint-35000/scheduler.bin +3 -0
  9. checkpoint-35000/unet/config.json +73 -0
  10. checkpoint-35000/unet/diffusion_pytorch_model.safetensors +3 -0
  11. checkpoint-36000/optimizer.bin +3 -0
  12. checkpoint-36000/random_states_0.pkl +3 -0
  13. checkpoint-36000/scheduler.bin +3 -0
  14. checkpoint-36000/unet/config.json +73 -0
  15. checkpoint-36000/unet/diffusion_pytorch_model.safetensors +3 -0
  16. checkpoint-38000/optimizer.bin +3 -0
  17. checkpoint-38000/random_states_0.pkl +3 -0
  18. checkpoint-38000/scheduler.bin +3 -0
  19. checkpoint-38000/unet/config.json +73 -0
  20. checkpoint-38000/unet/diffusion_pytorch_model.safetensors +3 -0
  21. checkpoint-40000/optimizer.bin +3 -0
  22. checkpoint-40000/random_states_0.pkl +3 -0
  23. checkpoint-40000/scheduler.bin +3 -0
  24. checkpoint-40000/unet/config.json +73 -0
  25. checkpoint-40000/unet/diffusion_pytorch_model.safetensors +3 -0
  26. checkpoint-42000/optimizer.bin +3 -0
  27. checkpoint-42000/random_states_0.pkl +3 -0
  28. checkpoint-42000/scheduler.bin +3 -0
  29. checkpoint-42000/unet/config.json +73 -0
  30. checkpoint-42000/unet/diffusion_pytorch_model.safetensors +3 -0
  31. image_0.png +2 -2
  32. image_1.png +2 -2
  33. image_2.png +2 -2
  34. image_3.png +2 -2
  35. logs/text2image-fine-tune-sdxl/1699656452.4887972/events.out.tfevents.1699656452.4124gs01.2650294.1 +3 -0
  36. logs/text2image-fine-tune-sdxl/1699656452.491553/hparams.yml +56 -0
  37. logs/text2image-fine-tune-sdxl/1699656954.4301672/events.out.tfevents.1699656954.4124gs01.2655943.1 +3 -0
  38. logs/text2image-fine-tune-sdxl/1699656954.4332438/hparams.yml +56 -0
  39. logs/text2image-fine-tune-sdxl/1699823207.5531957/events.out.tfevents.1699823207.4124gs01.3988910.1 +3 -0
  40. logs/text2image-fine-tune-sdxl/1699823207.5553815/hparams.yml +56 -0
  41. logs/text2image-fine-tune-sdxl/events.out.tfevents.1699656452.4124gs01.2650294.0 +3 -0
  42. logs/text2image-fine-tune-sdxl/events.out.tfevents.1699656954.4124gs01.2655943.0 +3 -0
  43. logs/text2image-fine-tune-sdxl/events.out.tfevents.1699823207.4124gs01.3988910.0 +3 -0
  44. unet/diffusion_pytorch_model.safetensors +1 -1
checkpoint-30000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8d8363733395c84a0f8bf07c709d038bf8d7fab761a0085eda78b73fc8daa77
3
+ size 20541257440
checkpoint-30000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95f42ee69f77022bdd94e02f67bd7504b1a48b70a5cd656d5a447e2f61a1f82d
3
+ size 14408
checkpoint-30000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d2faaf212aa126fcd796f16fbf64e7b7d1c2ed68667cd1f56cf1968fa847cc3
3
+ size 1000
checkpoint-30000/unet/config.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.22.0.dev0",
4
+ "_name_or_path": "juliajoanna/sdxl-one_hot_encoding",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": "text_time",
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": 256,
9
+ "attention_head_dim": [
10
+ 5,
11
+ 10,
12
+ 20
13
+ ],
14
+ "attention_type": "default",
15
+ "block_out_channels": [
16
+ 320,
17
+ 640,
18
+ 1280
19
+ ],
20
+ "center_input_sample": false,
21
+ "class_embed_type": null,
22
+ "class_embeddings_concat": false,
23
+ "conv_in_kernel": 3,
24
+ "conv_out_kernel": 3,
25
+ "cross_attention_dim": 2048,
26
+ "cross_attention_norm": null,
27
+ "down_block_types": [
28
+ "DownBlock2D",
29
+ "CrossAttnDownBlock2D",
30
+ "CrossAttnDownBlock2D"
31
+ ],
32
+ "downsample_padding": 1,
33
+ "dropout": 0.0,
34
+ "dual_cross_attention": false,
35
+ "encoder_hid_dim": null,
36
+ "encoder_hid_dim_type": null,
37
+ "flip_sin_to_cos": true,
38
+ "freq_shift": 0,
39
+ "in_channels": 4,
40
+ "layers_per_block": 2,
41
+ "mid_block_only_cross_attention": null,
42
+ "mid_block_scale_factor": 1,
43
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
44
+ "norm_eps": 1e-05,
45
+ "norm_num_groups": 32,
46
+ "num_attention_heads": null,
47
+ "num_class_embeds": null,
48
+ "only_cross_attention": false,
49
+ "out_channels": 4,
50
+ "projection_class_embeddings_input_dim": 2816,
51
+ "resnet_out_scale_factor": 1.0,
52
+ "resnet_skip_time_act": false,
53
+ "resnet_time_scale_shift": "default",
54
+ "reverse_transformer_layers_per_block": null,
55
+ "sample_size": 128,
56
+ "time_cond_proj_dim": null,
57
+ "time_embedding_act_fn": null,
58
+ "time_embedding_dim": null,
59
+ "time_embedding_type": "positional",
60
+ "timestep_post_act": null,
61
+ "transformer_layers_per_block": [
62
+ 1,
63
+ 2,
64
+ 10
65
+ ],
66
+ "up_block_types": [
67
+ "CrossAttnUpBlock2D",
68
+ "CrossAttnUpBlock2D",
69
+ "UpBlock2D"
70
+ ],
71
+ "upcast_attention": null,
72
+ "use_linear_projection": true
73
+ }
checkpoint-30000/unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afa278820e5efeff55e3df9483e2ab3de65a75a80a6ac75610c3fd9de7e19a43
3
+ size 10270118880
checkpoint-35000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6caca421eb88dda18aa3e373f2dd9422eed3c7ee2a5851b5e8573dec55c1c7c7
3
+ size 20541257440
checkpoint-35000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:823c3b2e482e11f848d652553a65ee385331f803a1d5a403d219f37dccfdd269
3
+ size 14408
checkpoint-35000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8026b51bbdda9168a22fae82204316690f6b74d4230d31ebb84f6bcfbb02bef
3
+ size 1000
checkpoint-35000/unet/config.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.22.0.dev0",
4
+ "_name_or_path": "juliajoanna/sdxl-one_hot_encoding",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": "text_time",
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": 256,
9
+ "attention_head_dim": [
10
+ 5,
11
+ 10,
12
+ 20
13
+ ],
14
+ "attention_type": "default",
15
+ "block_out_channels": [
16
+ 320,
17
+ 640,
18
+ 1280
19
+ ],
20
+ "center_input_sample": false,
21
+ "class_embed_type": null,
22
+ "class_embeddings_concat": false,
23
+ "conv_in_kernel": 3,
24
+ "conv_out_kernel": 3,
25
+ "cross_attention_dim": 2048,
26
+ "cross_attention_norm": null,
27
+ "down_block_types": [
28
+ "DownBlock2D",
29
+ "CrossAttnDownBlock2D",
30
+ "CrossAttnDownBlock2D"
31
+ ],
32
+ "downsample_padding": 1,
33
+ "dropout": 0.0,
34
+ "dual_cross_attention": false,
35
+ "encoder_hid_dim": null,
36
+ "encoder_hid_dim_type": null,
37
+ "flip_sin_to_cos": true,
38
+ "freq_shift": 0,
39
+ "in_channels": 4,
40
+ "layers_per_block": 2,
41
+ "mid_block_only_cross_attention": null,
42
+ "mid_block_scale_factor": 1,
43
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
44
+ "norm_eps": 1e-05,
45
+ "norm_num_groups": 32,
46
+ "num_attention_heads": null,
47
+ "num_class_embeds": null,
48
+ "only_cross_attention": false,
49
+ "out_channels": 4,
50
+ "projection_class_embeddings_input_dim": 2816,
51
+ "resnet_out_scale_factor": 1.0,
52
+ "resnet_skip_time_act": false,
53
+ "resnet_time_scale_shift": "default",
54
+ "reverse_transformer_layers_per_block": null,
55
+ "sample_size": 128,
56
+ "time_cond_proj_dim": null,
57
+ "time_embedding_act_fn": null,
58
+ "time_embedding_dim": null,
59
+ "time_embedding_type": "positional",
60
+ "timestep_post_act": null,
61
+ "transformer_layers_per_block": [
62
+ 1,
63
+ 2,
64
+ 10
65
+ ],
66
+ "up_block_types": [
67
+ "CrossAttnUpBlock2D",
68
+ "CrossAttnUpBlock2D",
69
+ "UpBlock2D"
70
+ ],
71
+ "upcast_attention": null,
72
+ "use_linear_projection": true
73
+ }
checkpoint-35000/unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ead72fea11a8f175ed8648aa22523d8334dd291294f54955b7bb75faa035c117
3
+ size 10270118880
checkpoint-36000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2592153b82aa7554ec1fe055ff4c58fe0f0e3584e8d5e53554d2c655455c9d5
3
+ size 20541257440
checkpoint-36000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fb705cabc409eb301ee615dca7ac261957bd322f0bfe50fb0e463c133c54a0c
3
+ size 14408
checkpoint-36000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6489f6f9cd54e4e175d47407ead6426c363a86411ea0f4ea9dda3526c82b8d13
3
+ size 1000
checkpoint-36000/unet/config.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.22.0.dev0",
4
+ "_name_or_path": "sdxl-flintstones-one_hot_encoding/checkpoint-35000",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": "text_time",
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": 256,
9
+ "attention_head_dim": [
10
+ 5,
11
+ 10,
12
+ 20
13
+ ],
14
+ "attention_type": "default",
15
+ "block_out_channels": [
16
+ 320,
17
+ 640,
18
+ 1280
19
+ ],
20
+ "center_input_sample": false,
21
+ "class_embed_type": null,
22
+ "class_embeddings_concat": false,
23
+ "conv_in_kernel": 3,
24
+ "conv_out_kernel": 3,
25
+ "cross_attention_dim": 2048,
26
+ "cross_attention_norm": null,
27
+ "down_block_types": [
28
+ "DownBlock2D",
29
+ "CrossAttnDownBlock2D",
30
+ "CrossAttnDownBlock2D"
31
+ ],
32
+ "downsample_padding": 1,
33
+ "dropout": 0.0,
34
+ "dual_cross_attention": false,
35
+ "encoder_hid_dim": null,
36
+ "encoder_hid_dim_type": null,
37
+ "flip_sin_to_cos": true,
38
+ "freq_shift": 0,
39
+ "in_channels": 4,
40
+ "layers_per_block": 2,
41
+ "mid_block_only_cross_attention": null,
42
+ "mid_block_scale_factor": 1,
43
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
44
+ "norm_eps": 1e-05,
45
+ "norm_num_groups": 32,
46
+ "num_attention_heads": null,
47
+ "num_class_embeds": null,
48
+ "only_cross_attention": false,
49
+ "out_channels": 4,
50
+ "projection_class_embeddings_input_dim": 2816,
51
+ "resnet_out_scale_factor": 1.0,
52
+ "resnet_skip_time_act": false,
53
+ "resnet_time_scale_shift": "default",
54
+ "reverse_transformer_layers_per_block": null,
55
+ "sample_size": 128,
56
+ "time_cond_proj_dim": null,
57
+ "time_embedding_act_fn": null,
58
+ "time_embedding_dim": null,
59
+ "time_embedding_type": "positional",
60
+ "timestep_post_act": null,
61
+ "transformer_layers_per_block": [
62
+ 1,
63
+ 2,
64
+ 10
65
+ ],
66
+ "up_block_types": [
67
+ "CrossAttnUpBlock2D",
68
+ "CrossAttnUpBlock2D",
69
+ "UpBlock2D"
70
+ ],
71
+ "upcast_attention": null,
72
+ "use_linear_projection": true
73
+ }
checkpoint-36000/unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:549f99662c9f37725b4bd27de36dbfa5fb3610027d6191896530e13a773274c7
3
+ size 10270118880
checkpoint-38000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1532f2f6211b27a2d36cb9b7a8c79e4f5167dfa4264b99e68728a73ea0f9854
3
+ size 20541257440
checkpoint-38000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:473bdd915fcd3dfb7474e63748a71816106c5cd0782afc15cabfa4d39e90840a
3
+ size 14408
checkpoint-38000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31623982e167dcb660754a465ba48aa312ac3e645ccfee0c89bccc3e415a027c
3
+ size 1000
checkpoint-38000/unet/config.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.22.0.dev0",
4
+ "_name_or_path": "sdxl-flintstones-one_hot_encoding/checkpoint-35000",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": "text_time",
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": 256,
9
+ "attention_head_dim": [
10
+ 5,
11
+ 10,
12
+ 20
13
+ ],
14
+ "attention_type": "default",
15
+ "block_out_channels": [
16
+ 320,
17
+ 640,
18
+ 1280
19
+ ],
20
+ "center_input_sample": false,
21
+ "class_embed_type": null,
22
+ "class_embeddings_concat": false,
23
+ "conv_in_kernel": 3,
24
+ "conv_out_kernel": 3,
25
+ "cross_attention_dim": 2048,
26
+ "cross_attention_norm": null,
27
+ "down_block_types": [
28
+ "DownBlock2D",
29
+ "CrossAttnDownBlock2D",
30
+ "CrossAttnDownBlock2D"
31
+ ],
32
+ "downsample_padding": 1,
33
+ "dropout": 0.0,
34
+ "dual_cross_attention": false,
35
+ "encoder_hid_dim": null,
36
+ "encoder_hid_dim_type": null,
37
+ "flip_sin_to_cos": true,
38
+ "freq_shift": 0,
39
+ "in_channels": 4,
40
+ "layers_per_block": 2,
41
+ "mid_block_only_cross_attention": null,
42
+ "mid_block_scale_factor": 1,
43
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
44
+ "norm_eps": 1e-05,
45
+ "norm_num_groups": 32,
46
+ "num_attention_heads": null,
47
+ "num_class_embeds": null,
48
+ "only_cross_attention": false,
49
+ "out_channels": 4,
50
+ "projection_class_embeddings_input_dim": 2816,
51
+ "resnet_out_scale_factor": 1.0,
52
+ "resnet_skip_time_act": false,
53
+ "resnet_time_scale_shift": "default",
54
+ "reverse_transformer_layers_per_block": null,
55
+ "sample_size": 128,
56
+ "time_cond_proj_dim": null,
57
+ "time_embedding_act_fn": null,
58
+ "time_embedding_dim": null,
59
+ "time_embedding_type": "positional",
60
+ "timestep_post_act": null,
61
+ "transformer_layers_per_block": [
62
+ 1,
63
+ 2,
64
+ 10
65
+ ],
66
+ "up_block_types": [
67
+ "CrossAttnUpBlock2D",
68
+ "CrossAttnUpBlock2D",
69
+ "UpBlock2D"
70
+ ],
71
+ "upcast_attention": null,
72
+ "use_linear_projection": true
73
+ }
checkpoint-38000/unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3231c83425bdfbb53baff7bd6737db7b816c487584036b4ab971547220bf4ae
3
+ size 10270118880
checkpoint-40000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c499ffc7774d2750070842ec854a0173dddd5c0a1c9014daf55acf79356e549
3
+ size 20541257440
checkpoint-40000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fab5ea89eeefcbf728c4961507ad533c9631a287b992921155b8fd4b3a13a91d
3
+ size 14408
checkpoint-40000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:75f2643b5c13a9dffe551c00261dd7710fb82717e4dee239483895407e584871
3
+ size 1000
checkpoint-40000/unet/config.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.22.0.dev0",
4
+ "_name_or_path": "sdxl-flintstones-one_hot_encoding/checkpoint-35000",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": "text_time",
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": 256,
9
+ "attention_head_dim": [
10
+ 5,
11
+ 10,
12
+ 20
13
+ ],
14
+ "attention_type": "default",
15
+ "block_out_channels": [
16
+ 320,
17
+ 640,
18
+ 1280
19
+ ],
20
+ "center_input_sample": false,
21
+ "class_embed_type": null,
22
+ "class_embeddings_concat": false,
23
+ "conv_in_kernel": 3,
24
+ "conv_out_kernel": 3,
25
+ "cross_attention_dim": 2048,
26
+ "cross_attention_norm": null,
27
+ "down_block_types": [
28
+ "DownBlock2D",
29
+ "CrossAttnDownBlock2D",
30
+ "CrossAttnDownBlock2D"
31
+ ],
32
+ "downsample_padding": 1,
33
+ "dropout": 0.0,
34
+ "dual_cross_attention": false,
35
+ "encoder_hid_dim": null,
36
+ "encoder_hid_dim_type": null,
37
+ "flip_sin_to_cos": true,
38
+ "freq_shift": 0,
39
+ "in_channels": 4,
40
+ "layers_per_block": 2,
41
+ "mid_block_only_cross_attention": null,
42
+ "mid_block_scale_factor": 1,
43
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
44
+ "norm_eps": 1e-05,
45
+ "norm_num_groups": 32,
46
+ "num_attention_heads": null,
47
+ "num_class_embeds": null,
48
+ "only_cross_attention": false,
49
+ "out_channels": 4,
50
+ "projection_class_embeddings_input_dim": 2816,
51
+ "resnet_out_scale_factor": 1.0,
52
+ "resnet_skip_time_act": false,
53
+ "resnet_time_scale_shift": "default",
54
+ "reverse_transformer_layers_per_block": null,
55
+ "sample_size": 128,
56
+ "time_cond_proj_dim": null,
57
+ "time_embedding_act_fn": null,
58
+ "time_embedding_dim": null,
59
+ "time_embedding_type": "positional",
60
+ "timestep_post_act": null,
61
+ "transformer_layers_per_block": [
62
+ 1,
63
+ 2,
64
+ 10
65
+ ],
66
+ "up_block_types": [
67
+ "CrossAttnUpBlock2D",
68
+ "CrossAttnUpBlock2D",
69
+ "UpBlock2D"
70
+ ],
71
+ "upcast_attention": null,
72
+ "use_linear_projection": true
73
+ }
checkpoint-40000/unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb4d050284412762c8d95d707626862db8973fd0f9aa71210a36926fd1f00b40
3
+ size 10270118880
checkpoint-42000/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:155bf2eeb0a204f5af43ea33fe865781bb0b492ac303cbc8173c1d41b6441058
3
+ size 20541257440
checkpoint-42000/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c89e8a09220a0207340bd46651f211a09f7c28ff9955700aa838ecbd45771e35
3
+ size 14408
checkpoint-42000/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e37b0301a40b52b14559c7525909cf8e5374cd9d2b87d0e26a3cf878c2f016d3
3
+ size 1000
checkpoint-42000/unet/config.json ADDED
@@ -0,0 +1,73 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_class_name": "UNet2DConditionModel",
3
+ "_diffusers_version": "0.22.0.dev0",
4
+ "_name_or_path": "sdxl-flintstones-one_hot_encoding/checkpoint-35000",
5
+ "act_fn": "silu",
6
+ "addition_embed_type": "text_time",
7
+ "addition_embed_type_num_heads": 64,
8
+ "addition_time_embed_dim": 256,
9
+ "attention_head_dim": [
10
+ 5,
11
+ 10,
12
+ 20
13
+ ],
14
+ "attention_type": "default",
15
+ "block_out_channels": [
16
+ 320,
17
+ 640,
18
+ 1280
19
+ ],
20
+ "center_input_sample": false,
21
+ "class_embed_type": null,
22
+ "class_embeddings_concat": false,
23
+ "conv_in_kernel": 3,
24
+ "conv_out_kernel": 3,
25
+ "cross_attention_dim": 2048,
26
+ "cross_attention_norm": null,
27
+ "down_block_types": [
28
+ "DownBlock2D",
29
+ "CrossAttnDownBlock2D",
30
+ "CrossAttnDownBlock2D"
31
+ ],
32
+ "downsample_padding": 1,
33
+ "dropout": 0.0,
34
+ "dual_cross_attention": false,
35
+ "encoder_hid_dim": null,
36
+ "encoder_hid_dim_type": null,
37
+ "flip_sin_to_cos": true,
38
+ "freq_shift": 0,
39
+ "in_channels": 4,
40
+ "layers_per_block": 2,
41
+ "mid_block_only_cross_attention": null,
42
+ "mid_block_scale_factor": 1,
43
+ "mid_block_type": "UNetMidBlock2DCrossAttn",
44
+ "norm_eps": 1e-05,
45
+ "norm_num_groups": 32,
46
+ "num_attention_heads": null,
47
+ "num_class_embeds": null,
48
+ "only_cross_attention": false,
49
+ "out_channels": 4,
50
+ "projection_class_embeddings_input_dim": 2816,
51
+ "resnet_out_scale_factor": 1.0,
52
+ "resnet_skip_time_act": false,
53
+ "resnet_time_scale_shift": "default",
54
+ "reverse_transformer_layers_per_block": null,
55
+ "sample_size": 128,
56
+ "time_cond_proj_dim": null,
57
+ "time_embedding_act_fn": null,
58
+ "time_embedding_dim": null,
59
+ "time_embedding_type": "positional",
60
+ "timestep_post_act": null,
61
+ "transformer_layers_per_block": [
62
+ 1,
63
+ 2,
64
+ 10
65
+ ],
66
+ "up_block_types": [
67
+ "CrossAttnUpBlock2D",
68
+ "CrossAttnUpBlock2D",
69
+ "UpBlock2D"
70
+ ],
71
+ "upcast_attention": null,
72
+ "use_linear_projection": true
73
+ }
checkpoint-42000/unet/diffusion_pytorch_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c792d307d583900177ea676e58df7044d55662a85abbe1c907e71b10831a0d9
3
+ size 10270118880
image_0.png CHANGED

Git LFS Details

  • SHA256: d0aa6a6a6f913e5a0855d9ee91b4070946987590e298c7f31cba3967bbd5015d
  • Pointer size: 132 Bytes
  • Size of remote file: 1.28 MB

Git LFS Details

  • SHA256: 14be188a8520ed5b4dbc1d3573b25d54745ebd7a1d5c070675a8a6b3ce6031f2
  • Pointer size: 132 Bytes
  • Size of remote file: 1.18 MB
image_1.png CHANGED

Git LFS Details

  • SHA256: c643c50860476aa57bd1bee2e99a3f1375dc5df85d6efb00e804dc08a42d061a
  • Pointer size: 132 Bytes
  • Size of remote file: 1.09 MB

Git LFS Details

  • SHA256: 5f390b9ad92e86ae7e37196fc52b253751d85a124a99f05888789166092b79bd
  • Pointer size: 132 Bytes
  • Size of remote file: 1.24 MB
image_2.png CHANGED

Git LFS Details

  • SHA256: cda3d1e343e6a963b8a69ff3979ca5b47332e435a72d37563fd58b81ec5ee190
  • Pointer size: 132 Bytes
  • Size of remote file: 1.24 MB

Git LFS Details

  • SHA256: f58c59295230291773e197f9316a21e69256aed2aaa23cde7c74f47b4a0af25f
  • Pointer size: 132 Bytes
  • Size of remote file: 1.29 MB
image_3.png CHANGED

Git LFS Details

  • SHA256: 86a4ef78d86af1b4e91c8a350a7aace66737b2bc36f1e1b96b28efac6e90c5fc
  • Pointer size: 132 Bytes
  • Size of remote file: 1.17 MB

Git LFS Details

  • SHA256: 20140980d7305b45323df29a6704475ff1af882e57e4109675f2da65888967a3
  • Pointer size: 132 Bytes
  • Size of remote file: 1.29 MB
logs/text2image-fine-tune-sdxl/1699656452.4887972/events.out.tfevents.1699656452.4124gs01.2650294.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1623257be848f086b3512bc98edff203e1ac58e45bd81f3c59f0ad82abe89002
3
+ size 2770
logs/text2image-fine-tune-sdxl/1699656452.491553/hparams.yml ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ caption_column: text
8
+ center_crop: true
9
+ checkpointing_steps: 2000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ enable_xformers_memory_efficient_attention: true
15
+ gradient_accumulation_steps: 4
16
+ gradient_checkpointing: true
17
+ hub_model_id: null
18
+ hub_token: null
19
+ image_column: image
20
+ learning_rate: 1.0e-06
21
+ local_rank: -1
22
+ logging_dir: logs
23
+ lr_scheduler: constant
24
+ lr_warmup_steps: 0
25
+ max_grad_norm: 1.0
26
+ max_train_samples: null
27
+ max_train_steps: 0
28
+ mixed_precision: null
29
+ noise_offset: 0
30
+ num_train_epochs: 0
31
+ num_validation_images: 4
32
+ output_dir: sdxl-flintstones-one_hot_encoding
33
+ prediction_type: null
34
+ pretrained_model_name_or_path: juliajoanna/sdxl-one_hot_encoding
35
+ pretrained_vae_model_name_or_path: madebyollin/sdxl-vae-fp16-fix
36
+ proportion_empty_prompts: 0.0
37
+ push_to_hub: true
38
+ random_flip: false
39
+ report_to: tensorboard
40
+ resolution: 1024
41
+ resume_from_checkpoint: latest
42
+ revision: null
43
+ scale_lr: false
44
+ seed: null
45
+ snr_gamma: null
46
+ timestep_bias_begin: 0
47
+ timestep_bias_end: 1000
48
+ timestep_bias_multiplier: 1.0
49
+ timestep_bias_portion: 0.25
50
+ timestep_bias_strategy: none
51
+ train_batch_size: 1
52
+ train_data_dir: fake_dataset
53
+ use_8bit_adam: false
54
+ use_ema: false
55
+ validation_epochs: 1
56
+ validation_prompt: Fred is driving a car
logs/text2image-fine-tune-sdxl/1699656954.4301672/events.out.tfevents.1699656954.4124gs01.2655943.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51405945081a9e70ae843121977ae9195023da620bf0ee0298ac4b2f3e48dc5f
3
+ size 2770
logs/text2image-fine-tune-sdxl/1699656954.4332438/hparams.yml ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ caption_column: text
8
+ center_crop: true
9
+ checkpointing_steps: 2000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ enable_xformers_memory_efficient_attention: true
15
+ gradient_accumulation_steps: 4
16
+ gradient_checkpointing: true
17
+ hub_model_id: null
18
+ hub_token: null
19
+ image_column: image
20
+ learning_rate: 1.0e-06
21
+ local_rank: -1
22
+ logging_dir: logs
23
+ lr_scheduler: constant
24
+ lr_warmup_steps: 0
25
+ max_grad_norm: 1.0
26
+ max_train_samples: null
27
+ max_train_steps: 0
28
+ mixed_precision: null
29
+ noise_offset: 0
30
+ num_train_epochs: 0
31
+ num_validation_images: 4
32
+ output_dir: sdxl-flintstones-one_hot_encoding
33
+ prediction_type: null
34
+ pretrained_model_name_or_path: juliajoanna/sdxl-one_hot_encoding
35
+ pretrained_vae_model_name_or_path: madebyollin/sdxl-vae-fp16-fix
36
+ proportion_empty_prompts: 0.0
37
+ push_to_hub: true
38
+ random_flip: false
39
+ report_to: tensorboard
40
+ resolution: 1024
41
+ resume_from_checkpoint: latest
42
+ revision: null
43
+ scale_lr: false
44
+ seed: null
45
+ snr_gamma: null
46
+ timestep_bias_begin: 0
47
+ timestep_bias_end: 1000
48
+ timestep_bias_multiplier: 1.0
49
+ timestep_bias_portion: 0.25
50
+ timestep_bias_strategy: none
51
+ train_batch_size: 1
52
+ train_data_dir: fake_dataset
53
+ use_8bit_adam: false
54
+ use_ema: false
55
+ validation_epochs: 1
56
+ validation_prompt: Fred is driving a car
logs/text2image-fine-tune-sdxl/1699823207.5531957/events.out.tfevents.1699823207.4124gs01.3988910.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80542f621f151002a1242a9047306ab3b5b38d7b7cb40e1e0206b73c36852bdc
3
+ size 2770
logs/text2image-fine-tune-sdxl/1699823207.5553815/hparams.yml ADDED
@@ -0,0 +1,56 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ cache_dir: null
7
+ caption_column: text
8
+ center_crop: true
9
+ checkpointing_steps: 2000
10
+ checkpoints_total_limit: null
11
+ dataloader_num_workers: 0
12
+ dataset_config_name: null
13
+ dataset_name: null
14
+ enable_xformers_memory_efficient_attention: true
15
+ gradient_accumulation_steps: 4
16
+ gradient_checkpointing: true
17
+ hub_model_id: null
18
+ hub_token: null
19
+ image_column: image
20
+ learning_rate: 1.0e-06
21
+ local_rank: -1
22
+ logging_dir: logs
23
+ lr_scheduler: constant
24
+ lr_warmup_steps: 0
25
+ max_grad_norm: 1.0
26
+ max_train_samples: null
27
+ max_train_steps: 0
28
+ mixed_precision: null
29
+ noise_offset: 0
30
+ num_train_epochs: 0
31
+ num_validation_images: 4
32
+ output_dir: sdxl-flintstones-one_hot_encoding
33
+ prediction_type: null
34
+ pretrained_model_name_or_path: juliajoanna/sdxl-one_hot_encoding
35
+ pretrained_vae_model_name_or_path: madebyollin/sdxl-vae-fp16-fix
36
+ proportion_empty_prompts: 0.0
37
+ push_to_hub: true
38
+ random_flip: false
39
+ report_to: tensorboard
40
+ resolution: 1024
41
+ resume_from_checkpoint: latest
42
+ revision: null
43
+ scale_lr: false
44
+ seed: null
45
+ snr_gamma: null
46
+ timestep_bias_begin: 0
47
+ timestep_bias_end: 1000
48
+ timestep_bias_multiplier: 1.0
49
+ timestep_bias_portion: 0.25
50
+ timestep_bias_strategy: none
51
+ train_batch_size: 1
52
+ train_data_dir: fake_dataset
53
+ use_8bit_adam: false
54
+ use_ema: false
55
+ validation_epochs: 1
56
+ validation_prompt: Fred is driving a car
logs/text2image-fine-tune-sdxl/events.out.tfevents.1699656452.4124gs01.2650294.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9eb1a28995562e0c3202371b0d5701ad81f0af79e6a0b2bf6109601d644cd8b0
3
+ size 88
logs/text2image-fine-tune-sdxl/events.out.tfevents.1699656954.4124gs01.2655943.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3b04eb62fb91afda658dbcbbe9fdf3e2a30376e7c6aca13a9f5d3cab6a7ef60
3
+ size 88
logs/text2image-fine-tune-sdxl/events.out.tfevents.1699823207.4124gs01.3988910.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49c152749958e3868d917c054f27927080892a6a1df75c077d42dbc9e84dcf16
3
+ size 5054840
unet/diffusion_pytorch_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7708d35cd8624da665dc062bb3240dcbd0ded002cc9e185658ae05bbbeba97d9
3
  size 10270118880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de944f5cc24c3a426a7e10da130575258e9d648cdf97e2aac259d596f6ef4abc
3
  size 10270118880