Commit 458f2d9 (1 parent: 10eeab0), committed by p1atdev

upload v1-3-0 diffusers weights (#1)


- upload v1-3-0 diffusers weights (b20d811cf5190ed17794e54f3ee5a4e59c5e297d)

model_index.json CHANGED
@@ -2,17 +2,17 @@
   "_class_name": "StableDiffusionPipeline",
   "_diffusers_version": "0.10.2",
   "feature_extractor": [
-    "transformers",
-    "CLIPImageProcessor"
+    null,
+    null
   ],
-  "requires_safety_checker": true,
+  "requires_safety_checker": null,
   "safety_checker": [
-    "stable_diffusion",
-    "StableDiffusionSafetyChecker"
+    null,
+    null
   ],
   "scheduler": [
     "diffusers",
-    "PNDMScheduler"
+    "DDIMScheduler"
   ],
   "text_encoder": [
     "transformers",
scheduler/scheduler_config.json CHANGED
@@ -1,5 +1,5 @@
 {
-  "_class_name": "PNDMScheduler",
+  "_class_name": "DDIMScheduler",
   "_diffusers_version": "0.10.2",
   "beta_end": 0.012,
   "beta_schedule": "scaled_linear",
text_encoder/config.json CHANGED
@@ -1,5 +1,4 @@
 {
-  "_name_or_path": "openai/clip-vit-large-patch14",
   "architectures": [
     "CLIPTextModel"
   ],
@@ -7,18 +6,18 @@
   "bos_token_id": 0,
   "dropout": 0.0,
   "eos_token_id": 2,
-  "hidden_act": "quick_gelu",
-  "hidden_size": 768,
+  "hidden_act": "gelu",
+  "hidden_size": 1024,
   "initializer_factor": 1.0,
   "initializer_range": 0.02,
-  "intermediate_size": 3072,
+  "intermediate_size": 4096,
   "layer_norm_eps": 1e-05,
   "max_position_embeddings": 77,
   "model_type": "clip_text_model",
-  "num_attention_heads": 12,
-  "num_hidden_layers": 12,
+  "num_attention_heads": 16,
+  "num_hidden_layers": 23,
   "pad_token_id": 1,
-  "projection_dim": 768,
+  "projection_dim": 512,
   "torch_dtype": "float32",
   "transformers_version": "4.25.1",
   "vocab_size": 49408
text_encoder/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:aad0e7cec126b7ee2a36e52fef25ffc4a8c41ff0b2c7a1cd07f5e693680edab5
-size 492307041
+oid sha256:e150a734015803fc60b495d0657b89c17e1d9fb193236d2db476556097b89139
+size 1361671895
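
The pointer size is consistent with the larger encoder; a back-of-envelope check at 4 bytes per float32 parameter, ignoring pickle overhead:

```python
print(1_361_671_895 / 4 / 1e6)  # ≈ 340.4M parameters (new ViT-H-style encoder)
print(492_307_041 / 4 / 1e6)    # ≈ 123.1M parameters (old ViT-L encoder)
```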
tokenizer/special_tokens_map.json CHANGED
@@ -13,7 +13,7 @@
     "rstrip": false,
     "single_word": false
   },
-  "pad_token": "<|endoftext|>",
+  "pad_token": "!",
   "unk_token": {
     "content": "<|endoftext|>",
     "lstrip": false,
tokenizer/tokenizer_config.json CHANGED
@@ -19,7 +19,7 @@
   },
   "errors": "replace",
   "model_max_length": 77,
-  "name_or_path": "openai/clip-vit-large-patch14",
+  "name_or_path": "D:\\Documents\\Python\\diffusers\\waifu-diffusion",
   "pad_token": "<|endoftext|>",
   "special_tokens_map_file": "./special_tokens_map.json",
   "tokenizer_class": "CLIPTokenizer",
unet/config.json CHANGED
@@ -2,7 +2,12 @@
   "_class_name": "UNet2DConditionModel",
   "_diffusers_version": "0.10.2",
   "act_fn": "silu",
-  "attention_head_dim": 8,
+  "attention_head_dim": [
+    5,
+    10,
+    20,
+    20
+  ],
   "block_out_channels": [
     320,
     640,
@@ -10,7 +15,7 @@
     1280
   ],
   "center_input_sample": false,
-  "cross_attention_dim": 768,
+  "cross_attention_dim": 1024,
   "down_block_types": [
     "CrossAttnDownBlock2D",
     "CrossAttnDownBlock2D",
@@ -29,7 +34,7 @@
   "num_class_embeds": null,
   "only_cross_attention": false,
   "out_channels": 4,
-  "sample_size": 64,
+  "sample_size": 32,
   "up_block_types": [
     "UpBlock2D",
     "CrossAttnUpBlock2D",
unet/diffusion_pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c0f4d4531f47a3b095c35b1869badc7e9c3d2d4531106fe22c5c8644089094eb
-size 3438366373
+oid sha256:1ee56a201b46af5e9178be6f4de76c546b0d4cf56e77267714175bde7f25d591
+size 3463913765
vae/config.json CHANGED
@@ -19,7 +19,7 @@
   "layers_per_block": 2,
   "norm_num_groups": 32,
   "out_channels": 3,
-  "sample_size": 512,
+  "sample_size": 256,
   "up_block_types": [
     "UpDecoderBlock2D",
     "UpDecoderBlock2D",
vae/diffusion_pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6723bacd3c60b11a2b4e6007338a54c6964c210116c3ccecb3bfc80e218afc8f
-size 334711857
+oid sha256:d7ba0d96a27ca3a8621b034de4637211707a744265b1fec8b3c7718c42182340
+size 334707217
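
Putting the pieces together, an end-to-end usage sketch for the uploaded v1-3-0 weights; the repo id, prompt, and fp16 cast are illustrative, not prescribed by this commit:

```python
import torch
from diffusers import StableDiffusionPipeline

pipe = StableDiffusionPipeline.from_pretrained(
    "path/to/this-repo",        # placeholder repo id
    torch_dtype=torch.float16,  # weights ship in fp32; cast on load
    safety_checker=None,
).to("cuda")

# Danbooru-style tags are the usual prompt format for waifu-diffusion;
# this prompt is only an example.
image = pipe("1girl, solo, upper body", num_inference_steps=30).images[0]
image.save("sample.png")
```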