Veldrovive
committed on
Commit
•
edc2c09
1
Parent(s):
cdb1970
Upload decoder/3B_fp16/decoder_config.json with huggingface_hub
Browse files
decoder/3B_fp16/decoder_config.json
CHANGED
@@ -18,6 +18,10 @@
|
|
18 |
"memory_efficient": true
|
19 |
}
|
20 |
],
|
|
|
|
|
|
|
|
|
21 |
"image_sizes": [64],
|
22 |
"channels": 3,
|
23 |
"timesteps": 1000,
|
@@ -26,13 +30,12 @@
|
|
26 |
"learned_variance": false
|
27 |
},
|
28 |
"data": {
|
29 |
-
"webdataset_base_url": "pipe:aws s3 cp --quiet s3://s-datasets/
|
30 |
-
"img_embeddings_url": "s3://s-datasets/laion-aesthetic/ordered_embeddings/",
|
31 |
"num_workers": 6,
|
32 |
"batch_size": 40,
|
33 |
"start_shard": 0,
|
34 |
-
"end_shard":
|
35 |
-
"shard_width":
|
36 |
"index_width": 4,
|
37 |
"splits": {
|
38 |
"train": 0.75,
|
@@ -77,15 +80,15 @@
|
|
77 |
}
|
78 |
},
|
79 |
"tracker": {
|
80 |
-
"data_path": "/fsx/aidan/new/multinode/experiments/
|
81 |
"overwrite_data_path": true,
|
82 |
|
83 |
"log": {
|
84 |
-
"log_type": "
|
85 |
|
86 |
"wandb_entity": "Veldrovive",
|
87 |
"wandb_project": "dalle2_train_decoder",
|
88 |
-
"wandb_run_name": "3B deepspeed fp16",
|
89 |
|
90 |
"auto_resume": true,
|
91 |
"verbose": true
|
@@ -94,7 +97,7 @@
|
|
94 |
"load": {
|
95 |
"load_from": "local",
|
96 |
"only_auto_resume": true,
|
97 |
-
"file_path": "/fsx/aidan/new/multinode/experiments/
|
98 |
},
|
99 |
|
100 |
"save": [{
|
@@ -114,7 +117,7 @@
|
|
114 |
"save_type": "checkpoint"
|
115 |
},{
|
116 |
"save_to": "local",
|
117 |
-
"save_latest_to": "/fsx/aidan/new/multinode/experiments/
|
118 |
|
119 |
"save_type": "checkpoint"
|
120 |
}]
|
|
|
18 |
"memory_efficient": true
|
19 |
}
|
20 |
],
|
21 |
+
"clip": {
|
22 |
+
"make": "openai",
|
23 |
+
"model": "ViT-L/14"
|
24 |
+
},
|
25 |
"image_sizes": [64],
|
26 |
"channels": 3,
|
27 |
"timesteps": 1000,
|
|
|
30 |
"learned_variance": false
|
31 |
},
|
32 |
"data": {
|
33 |
+
"webdataset_base_url": "pipe:aws s3 cp --quiet s3://s-datasets/laion5b/laion2B-data/{}.tar -",
|
|
|
34 |
"num_workers": 6,
|
35 |
"batch_size": 40,
|
36 |
"start_shard": 0,
|
37 |
+
"end_shard": 231349,
|
38 |
+
"shard_width": 6,
|
39 |
"index_width": 4,
|
40 |
"splits": {
|
41 |
"train": 0.75,
|
|
|
80 |
}
|
81 |
},
|
82 |
"tracker": {
|
83 |
+
"data_path": "/fsx/aidan/new/multinode/experiments/deepspeed_fp16_2b/.tracker-data",
|
84 |
"overwrite_data_path": true,
|
85 |
|
86 |
"log": {
|
87 |
+
"log_type": "console",
|
88 |
|
89 |
"wandb_entity": "Veldrovive",
|
90 |
"wandb_project": "dalle2_train_decoder",
|
91 |
+
"wandb_run_name": "3B deepspeed fp16 2B",
|
92 |
|
93 |
"auto_resume": true,
|
94 |
"verbose": true
|
|
|
97 |
"load": {
|
98 |
"load_from": "local",
|
99 |
"only_auto_resume": true,
|
100 |
+
"file_path": "/fsx/aidan/new/multinode/experiments/deepspeed_fp16_2b/models/checkpoints/latest.pth"
|
101 |
},
|
102 |
|
103 |
"save": [{
|
|
|
117 |
"save_type": "checkpoint"
|
118 |
},{
|
119 |
"save_to": "local",
|
120 |
+
"save_latest_to": "/fsx/aidan/new/multinode/experiments/deepspeed_fp16_2b/models/checkpoints/latest.pth",
|
121 |
|
122 |
"save_type": "checkpoint"
|
123 |
}]
|