Commit
·
edc2c09
1
Parent(s):
cdb1970
Upload decoder/3B_fp16/decoder_config.json with huggingface_hub
Browse files
decoder/3B_fp16/decoder_config.json
CHANGED
|
@@ -18,6 +18,10 @@
|
|
| 18 |
"memory_efficient": true
|
| 19 |
}
|
| 20 |
],
|
|
|
|
|
|
|
|
|
|
|
|
|
| 21 |
"image_sizes": [64],
|
| 22 |
"channels": 3,
|
| 23 |
"timesteps": 1000,
|
|
@@ -26,13 +30,12 @@
|
|
| 26 |
"learned_variance": false
|
| 27 |
},
|
| 28 |
"data": {
|
| 29 |
-
"webdataset_base_url": "pipe:aws s3 cp --quiet s3://s-datasets/
|
| 30 |
-
"img_embeddings_url": "s3://s-datasets/laion-aesthetic/ordered_embeddings/",
|
| 31 |
"num_workers": 6,
|
| 32 |
"batch_size": 40,
|
| 33 |
"start_shard": 0,
|
| 34 |
-
"end_shard":
|
| 35 |
-
"shard_width":
|
| 36 |
"index_width": 4,
|
| 37 |
"splits": {
|
| 38 |
"train": 0.75,
|
|
@@ -77,15 +80,15 @@
|
|
| 77 |
}
|
| 78 |
},
|
| 79 |
"tracker": {
|
| 80 |
-
"data_path": "/fsx/aidan/new/multinode/experiments/
|
| 81 |
"overwrite_data_path": true,
|
| 82 |
|
| 83 |
"log": {
|
| 84 |
-
"log_type": "
|
| 85 |
|
| 86 |
"wandb_entity": "Veldrovive",
|
| 87 |
"wandb_project": "dalle2_train_decoder",
|
| 88 |
-
"wandb_run_name": "3B deepspeed fp16",
|
| 89 |
|
| 90 |
"auto_resume": true,
|
| 91 |
"verbose": true
|
|
@@ -94,7 +97,7 @@
|
|
| 94 |
"load": {
|
| 95 |
"load_from": "local",
|
| 96 |
"only_auto_resume": true,
|
| 97 |
-
"file_path": "/fsx/aidan/new/multinode/experiments/
|
| 98 |
},
|
| 99 |
|
| 100 |
"save": [{
|
|
@@ -114,7 +117,7 @@
|
|
| 114 |
"save_type": "checkpoint"
|
| 115 |
},{
|
| 116 |
"save_to": "local",
|
| 117 |
-
"save_latest_to": "/fsx/aidan/new/multinode/experiments/
|
| 118 |
|
| 119 |
"save_type": "checkpoint"
|
| 120 |
}]
|
|
|
|
| 18 |
"memory_efficient": true
|
| 19 |
}
|
| 20 |
],
|
| 21 |
+
"clip": {
|
| 22 |
+
"make": "openai",
|
| 23 |
+
"model": "ViT-L/14"
|
| 24 |
+
},
|
| 25 |
"image_sizes": [64],
|
| 26 |
"channels": 3,
|
| 27 |
"timesteps": 1000,
|
|
|
|
| 30 |
"learned_variance": false
|
| 31 |
},
|
| 32 |
"data": {
|
| 33 |
+
"webdataset_base_url": "pipe:aws s3 cp --quiet s3://s-datasets/laion5b/laion2B-data/{}.tar -",
|
|
|
|
| 34 |
"num_workers": 6,
|
| 35 |
"batch_size": 40,
|
| 36 |
"start_shard": 0,
|
| 37 |
+
"end_shard": 231349,
|
| 38 |
+
"shard_width": 6,
|
| 39 |
"index_width": 4,
|
| 40 |
"splits": {
|
| 41 |
"train": 0.75,
|
|
|
|
| 80 |
}
|
| 81 |
},
|
| 82 |
"tracker": {
|
| 83 |
+
"data_path": "/fsx/aidan/new/multinode/experiments/deepspeed_fp16_2b/.tracker-data",
|
| 84 |
"overwrite_data_path": true,
|
| 85 |
|
| 86 |
"log": {
|
| 87 |
+
"log_type": "console",
|
| 88 |
|
| 89 |
"wandb_entity": "Veldrovive",
|
| 90 |
"wandb_project": "dalle2_train_decoder",
|
| 91 |
+
"wandb_run_name": "3B deepspeed fp16 2B",
|
| 92 |
|
| 93 |
"auto_resume": true,
|
| 94 |
"verbose": true
|
|
|
|
| 97 |
"load": {
|
| 98 |
"load_from": "local",
|
| 99 |
"only_auto_resume": true,
|
| 100 |
+
"file_path": "/fsx/aidan/new/multinode/experiments/deepspeed_fp16_2b/models/checkpoints/latest.pth"
|
| 101 |
},
|
| 102 |
|
| 103 |
"save": [{
|
|
|
|
| 117 |
"save_type": "checkpoint"
|
| 118 |
},{
|
| 119 |
"save_to": "local",
|
| 120 |
+
"save_latest_to": "/fsx/aidan/new/multinode/experiments/deepspeed_fp16_2b/models/checkpoints/latest.pth",
|
| 121 |
|
| 122 |
"save_type": "checkpoint"
|
| 123 |
}]
|