{
  "OUTPUT_DIR": "OUTPUT/",
  "WORKERS": 6,
  "PRINT_FREQ": 500,
  "AMP": {
    "ENABLED": true
  },
  "MODEL": {
    "NAME": "cls_cvt",
    "SPEC": {
      "INIT": "trunc_norm",
      "NUM_STAGES": 3,
      "PATCH_SIZE": [7, 3, 3],
      "PATCH_STRIDE": [4, 2, 2],
      "PATCH_PADDING": [2, 1, 1],
      "DIM_EMBED": [64, 192, 384],
      "NUM_HEADS": [1, 3, 6],
      "DEPTH": [1, 2, 10],
      "MLP_RATIO": [4.0, 4.0, 4.0],
      "ATTN_DROP_RATE": [0.0, 0.0, 0.0],
      "DROP_RATE": [0.0, 0.0, 0.0],
      "DROP_PATH_RATE": [0.0, 0.0, 0.1],
      "QKV_BIAS": [true, true, true],
      "CLS_TOKEN": [false, false, true],
      "POS_EMBED": [false, false, false],
      "QKV_PROJ_METHOD": ["dw_bn", "dw_bn", "dw_bn"],
      "KERNEL_QKV": [3, 3, 3],
      "PADDING_KV": [1, 1, 1],
      "STRIDE_KV": [2, 2, 2],
      "PADDING_Q": [1, 1, 1],
      "STRIDE_Q": [1, 1, 1]
    }
  },
  "AUG": {
    "MIXUP_PROB": 1.0,
    "MIXUP": 0.8,
    "MIXCUT": 1.0,
    "TIMM_AUG": {
      "USE_LOADER": true,
      "RE_COUNT": 1,
      "RE_MODE": "pixel",
      "RE_SPLIT": false,
      "RE_PROB": 0.25,
      "AUTO_AUGMENT": "rand-m9-mstd0.5-inc1",
      "HFLIP": 0.5,
      "VFLIP": 0.0,
      "COLOR_JITTER": 0.4,
      "INTERPOLATION": "bicubic"
    }
  },
  "LOSS": {
    "LABEL_SMOOTHING": 0.1
  },
  "CUDNN": {
    "BENCHMARK": true,
    "DETERMINISTIC": false,
    "ENABLED": true
  },
  "DATASET": {
    "DATASET": "imagenet",
    "DATA_FORMAT": "jpg",
    "ROOT": "DATASET/imagenet/",
    "TEST_SET": "val",
    "TRAIN_SET": "train"
  },
  "TEST": {
    "BATCH_SIZE_PER_GPU": 32,
    "IMAGE_SIZE": [224, 224],
    "MODEL_FILE": "",
    "INTERPOLATION": 3
  },
  "TRAIN": {
    "BATCH_SIZE_PER_GPU": 256,
    "LR": 0.00025,
    "IMAGE_SIZE": [224, 224],
    "BEGIN_EPOCH": 0,
    "END_EPOCH": 300,
    "LR_SCHEDULER": {
      "METHOD": "timm",
      "ARGS": {
        "sched": "cosine",
        "warmup_epochs": 5,
        "warmup_lr": 0.000001,
        "min_lr": 0.00001,
        "cooldown_epochs": 10,
        "decay_rate": 0.1
      }
    },
    "OPTIMIZER": "adamW",
    "WD": 0.05,
    "WITHOUT_WD_LIST": ["bn", "bias", "ln"],
    "SHUFFLE": true
  },
  "DEBUG": {
    "DEBUG": false
  }
}