| |
| |
| |
|
|
|
|
| TASK: UniCLTask |
|
|
| NAME: 'Example Eval Configuration' |
| SAVE_TIMER_LOG: true |
|
|
| |
| SAVE_DIR: '' |
| LOG_EVERY: 10 |
| LOGLEVEL_OVERRIDE: INFO |
| LOG_GPU_MEM: true |
| RESUME: False |
| RESET_DATA_LOADER: false |
|
|
| FP16: true |
| ZERO_STAGE: 0 |
| DEEPSPEED: false |
| |
| AMP: PYTORCH |
| |
| |
| |
|
|
| FIND_UNUSED_PARAMETERS: false |
|
|
| SAVE_PER_OPTIM_STEPS: 500 |
| EVAL_PER_OPTIM_STEPS: 250 |
| EVAL_AT_START: False |
| |
| |
|
|
| NO_AUTO_LR_SCALING: true |
| GRAD_CLIPPING: 1.0 |
|
|
| SET_SAMPLER_EPOCH: true |
|
|
| DONT_LOAD_MODEL: true |
|
|
| user_dir: "./MainzVision" |
|
|
| |
| |
| |
|
|
|
|
|
|
| VERBOSE: true |
| WORKERS: 6 |
| PIN_MEMORY: true |
| IMAGE_ENCODER: |
| NAME: davit_v1 |
| NUM_CLASSES: 0 |
| |
| IMAGE_SIZE: [480, 480] |
| LOAD_PRETRAINED: true |
| PRETRAINED: '' |
| PRETRAINED_LAYERS: '*' |
| IMAGE_MEAN: [0.485, 0.456, 0.406] |
| IMAGE_STD: [0.229, 0.224, 0.225] |
| SPEC: |
| DROP_RATE: 0.1 |
| DROP_PATH_RATE: 0.2 |
| PATCH_SIZE: [7, 3, 3, 3] |
| PATCH_STRIDE: [4, 2, 2, 2] |
| PATCH_PADDING: [3, 1, 1, 1] |
| PATCH_PRENORM: [false, true, true, true] |
| DIM_EMBED: [256, 512, 1024, 2048] |
| NUM_HEADS: [8, 16, 32, 64] |
| NUM_GROUPS: [8, 16, 32, 64] |
| DEPTHS: [1, 1, 9, 1] |
| WINDOW_SIZE: 12 |
| ENABLE_CHECKPOINT: true |
|
|
| LANG_ENCODER: |
| NAME: transformer |
| LOAD_PRETRAINED: false |
| PRETRAINED: '' |
| PRETRAINED_LAYERS: '*' |
| TOKENIZER: clip |
| CONTEXT_LENGTH: 77 |
| WIDTH: 1024 |
| HEADS: 16 |
| LAYERS: 16 |
| AUTOGRESSIVE: false |
|
|
| UNICL_MODEL: |
| DIM_PROJECTION: 1024 |
| GATHER_TENSORS: true |
| LOAD_PRETRAINED: true |
|
|
| |
| PRETRAINED: '' |
|
|
| PRETRAINED_LAYERS: '*' |
|
|
| AUG: |
| MIXUP_PROB: 0.0 |
| MIXUP: 0.8 |
| MIXCUT: 1.0 |
| MIXCUT_MINMAX: [] |
| MIXUP_SWITCH_PROB: 0.5 |
| MIXUP_MODE: 'batch' |
| SCALE: [0.8, 1.0] |
| RATIO: [0.75, 1.3333333] |
| INTERPOLATION: 'bicubic' |
| TORCHVISION_AUG: |
| AUTO_AUGMENT: ta_wide |
| RE_PROB: 0.25 |
| HFLIP: 0.0 |
| VFLIP: 0.0 |
|
|
| LOSS: |
| LOSS: UniCL |
| DATASET: |
| DATASET: 'image_text_pairs_v2' |
| TEXT_FORMAT: 'json' |
| ROOT: '' |
| TRAIN_SET: 'mimic_cxr_v2-chestxray14-chexpertv4-irma2009_v2-rsnaboneage-mura-bingmedicalfewshot' |
| DATA_FORMAT: 'tsv' |
| SAMPLER: 'default' |
| LOADER: 'default' |
| TOKEN_FILE: '' |
| |
| |
| |
| |
| |
|
|
|
|
| |
| |
|
|
|
|
|
|
|
|
| EVALDATASET_LTCXR_S100_N100_TEXT_CLASSIFIER: |
| TEXT_FORMAT: json |
| FORMAT: 'zip' |
| SPLIT: 'NIH-CXR-LT' |
| ZIP_FILE: '' |
| ZIP_MAP_FILE: '' |
| LABEL_FILE: '' |
| IMAGE_TSV: '' |
| TEXT_TSV: '' |
| CWEIGHT_FILE: '' |
| ZS_MODE: 2 |
| ZS_WEIGHT: 1.0 |
| KNN: 100 |
| |
| |
|
|
|
|
|
|
|
|
| |
|
|
| ZEROSHOT_EVAL_DATASET: |
| FORMAT: 'zip' |
| SPLIT: 'NIH-CXR-LT' |
| ZIP_FILE: '' |
| ZIP_MAP_FILE: '' |
| LABEL_FILE: '' |
|
|
|
|
|
|
| EVALUATION_SPLITS: ['cls-zeroshot-eval'] |
| TEST: |
| BATCH_SIZE_PER_GPU: 8 |
| MODEL_FILE: '' |
| CENTER_CROP: false |
| TRAIN: |
| BATCH_SIZE_TOTAL: 1024 |
| BATCH_SIZE_PER_GPU: 16 |
|
|
| SHUFFLE: true |
|
|
| WEIGHT_SMOOTHING: |
| decay: 0.999 |
| use_cpu: False |
| eval_smoothed_weight: True |
|
|
| START_LEARNING_RATE: 0.00001 |
| |
| MAX_NUM_EPOCHS: 100 |
| OPTIMIZER: AdamW |
| OPTIMIZER_PARAMS: |
| weight_decay: 0.2 |
| CUSTOMIZED_PARAMS_CONF: |
| NO_WEIGHT_DECAY_MODULES: ['dw', 'norm'] |
| WEIGHT_DECAY_PATTERNS: |
| "\\.bias$": 0.0 |
| "logit_scale": 0.0 |
| "positional_embedding": 0.0 |
| "token_embedding": 0.0 |
|
|
|
|
|
|
| LR_SCHEDULER: TimmScheduler |
| LR_SCHEDULER_PARAMS: |
| sched: cosine |
| warmup_steps: 5 |
| warmup_lr: 0.000000001 |
| min_lr: 0.000000001 |
|
|
| |
| |
| GRADIENT_ACCUMULATE_STEP: -1 |
|
|