{
  "model": "vitamin_large",
  "exp_name": "meditok_s2_clipv01",
  "output_dir": "meditok/outputs/ckpts/meditok_s2_clipv01",
  "resume_from": "",
  "resume_net_only": false,
  "lpips_path": "external/lpips_with_vgg.pth",
  "dino_path": "external/dinov2_vits14_pretrain.pth",
  "fid_eval_src": "",
  "fid_eval_dst": "",
  "vis_img_dir": "assets/vis_imgs/",
  "fid_feature_extractor": "external/weights-inception-2015-12-05-6726825d.pth",
  "clip_pretrain_path": "",
  "fp16": false,
  "bf16": true,
  "tf32": true,
  "compile_model": false,
  "ddp_static": false,
  "grad_ckpt": true,
  "grad_accu": 1,
  "train_data": "meditok/datasets/meta/meta2d_train.csv",
  "val_data": null,
  "train_root": "datasets/medical_preprocessed",
  "val_root": null,
  "dataset_type": "csvimg",
  "csv_img_key": "identifier",
  "csv_caption_key": "caption",
  "csv_separator": ",",
  "subset_ratio": 1.0,
  "img_size": 256,
  "resize_ratio": 1.125,
  "workers": 8,
  "train_num_samples": null,
  "train_data_upsampling_factors": null,
  "val_num_samples": null,
  "dataset_resampled": false,
  "use_aug": false,
  "prob_flip": 0.5,
  "prob_rot": 0.5,
  "prob_grayscale": 0.5,
  "vocab_size": 32768,
  "vocab_width": 64,
  "vocab_norm": true,
  "vq_beta": 0.25,
  "num_codebooks": 8,
  "quant_proj": "attn",
  "embed_dim": 768,
  "num_query": 0,
  "use_clip_pretrain": false,
  "patch_size": 16,
  "drop_path": 0.5,
  "text_width": 768,
  "text_heads": 12,
  "text_layers": 12,
  "text_vocab_size": 49408,
  "text_context_length": 77,
  "local_loss": true,
  "gather_with_grad": true,
  "pretrained_clip": null,
  "pretrained_clip_text": null,
  "lock_text": true,
  "force_custom_text": false,
  "force_custom_vision": false,
  "dino_depth": 12,
  "dino_kernel_size": 9,
  "disc_norm": "gn",
  "disc_aug_prob": 1.0,
  "disc_specnorm": false,
  "step_disc_every": 1,
  "vae_init": -0.5,
  "vocab_init": -1,
  "disc_init": -0.5,
  "epoch": 2,
  "local_bs": 512,
  "global_bs": 1,
  "lr": 0.0005,
  "wd": 0.02,
  "disc_lr": 2e-05,
  "disc_wd": 0.2,
  "grad_clip": 10,
  "ema": 0.9999,
  "warmup_iter": null,
  "warmup_ep": 0.01,
  "disc_start_ep": 0.375,
  "disc_warmup_ep": 0.03,
  "schedule": "cos",
  "lr_start_ratio": 0.0,
  "lr_end_ratio": 0.5,
  "disc_lr_end_ratio": 0.5,
  "custom_lr_multiplier": null,
  "optimizer": "adamw",
  "optim_eps": 1e-06,
  "fuse_opt": false,
  "optim_beta": "0.9_0.95",
  "disc_optim_beta": "0.5_0.9",
  "l1": 0.2,
  "l2": 1.0,
  "lp": 1.0,
  "lpr": 48,
  "ld": 0.4,
  "le": 0.0,
  "lq": 1.0,
  "lc": 1.0,
  "lcos": 0.0,
  "e_temp": 0.01,
  "gada": 1,
  "bcr": 4.0,
  "bcr_cut": 0.2,
  "dcrit": "hg",
  "report_wandb": false,
  "wandb_notes": null,
  "run_id": null,
  "eval_per_epoch": 10,
  "dbg_unused_param": false,
  "dbg_nan": false,
  "seed": null,
  "deterministic": false,
  "use_biomedclip": true,
  "vision_as_text": false,
  "ignore_text_params": true,
  "ct_bias": 1024,
  "freeze_logit_scale": false,
  "pretrained_core_path": null
}