{
  "architectures": [
    "InternVLOVDForDetection"
  ],
  "batch_size": 4,
  "coco_root": "/workspace/common/coco/",
  "cost_bbox": 5.0,
  "cost_class": 0.0,
  "cost_giou": 2.0,
  "dataset_type": "coco+refcocoplus",
  "device": "cuda",
  "device_map": "cuda",
  "dim_feedforward": 1024,
  "dropout": 0.0,
  "dtype": "bfloat16",
  "eos_coef": 0.1,
  "eval_on_train": true,
  "focal_alpha": 0.75,
  "focal_gamma": 2.0,
  "freeze_backbone": true,
  "gradient_accumulation_steps": 4,
  "head_type": "small",
  "hidden_size": 1024,
  "input_size": 448,
  "log_every": 50,
  "loss_bbox": 5.0,
  "loss_cls": 0.0,
  "loss_giou": 2.0,
  "loss_mode": "hungarian",
  "lr": 0.0001,
  "lr_scheduler": "cosine",
  "max_grad_norm": 0.1,
  "max_instances": 100,
  "max_num_patches": 12,
  "model_type": "internvl_ovd",
  "nhead": 8,
  "num_decoder_layers": 2,
  "num_epochs": 50,
  "num_queries": 1,
  "num_workers": 4,
  "refcoco_train_max_samples": null,
  "refcoco_train_split": "val",
  "refcoco_val_max_samples": 128,
  "refcoco_val_split": "testB",
  "resume_from": null,
  "save_dir": "./checkpoints/multi_label_model2",
  "save_every_steps": 1000,
  "save_total_limit": 2,
  "seed": 42,
  "token_fpn_include_text": true,
  "token_fpn_levels": [
    16,
    8,
    4,
    2
  ],
  "train_ann_file": "/workspace/common/coco//annotations/instances_train2017.json",
  "train_eval_max_samples": 128,
  "train_eval_ratio": 0.001,
  "train_img_dir": "/workspace/common/coco//train2017",
  "transformers_version": "4.57.5",
  "use_focal_loss": false,
  "use_token_fpn": false,
  "use_wandb": true,
  "val_ann_file": "/workspace/common/coco//annotations/instances_val2017.json",
  "val_every_steps": 1000,
  "val_img_dir": "/workspace/common/coco//val2017",
  "vlm_model_name": "OpenGVLab/InternVL3_5-1B",
  "wandb_project": "internvl-ovd",
  "wandb_run_name": "0114_multi_label_model2",
  "warmup_epochs": 1.0,
  "weight_decay": 0.0001,
  "auto_map": {
    "AutoConfig": "configuration_internvl_ovd.InternVLOVDConfig",
    "AutoModel": "modeling_internvl_ovd.InternVLOVDForDetection"
  }
}
|