{
"architectures": [
"InternVLOVDForDetection"
],
"batch_size": 4,
"coco_root": "/workspace/common/coco/",
"cost_bbox": 5.0,
"cost_class": 0.0,
"cost_giou": 2.0,
"dataset_type": "coco+refcocoplus",
"device": "cuda",
"device_map": "cuda",
"dim_feedforward": 1024,
"dropout": 0.0,
"dtype": "bfloat16",
"eos_coef": 0.1,
"eval_on_train": true,
"focal_alpha": 0.75,
"focal_gamma": 2.0,
"freeze_backbone": true,
"gradient_accumulation_steps": 4,
"head_type": "small",
"hidden_size": 1024,
"input_size": 448,
"log_every": 50,
"loss_bbox": 5.0,
"loss_cls": 0.0,
"loss_giou": 2.0,
"loss_mode": "hungarian",
"lr": 0.0001,
"lr_scheduler": "cosine",
"max_grad_norm": 0.1,
"max_instances": 100,
"max_num_patches": 12,
"model_type": "internvl_ovd",
"nhead": 8,
"num_decoder_layers": 2,
"num_epochs": 50,
"num_queries": 1,
"num_workers": 4,
"refcoco_train_max_samples": null,
"refcoco_train_split": "val",
"refcoco_val_max_samples": 128,
"refcoco_val_split": "testB",
"resume_from": null,
"save_dir": "./checkpoints/multi_label_model2",
"save_every_steps": 1000,
"save_total_limit": 2,
"seed": 42,
"token_fpn_include_text": true,
"token_fpn_levels": [
16,
8,
4,
2
],
"train_ann_file": "/workspace/common/coco//annotations/instances_train2017.json",
"train_eval_max_samples": 128,
"train_eval_ratio": 0.001,
"train_img_dir": "/workspace/common/coco//train2017",
"transformers_version": "4.57.5",
"use_focal_loss": false,
"use_token_fpn": false,
"use_wandb": true,
"val_ann_file": "/workspace/common/coco//annotations/instances_val2017.json",
"val_every_steps": 1000,
"val_img_dir": "/workspace/common/coco//val2017",
"vlm_model_name": "OpenGVLab/InternVL3_5-1B",
"wandb_project": "internvl-ovd",
"wandb_run_name": "0114_multi_label_model2",
"warmup_epochs": 1.0,
"weight_decay": 0.0001,
"auto_map": {
"AutoConfig": "configuration_internvl_ovd.InternVLOVDConfig",
"AutoModel": "modeling_internvl_ovd.InternVLOVDForDetection"
}
}