InterVL-HW1 / meta.json
Kate-03's picture
Upload trained model export (2025-10-13_11-29-14)
6500eee verified
{
"export_time": "2025-10-13_11-29-14",
"trainer_cfg": {
"batch_size": 1,
"grad_accum_steps": 8,
"num_workers": 2,
"lr": 2e-05,
"weight_decay": 0.01,
"max_epochs": 6,
"max_grad_norm": 1.0,
"warmup_ratio": 0.1,
"log_every": 5,
"save_dir": "./checkpoints_pt",
"resume_path": null,
"max_seq_len": 1792,
"left_ctx": 768,
"max_vis_tokens": 64,
"image_token_id": 151643,
"PAD_ID": 0,
"LABEL_PAD": -100,
"label_smoothing": 0.1,
"train_frames_min": 8,
"train_frames_max": 14,
"lr_lm": 5e-06,
"lr_vision": 0.0001,
"lr_connector": 0.0002,
"weight_decay_lm": 0.01,
"weight_decay_vision": 0.05,
"weight_decay_connector": 0.05
},
"model_class": "InternVLChatModel",
"device": "cuda:0",
"notes": "Weights were saved after training. If a monkey-patched forward was used at train time, the saved weights are unaffected and remain standard."
}