{ "export_time": "2025-10-13_11-29-14", "trainer_cfg": { "batch_size": 1, "grad_accum_steps": 8, "num_workers": 2, "lr": 2e-05, "weight_decay": 0.01, "max_epochs": 6, "max_grad_norm": 1.0, "warmup_ratio": 0.1, "log_every": 5, "save_dir": "./checkpoints_pt", "resume_path": null, "max_seq_len": 1792, "left_ctx": 768, "max_vis_tokens": 64, "image_token_id": 151643, "PAD_ID": 0, "LABEL_PAD": -100, "label_smoothing": 0.1, "train_frames_min": 8, "train_frames_max": 14, "lr_lm": 5e-06, "lr_vision": 0.0001, "lr_connector": 0.0002, "weight_decay_lm": 0.01, "weight_decay_vision": 0.05, "weight_decay_connector": 0.05 }, "model_class": "InternVLChatModel", "device": "cuda:0", "notes": "Weights saved after training; if you used a monkey-patched forward at train time, weights remain standard." }