Kate-03 committed on
Commit
41ec022
·
verified ·
1 Parent(s): 4efbcd1

Upload trained model export (2025-10-13_10-15-42)

Browse files
README.md CHANGED
@@ -9,7 +9,7 @@ tags:
9
 
10
  # InterVL-HW1
11
 
12
- Trained and exported on 2025-10-13_09-20-38.
13
 
14
  - Backbone: InternVLChatModel
15
  - AMP dtype: bfloat16
 
9
 
10
  # InterVL-HW1
11
 
12
+ Trained and exported on 2025-10-13_10-15-42.
13
 
14
  - Backbone: InternVLChatModel
15
  - AMP dtype: bfloat16
checkpoints/ckpt_epoch0_step0_2025-10-13_10-15-42.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:545b66a066f8aa1a4c44ee42126d699c97935194fcd157ffe7f0d0e90bcba763
3
+ size 6366330923
checkpoints/latest.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8d346a2d4671049d03732054ae541b214845aca809d199588559a045c133f41
3
- size 6366333559
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:545b66a066f8aa1a4c44ee42126d699c97935194fcd157ffe7f0d0e90bcba763
3
+ size 6366330923
meta.json CHANGED
@@ -1,23 +1,32 @@
1
  {
2
- "export_time": "2025-10-13_09-20-38",
3
  "trainer_cfg": {
4
  "batch_size": 1,
5
- "grad_accum_steps": 4,
6
  "num_workers": 2,
7
  "lr": 2e-05,
8
  "weight_decay": 0.01,
9
  "max_epochs": 3,
10
  "max_grad_norm": 1.0,
11
- "warmup_ratio": 0.03,
12
  "log_every": 5,
13
  "save_dir": "./checkpoints_pt",
14
  "resume_path": null,
15
- "max_seq_len": 2048,
16
- "left_ctx": 512,
17
- "max_vis_tokens": 32,
18
  "image_token_id": 151643,
19
  "PAD_ID": 0,
20
- "LABEL_PAD": -100
 
 
 
 
 
 
 
 
 
21
  },
22
  "model_class": "InternVLChatModel",
23
  "device": "cuda:0",
 
1
  {
2
+ "export_time": "2025-10-13_10-15-42",
3
  "trainer_cfg": {
4
  "batch_size": 1,
5
+ "grad_accum_steps": 8,
6
  "num_workers": 2,
7
  "lr": 2e-05,
8
  "weight_decay": 0.01,
9
  "max_epochs": 3,
10
  "max_grad_norm": 1.0,
11
+ "warmup_ratio": 0.1,
12
  "log_every": 5,
13
  "save_dir": "./checkpoints_pt",
14
  "resume_path": null,
15
+ "max_seq_len": 1792,
16
+ "left_ctx": 768,
17
+ "max_vis_tokens": 64,
18
  "image_token_id": 151643,
19
  "PAD_ID": 0,
20
+ "LABEL_PAD": -100,
21
+ "label_smoothing": 0.1,
22
+ "train_frames_min": 8,
23
+ "train_frames_max": 14,
24
+ "lr_lm": 5e-06,
25
+ "lr_vision": 0.0001,
26
+ "lr_connector": 0.0002,
27
+ "weight_decay_lm": 0.01,
28
+ "weight_decay_vision": 0.05,
29
+ "weight_decay_connector": 0.05
30
  },
31
  "model_class": "InternVLChatModel",
32
  "device": "cuda:0",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f02769347c69ad9319b002c7a9559750b404ec4606980fd0d2ea7ad48d41003d
3
  size 2121885120
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62627ee00a36ab893cf2173e77559795db932fae169d3c9993e49426a6dea5d2
3
  size 2121885120