brthor committed on
Commit
6157ab6
·
verified ·
1 Parent(s): 5329dbc

Upload full trainer checkpoint step=2346 (profile=llama3_2_1b_base_grpo, run_type=grpo)

Browse files
meta-llama__llama-3.2-1b/grpo/checkpoints/checkpoint-2346/adapter_config.json CHANGED
@@ -33,12 +33,12 @@
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
 
 
36
  "up_proj",
37
  "q_proj",
38
  "down_proj",
39
- "v_proj",
40
  "k_proj",
41
- "o_proj",
42
  "gate_proj"
43
  ],
44
  "target_parameters": null,
 
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
36
+ "o_proj",
37
+ "v_proj",
38
  "up_proj",
39
  "q_proj",
40
  "down_proj",
 
41
  "k_proj",
 
42
  "gate_proj"
43
  ],
44
  "target_parameters": null,
meta-llama__llama-3.2-1b/grpo/checkpoints/checkpoint-2346/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b3b251df1e70f60b48ed1acf9f74378d0ddd5d4ce229862281c91491d087d95
3
  size 23162187
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8f468d303b34eabf914eb939d7070479731c87ac477acbe15ddefe512bd2e77
3
  size 23162187
meta-llama__llama-3.2-1b/grpo/checkpoints/checkpoint-2346/resume_sft_best/adapter_config.json CHANGED
@@ -33,13 +33,13 @@
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
36
- "up_proj",
37
- "q_proj",
38
  "down_proj",
39
- "v_proj",
 
40
  "k_proj",
41
- "o_proj",
42
- "gate_proj"
43
  ],
44
  "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
 
33
  "rank_pattern": {},
34
  "revision": null,
35
  "target_modules": [
36
+ "o_proj",
37
+ "gate_proj",
38
  "down_proj",
39
+ "q_proj",
40
+ "up_proj",
41
  "k_proj",
42
+ "v_proj"
 
43
  ],
44
  "target_parameters": null,
45
  "task_type": "CAUSAL_LM",
meta-llama__llama-3.2-1b/grpo/checkpoints/checkpoint-2346/resume_sft_best/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d5cf25674e9f6fd7b207688fd6ad6c3bb8743e9a4322fa74c2404c9361bbc82b
3
  size 45118424
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a596f5e9254286640cef01c4ff2d94b2b26e47ace5a3a66bd0ce614ea45945d
3
  size 45118424
meta-llama__llama-3.2-1b/grpo/checkpoints/checkpoint-2346/trainer_state.json CHANGED
The diff for this file is too large to render. See raw diff
 
meta-llama__llama-3.2-1b/grpo/run_manifest.json CHANGED
@@ -9,17 +9,23 @@
9
  "best_metric_value": 0.012881267607927434,
10
  "best_step": 1173,
11
  "best_checkpoint_step": 1173,
12
- "latest_checkpoint_step": 1173,
13
  "checkpoints": [
14
  {
15
  "step": 1173,
16
  "epoch": 0.00625053286725211,
17
  "repo_path": "meta-llama__llama-3.2-1b/grpo/checkpoints/checkpoint-1173",
18
  "timestamp": "2026-04-08T21:07:07.041384+00:00"
 
 
 
 
 
 
19
  }
20
  ],
21
  "epoch_artifacts": [],
22
  "resume_history": [],
23
  "created_at": "2026-04-08T20:52:57.531787+00:00",
24
- "updated_at": "2026-04-08T21:07:07.041401+00:00"
25
  }
 
9
  "best_metric_value": 0.012881267607927434,
10
  "best_step": 1173,
11
  "best_checkpoint_step": 1173,
12
+ "latest_checkpoint_step": 2346,
13
  "checkpoints": [
14
  {
15
  "step": 1173,
16
  "epoch": 0.00625053286725211,
17
  "repo_path": "meta-llama__llama-3.2-1b/grpo/checkpoints/checkpoint-1173",
18
  "timestamp": "2026-04-08T21:07:07.041384+00:00"
19
+ },
20
+ {
21
+ "step": 2346,
22
+ "epoch": 0.01250106573450422,
23
+ "repo_path": "meta-llama__llama-3.2-1b/grpo/checkpoints/checkpoint-2346",
24
+ "timestamp": "2026-04-08T21:18:34.568372+00:00"
25
  }
26
  ],
27
  "epoch_artifacts": [],
28
  "resume_history": [],
29
  "created_at": "2026-04-08T20:52:57.531787+00:00",
30
+ "updated_at": "2026-04-08T21:18:34.568388+00:00"
31
  }