SamMikaelson committed on
Commit
049e119
·
verified ·
1 Parent(s): 10070a0

Upload folder using huggingface_hub

Browse files
adapter_config.json CHANGED
@@ -29,12 +29,12 @@
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
32
- "gate_proj",
33
  "down_proj",
34
- "q_proj",
35
  "up_proj",
 
36
  "v_proj",
37
  "o_proj",
 
38
  "k_proj"
39
  ],
40
  "task_type": "CAUSAL_LM",
 
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
 
32
  "down_proj",
 
33
  "up_proj",
34
+ "gate_proj",
35
  "v_proj",
36
  "o_proj",
37
+ "q_proj",
38
  "k_proj"
39
  ],
40
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dc030f8ea10c352e5747a54fd6bd60b5d61c279d752fe38e1d75aff90472319b
3
  size 264308896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c5fe9cd11eab35635b3e40afb66399670464aeb435423f4a450cca4a4ac3626a
3
  size 264308896
optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d85ab20dfbad778fc5a15fb52e139c37b62533714841cd3769c9b18976e264a9
3
- size 134777605
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c19907c05be97657db095ba64e710f3f3f486bd1ed0860b1bbd6662d2b1e5b1e
3
+ size 136089395
rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ebac56874dd3cee39433ddfeb334df4a599430bfff17402cb47ea22a559fee9f
3
  size 14645
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b144eceedfa2101476447173dfe3d346a36b7516fd4322dfd02b73b27d9b2310
3
  size 14645
scaler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f573b9f7149922ed73a27c9028f6f2cbdca1c0ef23c998ef777ef3be95e566d
3
  size 1383
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4fee0874fa9afae54661807fadac685c3d3f843473b6af99cc43d812ec6e1b36
3
  size 1383
scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:078542fd99723b70b4d1288e198aa1c9b9788cf33584a5b08ffba1fd602d7f84
3
  size 1465
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c1b3d3a192c565272886289c8e8ac137d3c10918ed8d56d761a18da40f9c741
3
  size 1465
trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.0006876633200385092,
6
  "eval_steps": 500,
7
- "global_step": 10,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -36,11 +36,39 @@
36
  "rewards/match_format_exactly/mean": 1.0,
37
  "rewards/match_format_exactly/std": 0.0,
38
  "step": 10
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
39
  }
40
  ],
41
  "logging_steps": 10,
42
- "max_steps": 60,
43
- "num_input_tokens_seen": 26778,
44
  "num_train_epochs": 1,
45
  "save_steps": 10,
46
  "stateful_callbacks": {
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.0013753266400770184,
6
  "eval_steps": 500,
7
+ "global_step": 20,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
36
  "rewards/match_format_exactly/mean": 1.0,
37
  "rewards/match_format_exactly/std": 0.0,
38
  "step": 10
39
+ },
40
+ {
41
+ "completion_length": 334.6,
42
+ "completions/clipped_ratio": 0.025,
43
+ "completions/max_length": 824.9,
44
+ "completions/max_terminated_length": 713.2,
45
+ "completions/mean_length": 334.6,
46
+ "completions/mean_terminated_length": 299.05833435058594,
47
+ "completions/min_length": 50.2,
48
+ "completions/min_terminated_length": 50.2,
49
+ "epoch": 0.0013753266400770184,
50
+ "frac_reward_zero_std": 0.1,
51
+ "grad_norm": 5.82886266708374,
52
+ "kl": 1.5751606613397597,
53
+ "learning_rate": 2.3750000000000003e-07,
54
+ "loss": 0.0016,
55
+ "num_tokens": 51474.0,
56
+ "reward": 4.4375,
57
+ "reward_std": 0.4622055947780609,
58
+ "rewards/check_coherence/mean": 0.4875,
59
+ "rewards/check_coherence/std": 0.33231321573257444,
60
+ "rewards/check_response_quality/mean": 2.2125,
61
+ "rewards/check_response_quality/std": 0.2633414089679718,
62
+ "rewards/match_format_approximately/mean": 0.7375,
63
+ "rewards/match_format_approximately/std": 0.21933756470680238,
64
+ "rewards/match_format_exactly/mean": 1.0,
65
+ "rewards/match_format_exactly/std": 0.0,
66
+ "step": 20
67
  }
68
  ],
69
  "logging_steps": 10,
70
+ "max_steps": 4000,
71
+ "num_input_tokens_seen": 51474,
72
  "num_train_epochs": 1,
73
  "save_steps": 10,
74
  "stateful_callbacks": {
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a6e31b6545879cafd72186cf6ce7bab37b7f1b65d30aec6986b01692da80961c
3
  size 7313
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89640938646618221e1b1ed739226e1b8be20971bb4a902cd531ba9b4399d32e
3
  size 7313