Jordansky committed on
Commit
482f215
·
verified ·
1 Parent(s): bc15116

Upload task output 1

Browse files
adapter_config.json CHANGED
@@ -29,13 +29,13 @@
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
32
- "k_proj",
33
- "o_proj",
34
- "gate_proj",
35
- "q_proj",
36
  "down_proj",
 
 
 
 
37
  "up_proj",
38
- "v_proj"
39
  ],
40
  "target_parameters": null,
41
  "task_type": "CAUSAL_LM",
 
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
 
 
 
 
32
  "down_proj",
33
+ "q_proj",
34
+ "o_proj",
35
+ "k_proj",
36
+ "v_proj",
37
  "up_proj",
38
+ "gate_proj"
39
  ],
40
  "target_parameters": null,
41
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a151743bd2bfcaf6c6bbd56130dcd1b3eac79f338662e0fb95fded1b41638bf7
3
  size 264308896
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a17ecb3d16c394d54ea010770d97d42fd277d6f9b82351d62fa408a79588633c
3
  size 264308896
trainer_state.json CHANGED
@@ -22,30 +22,30 @@
22
  "completions/mean_terminated_length": 2.90625,
23
  "completions/min_length": 2.0,
24
  "completions/min_terminated_length": 2.0,
25
- "entropy": 0.0580792877372005,
26
  "epoch": 2e-05,
27
- "frac_reward_zero_std": 0.375,
28
- "grad_norm": 0.007543689571321011,
29
  "kl": 0.0,
30
  "learning_rate": 0.0,
31
- "loss": 0.0,
32
- "num_tokens": 76760.0,
33
- "reward": -3.4157025814056396,
34
- "reward_std": 8.211202621459961,
35
- "rewards/rollout_reward_func/mean": -3.4157025814056396,
36
- "rewards/rollout_reward_func/std": 8.211202621459961,
37
- "sampling/importance_sampling_ratio/max": 1.0455573797225952,
38
- "sampling/importance_sampling_ratio/mean": 0.9704139232635498,
39
- "sampling/importance_sampling_ratio/min": 0.6538259983062744,
40
- "sampling/sampling_logp_difference/max": 0.42491185665130615,
41
- "sampling/sampling_logp_difference/mean": 0.017627999186515808,
42
  "step": 1,
43
- "step_time": 41.46402477799802
44
  }
45
  ],
46
  "logging_steps": 1.0,
47
  "max_steps": 100000,
48
- "num_input_tokens_seen": 76760,
49
  "num_train_epochs": 2,
50
  "save_steps": 500,
51
  "stateful_callbacks": {
 
22
  "completions/mean_terminated_length": 2.90625,
23
  "completions/min_length": 2.0,
24
  "completions/min_terminated_length": 2.0,
25
+ "entropy": 0.10359678417444229,
26
  "epoch": 2e-05,
27
+ "frac_reward_zero_std": 0.0,
28
+ "grad_norm": 0.01581481844186783,
29
  "kl": 0.0,
30
  "learning_rate": 0.0,
31
+ "loss": -0.0,
32
+ "num_tokens": 84936.0,
33
+ "reward": -0.5638285875320435,
34
+ "reward_std": 0.25014564394950867,
35
+ "rewards/rollout_reward_func/mean": -0.5638285875320435,
36
+ "rewards/rollout_reward_func/std": 0.25014564394950867,
37
+ "sampling/importance_sampling_ratio/max": 2.8205859661102295,
38
+ "sampling/importance_sampling_ratio/mean": 1.0278419256210327,
39
+ "sampling/importance_sampling_ratio/min": 0.6058012843132019,
40
+ "sampling/sampling_logp_difference/max": 1.0369436740875244,
41
+ "sampling/sampling_logp_difference/mean": 0.032973386347293854,
42
  "step": 1,
43
+ "step_time": 46.24527741299971
44
  }
45
  ],
46
  "logging_steps": 1.0,
47
  "max_steps": 100000,
48
+ "num_input_tokens_seen": 84936,
49
  "num_train_epochs": 2,
50
  "save_steps": 500,
51
  "stateful_callbacks": {
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06752bf9c95e82feb07130d9f23b1092e28a9ffa7c543df8f0481db05b449dcd
3
  size 8081
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7fa76374f3946a17e1b039d941a82cf671cd3da0c39d599a06415a668a69610
3
  size 8081