bimabk committed on
Commit
3a6d21c
·
verified ·
1 Parent(s): 104dc15

Upload task output 1

Browse files
adapter_config.json CHANGED
@@ -29,13 +29,13 @@
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
 
 
32
  "down_proj",
33
- "up_proj",
34
  "k_proj",
35
- "gate_proj",
36
- "q_proj",
37
  "o_proj",
38
- "v_proj"
 
39
  ],
40
  "target_parameters": null,
41
  "task_type": "CAUSAL_LM",
 
29
  "rank_pattern": {},
30
  "revision": null,
31
  "target_modules": [
32
+ "q_proj",
33
+ "v_proj",
34
  "down_proj",
 
35
  "k_proj",
 
 
36
  "o_proj",
37
+ "up_proj",
38
+ "gate_proj"
39
  ],
40
  "target_parameters": null,
41
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a51e4d58b1e4af75220adfa4b19eb8e54a528c771c7995176479f54a4662aee
3
  size 957942768
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38704008a55135f8c68ad0c90eaa5bfdebc06173357d68ab8ccc64d7e5c514b3
3
  size 957942768
loss.txt CHANGED
@@ -1 +1 @@
1
- 4,-0.57375
 
1
+ 9,no_eval
trainer_state.json CHANGED
@@ -2,49 +2,50 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 1.0,
6
  "eval_steps": 500,
7
- "global_step": 4,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
  "log_history": [
12
  {
13
- "epoch": 1.0,
14
- "eval_clip_ratio/high_max": 0.0,
15
- "eval_clip_ratio/high_mean": 0.0,
16
- "eval_clip_ratio/low_mean": 0.0,
17
- "eval_clip_ratio/low_min": 0.0,
18
- "eval_clip_ratio/region_mean": 0.0,
19
- "eval_completions/clipped_ratio": 0.0,
20
- "eval_completions/max_length": 2.98,
21
- "eval_completions/max_terminated_length": 2.98,
22
- "eval_completions/mean_length": 2.32,
23
- "eval_completions/mean_terminated_length": 2.32,
24
- "eval_completions/min_length": 2.0,
25
- "eval_completions/min_terminated_length": 2.0,
26
- "eval_entropy": 0.6514365351200104,
27
- "eval_frac_reward_zero_std": 0.44,
28
- "eval_loss": 0.015936430543661118,
29
- "eval_num_tokens": 439873.0,
30
- "eval_reward": 0.57375,
31
- "eval_reward_std": 0.48721748173236845,
32
- "eval_rewards/env_game_reward/mean": 0.57375,
33
- "eval_rewards/env_game_reward/std": 0.48721749722957614,
34
- "eval_runtime": 71.8753,
35
- "eval_samples_per_second": 2.783,
36
- "eval_sampling/importance_sampling_ratio/max": 1.3798925983905792,
37
- "eval_sampling/importance_sampling_ratio/mean": 0.9876983833312988,
38
- "eval_sampling/importance_sampling_ratio/min": 0.7033022457361221,
39
- "eval_sampling/sampling_logp_difference/max": 0.4170952755212784,
40
- "eval_sampling/sampling_logp_difference/mean": 0.09031737592071294,
41
- "eval_steps_per_second": 0.348,
42
- "step": 4
 
43
  }
44
  ],
45
  "logging_steps": 5,
46
- "max_steps": 12,
47
- "num_input_tokens_seen": 439873,
48
  "num_train_epochs": 3,
49
  "save_steps": 500,
50
  "stateful_callbacks": {
@@ -54,13 +55,13 @@
54
  "should_evaluate": false,
55
  "should_log": false,
56
  "should_save": true,
57
- "should_training_stop": false
58
  },
59
  "attributes": {}
60
  }
61
  },
62
  "total_flos": 0.0,
63
- "train_batch_size": 42,
64
  "trial_name": null,
65
  "trial_params": null
66
  }
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.011523687580025609,
6
  "eval_steps": 500,
7
+ "global_step": 9,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
11
  "log_history": [
12
  {
13
+ "clip_ratio/high_max": 0.01083222816232592,
14
+ "clip_ratio/high_mean": 0.007730815443210304,
15
+ "clip_ratio/low_mean": 0.008320118731353432,
16
+ "clip_ratio/low_min": 0.004644901840947568,
17
+ "clip_ratio/region_mean": 0.016050934419035913,
18
+ "completions/clipped_ratio": 0.0,
19
+ "completions/max_length": 374.6,
20
+ "completions/max_terminated_length": 374.6,
21
+ "completions/mean_length": 288.41796875,
22
+ "completions/mean_terminated_length": 288.41796875,
23
+ "completions/min_length": 145.2,
24
+ "completions/min_terminated_length": 145.2,
25
+ "entropy": 0.35683331191539763,
26
+ "epoch": 0.006402048655569782,
27
+ "frac_reward_zero_std": 0.4546875,
28
+ "grad_norm": 0.04971550032496452,
29
+ "kl": 0.011301717348396778,
30
+ "learning_rate": 1.137216e-06,
31
+ "loss": 0.0003326917765662074,
32
+ "num_tokens": 1074086.0,
33
+ "reward": 0.28232031464576723,
34
+ "reward_std": 0.25428222119808197,
35
+ "rewards/env_goofspiel_reward/mean": 0.2823203206062317,
36
+ "rewards/env_goofspiel_reward/std": 0.38380778431892393,
37
+ "sampling/importance_sampling_ratio/max": 2.474874496459961,
38
+ "sampling/importance_sampling_ratio/mean": 0.972897756099701,
39
+ "sampling/importance_sampling_ratio/min": 0.00847407877445221,
40
+ "sampling/sampling_logp_difference/max": 8.352801895141601,
41
+ "sampling/sampling_logp_difference/mean": 0.09170940220355987,
42
+ "step": 5,
43
+ "step_time": 27.68519940240021
44
  }
45
  ],
46
  "logging_steps": 5,
47
+ "max_steps": 2343,
48
+ "num_input_tokens_seen": 1930059,
49
  "num_train_epochs": 3,
50
  "save_steps": 500,
51
  "stateful_callbacks": {
 
55
  "should_evaluate": false,
56
  "should_log": false,
57
  "should_save": true,
58
+ "should_training_stop": true
59
  },
60
  "attributes": {}
61
  }
62
  },
63
  "total_flos": 0.0,
64
+ "train_batch_size": 32,
65
  "trial_name": null,
66
  "trial_params": null
67
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:86716a0f9d6726730f9bb33b6ff3e2ea21914baec34e4348e4636d0c05bbd3ef
3
- size 7889
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c896334b84a5cf87c711da6ada923aa8cad601284747089a6a46ea1af55c0030
3
+ size 7185