nbtpj committed on
Commit
2ce4d17
·
verified ·
1 Parent(s): ad1bd1b

Upload best model checkpoint

Browse files
Files changed (4) hide show
  1. metrics.json +23 -24
  2. model.safetensors +1 -1
  3. special_tokens_map.json +4 -28
  4. train_configs.json +8 -8
metrics.json CHANGED
@@ -1,30 +1,29 @@
1
  {
2
- "rl_info/A2G": -0.00804260652512312,
3
- "rl_info/entropy": 2.8796980381011963,
4
- "rl_info/total_token": 440.0,
5
- "rl_info/advantage_b4_norm": 961.4583129882812,
6
- "rl_info/advantage_after_gnorm": -0.13672709465026855,
7
  "rl_info/kl_w_ref": 0.0,
8
- "train/rl_loss": 0.8039727210998535,
9
- "train/total_loss": 0.8039727210998535,
10
- "xsum/rouge1": 0.1822673507912263,
11
- "xsum/rouge2": 0.03530779605308503,
12
- "xsum/rougeL": 0.1487245393010488,
13
- "xsum/rougeLsum": 0.14915382086079024,
14
- "xsum/bertscore_precision": 0.7578381817936898,
15
- "xsum/bertscore_recall": 0.7217868343293666,
16
- "xsum/bertscore_f1": 0.7386852816343308,
17
- "eval_agg/avg_all_rougef": 0.12886337675153758,
18
- "eval_agg/avg_all_bertf": 0.7386852816343308,
19
- "eval_agg/avg_all": 0.4337743291929342,
20
- "num_rl_rollout": 213,
21
  "lm_epoch": 0,
22
  "rl_epoch": 0,
23
- "step": 17000,
24
- "total_data_token": 2906376,
25
- "total_rl_token": 18963869,
26
  "total_lm_token": 0,
27
- "total_token": 18963869,
28
- "completed_steps": 17000,
29
- "tune_objective": 0.4375542633059791
30
  }
 
1
  {
2
+ "rl_info/A2G": -0.07268727570772171,
3
+ "rl_info/entropy": 3.100099802017212,
4
+ "rl_info/total_token": 1794.0,
5
+ "rl_info/advantage_b4_norm": -329.8147277832031,
 
6
  "rl_info/kl_w_ref": 0.0,
7
+ "train/rl_loss": 7.268417835235596,
8
+ "train/total_loss": 7.268417835235596,
9
+ "xsum/rouge1": 0.16526458612022013,
10
+ "xsum/rouge2": 0.026317550263276528,
11
+ "xsum/rougeL": 0.13316665912096423,
12
+ "xsum/rougeLsum": 0.13414432999907605,
13
+ "xsum/bertscore_precision": 0.7271568326748551,
14
+ "xsum/bertscore_recall": 0.7270669051583575,
15
+ "xsum/bertscore_f1": 0.7266696648915777,
16
+ "eval_agg/avg_all_rougef": 0.11472328137588424,
17
+ "eval_agg/avg_all_bertf": 0.7266696648915777,
18
+ "eval_agg/avg_all": 0.420696473133731,
19
+ "num_rl_rollout": 5,
20
  "lm_epoch": 0,
21
  "rl_epoch": 0,
22
+ "step": 1000,
23
+ "total_data_token": 63494,
24
+ "total_rl_token": 1974715,
25
  "total_lm_token": 0,
26
+ "total_token": 1974715,
27
+ "completed_steps": 1000,
28
+ "tune_objective": 0.39956710286966757
29
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0f294b9fb269ca49e980c3ffa101f250bc2cf3e76bad910a3fe9ca6640d8e6da
3
  size 497774208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a667f9decf7af7cec90a666c53820a1019f056c5ce05dd606e613c926596526
3
  size 497774208
special_tokens_map.json CHANGED
@@ -1,30 +1,6 @@
1
  {
2
- "bos_token": {
3
- "content": "<|endoftext|>",
4
- "lstrip": false,
5
- "normalized": true,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
- "eos_token": {
10
- "content": "<|endoftext|>",
11
- "lstrip": false,
12
- "normalized": true,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "pad_token": {
17
- "content": "<|endoftext|>",
18
- "lstrip": false,
19
- "normalized": true,
20
- "rstrip": false,
21
- "single_word": false
22
- },
23
- "unk_token": {
24
- "content": "<|endoftext|>",
25
- "lstrip": false,
26
- "normalized": true,
27
- "rstrip": false,
28
- "single_word": false
29
- }
30
  }
 
1
  {
2
+ "bos_token": "<|endoftext|>",
3
+ "eos_token": "<|endoftext|>",
4
+ "pad_token": "<|endoftext|>",
5
+ "unk_token": "<|endoftext|>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6
  }
train_configs.json CHANGED
@@ -29,7 +29,7 @@
29
  "seed": 0,
30
  "model_type": null,
31
  "block_size": 1024,
32
- "mini_epoch": 1,
33
  "rollout_game": "baseline3v2",
34
  "rl_algo": "off_policy",
35
  "constraint_type": "kl",
@@ -39,7 +39,7 @@
39
  "n_generate": 4,
40
  "n_augment": 0,
41
  "gradient_checkpoint": false,
42
- "group_relative_norm": true,
43
  "sample_config": {
44
  "do_sample": true,
45
  "min_new_tokens": 5,
@@ -52,13 +52,13 @@
52
  "max_new_tokens": 40
53
  },
54
  "rollout_config": {
55
- "accuracy_w": 8764.345947696369,
56
  "len_pen": 1.0,
57
- "accuracy_w2": 0.008731239835689814,
58
  "len_pen2": 1.0,
59
- "threshold": 0.00013728894342626908,
60
  "similarity_fn": "rouge",
61
- "acc_scale": "lin",
62
  "max_ctx_len": 760
63
  },
64
  "ent_coef": 0.0001,
@@ -68,7 +68,7 @@
68
  "prompt_2": "Given the text: {role1_output}\nReconstruct the summarized text to the detailed:",
69
  "prompt_eval": "{text}\nTL;DR:",
70
  "epsilon": 0.2,
71
- "a2g_norm": true,
72
  "vllm_sleep": true,
73
  "lora": false,
74
  "need_attn_mask": true,
@@ -82,7 +82,7 @@
82
  "trunc_eval": 256,
83
  "buffer_max_size": 20000,
84
  "trunc_evals": [
85
- "xsum___2000"
86
  ],
87
  "use_deepspeed": false,
88
  "zero_config": 2,
 
29
  "seed": 0,
30
  "model_type": null,
31
  "block_size": 1024,
32
+ "mini_epoch": 3,
33
  "rollout_game": "baseline3v2",
34
  "rl_algo": "off_policy",
35
  "constraint_type": "kl",
 
39
  "n_generate": 4,
40
  "n_augment": 0,
41
  "gradient_checkpoint": false,
42
+ "group_relative_norm": false,
43
  "sample_config": {
44
  "do_sample": true,
45
  "min_new_tokens": 5,
 
52
  "max_new_tokens": 40
53
  },
54
  "rollout_config": {
55
+ "accuracy_w": 0.0005981501367285106,
56
  "len_pen": 1.0,
57
+ "accuracy_w2": 505.3115905942363,
58
  "len_pen2": 1.0,
59
+ "threshold": 0.0001942205696972693,
60
  "similarity_fn": "rouge",
61
+ "acc_scale": "log",
62
  "max_ctx_len": 760
63
  },
64
  "ent_coef": 0.0001,
 
68
  "prompt_2": "Given the text: {role1_output}\nReconstruct the summarized text to the detailed:",
69
  "prompt_eval": "{text}\nTL;DR:",
70
  "epsilon": 0.2,
71
+ "a2g_norm": false,
72
  "vllm_sleep": true,
73
  "lora": false,
74
  "need_attn_mask": true,
 
82
  "trunc_eval": 256,
83
  "buffer_max_size": 20000,
84
  "trunc_evals": [
85
+ "xsum___20000"
86
  ],
87
  "use_deepspeed": false,
88
  "zero_config": 2,