nbtpj committed on
Commit
174b104
·
verified ·
1 Parent(s): d0258f9

Upload best model checkpoint

Browse files
accelerator.ckpt/dl_state_dict.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d2567898e7971a0b5670bf6a2737bc31f98cc950fb4130fe8d746054d9f1be3
3
  size 1489
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74bd30b4bae1eb20aaee33823339f45a6a332404c6418808b3f23c5506071988
3
  size 1489
accelerator.ckpt/dl_state_dict_1.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:43919dbdf599450386720f61a25bad24d90eca951c25271e500df587378f1abf
3
  size 1501
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e30604dce73b0be0cfc1012424f910bc5c6af6763f54add923ee866b5a7be937
3
  size 1501
accelerator.ckpt/dl_state_dict_2.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d18bcd689dbb471d486cfc1fcae82e7fb210ffb37bd6172295a630d9fea40b9c
3
  size 1501
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:458236410ffa4bd403bb211b02671bd554643c1cf3d549a07b34d1a5efd51235
3
  size 1501
accelerator.ckpt/dl_state_dict_3.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7071a9b7092627c45be3df7796c8387732b699abc24c431c8d8abe771d2f1cdb
3
  size 1501
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:34219474ed2666dcbc6ee637b72049654546f48e581c4940f51b0578ab15f517
3
  size 1501
accelerator.ckpt/dl_state_dict_4.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0c852d5f1a0b46f769dceae5ed0350bbebda4ae59f4d937518014c7ffd8c39db
3
  size 1501
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e2b52a00ea47e691fcf45a0f6c762bfa77c060859c21428b153f729e745e5d5
3
  size 1501
accelerator.ckpt/dl_state_dict_6.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:073d07e02f891414b4651a8be06b723ad811730888320cbcd88c7c842ec4f401
3
+ size 1501
accelerator.ckpt/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72cb730d48a4ebb7c171131201d4ef436a363e29f3612a1bef070eb443d27540
3
  size 497774208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1a6a08657ba030890c32eb5d5eabdd191ce627dd251c567d5a58c2297ee89f0
3
  size 497774208
accelerator.ckpt/optimizer.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4bf5be8ddaa821b05c94549412b54654e98f21c54385c65705aaa6a10cbd0ea6
3
  size 995606091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:041c6162961c5ab2c547b1ccc71d343eb0fc073c7bb9a6e03b0674df256a5f1e
3
  size 995606091
accelerator.ckpt/random_states_0.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c2096e5fe9ed800834e5062b80cf17dbcc2e3a970c7f22cab692e6840cd078a
3
  size 14757
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6f53c7e2cb24c2a4de9637a6da182f87bb6ed2f90a2d4e82bf9c880f0ad7e1a
3
  size 14757
metrics.json CHANGED
@@ -1,51 +1,52 @@
1
  {
2
- "rl_info/A2G": -2.228810262749903e-05,
3
- "rl_info/entropy": 3.103461980819702,
4
- "rl_info/total_token": 3872.0,
5
- "rl_info/advantage_b4_norm": -847.2278442382812,
6
- "rl_info/advantage_after_gnorm": 0.2974321246147156,
7
  "rl_info/kl_w_ref": 0.0,
8
- "train/rl_loss": 0.0019184639677405357,
9
- "train/total_loss": 0.0019184639677405357,
10
- "gigaword/rouge1": 0.017424667842673495,
11
- "gigaword/rouge2": 0.002778778179571005,
12
- "gigaword/rougeL": 0.01708351188579019,
13
- "gigaword/rougeLsum": 0.01597830557868938,
14
- "gigaword/bertscore_precision": 0.5688383205235005,
15
- "gigaword/bertscore_recall": 0.6489311541616917,
16
- "gigaword/bertscore_f1": 0.6054284919798374,
17
- "cnndm/rouge1": 0.1657242795787633,
18
- "cnndm/rouge2": 0.05944159953280759,
19
- "cnndm/rougeL": 0.13357654072383415,
20
- "cnndm/rougeLsum": 0.14685147194336262,
21
- "cnndm/bertscore_precision": 0.6781402329603831,
22
- "cnndm/bertscore_recall": 0.7525439510742823,
23
- "cnndm/bertscore_f1": 0.7120969245831171,
24
- "xsum/rouge1": 0.12156545540546186,
25
- "xsum/rouge2": 0.01235304893841479,
26
- "xsum/rougeL": 0.08560314826140131,
27
- "xsum/rougeLsum": 0.09009432870268685,
28
- "xsum/bertscore_precision": 0.6957823038101196,
29
- "xsum/bertscore_recall": 0.7223540594180425,
30
- "xsum/bertscore_f1": 0.7064366390307745,
31
- "samsum/rouge1": 0.08285230780746375,
32
- "samsum/rouge2": 0.021593044513516627,
33
- "samsum/rougeL": 0.07018645398318014,
34
- "samsum/rougeLsum": 0.057873523121751924,
35
- "samsum/bertscore_precision": 0.6268573751052221,
36
- "samsum/bertscore_recall": 0.6982430865367254,
37
- "samsum/bertscore_f1": 0.6594596952199936,
38
- "eval_agg/avg_all_rougef": 0.06881127912496056,
39
- "eval_agg/avg_all_bertf": 0.6708554377034307,
40
- "eval_agg/avg_all": 0.3698333584141956,
41
- "num_rl_rollout": 10,
 
42
  "lm_epoch": 0,
43
  "rl_epoch": 0,
44
  "step": 400,
45
- "total_data_token": 109047,
46
- "total_rl_token": 1767730,
47
- "total_lm_token": 0,
48
- "total_token": 1767730,
49
  "completed_steps": 400,
50
- "tune_objective": 0.8896403575001602
51
  }
 
1
  {
2
+ "rl_info/A2G": -0.006648760288953781,
3
+ "rl_info/entropy": 3.1247427463531494,
4
+ "rl_info/total_token": 1710.0,
5
+ "rl_info/advantage_b4_norm": -524.6408081054688,
6
+ "rl_info/advantage_after_gnorm": 1.010803461074829,
7
  "rl_info/kl_w_ref": 0.0,
8
+ "train/rl_loss": 0.6645635962486267,
9
+ "train/lm_loss": 6.4453349113464355,
10
+ "train/total_loss": 7.109898567199707,
11
+ "samsum/rouge1": 0.07018707411132723,
12
+ "samsum/rouge2": 0.015589278392518668,
13
+ "samsum/rougeL": 0.05694806401174433,
14
+ "samsum/rougeLsum": 0.05097452753746131,
15
+ "samsum/bertscore_precision": 0.6306706219911575,
16
+ "samsum/bertscore_recall": 0.7116748541593552,
17
+ "samsum/bertscore_f1": 0.6681777884562811,
18
+ "xsum/rouge1": 0.07577425197474222,
19
+ "xsum/rouge2": 0.015173697537833916,
20
+ "xsum/rougeL": 0.06791431460162027,
21
+ "xsum/rougeLsum": 0.06226845688932118,
22
+ "xsum/bertscore_precision": 0.685419961810112,
23
+ "xsum/bertscore_recall": 0.6998258779446284,
24
+ "xsum/bertscore_f1": 0.6894047458966573,
25
+ "gigaword/rouge1": 0.01673533809218624,
26
+ "gigaword/rouge2": 0.002688706117978111,
27
+ "gigaword/rougeL": 0.016448820149720444,
28
+ "gigaword/rougeLsum": 0.015425704010653109,
29
+ "gigaword/bertscore_precision": 0.5675247123837471,
30
+ "gigaword/bertscore_recall": 0.6473609921336174,
31
+ "gigaword/bertscore_f1": 0.6041367189586162,
32
+ "cnndm/rouge1": 0.12628644770575717,
33
+ "cnndm/rouge2": 0.04433825429137848,
34
+ "cnndm/rougeL": 0.09875398462560836,
35
+ "cnndm/rougeLsum": 0.10678645281701828,
36
+ "cnndm/bertscore_precision": 0.6603378802537918,
37
+ "cnndm/bertscore_recall": 0.7300801773866018,
38
+ "cnndm/bertscore_f1": 0.6927102555831274,
39
+ "eval_agg/avg_all_rougef": 0.052643335804179334,
40
+ "eval_agg/avg_all_bertf": 0.6636073772236705,
41
+ "eval_agg/avg_all": 0.3581253565139249,
42
+ "num_rl_rollout": 4,
43
  "lm_epoch": 0,
44
  "rl_epoch": 0,
45
  "step": 400,
46
+ "total_data_token": 668982,
47
+ "total_rl_token": 849448,
48
+ "total_lm_token": 625452,
49
+ "total_token": 1474900,
50
  "completed_steps": 400,
51
+ "tune_objective": 0.784820971275843
52
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:72cb730d48a4ebb7c171131201d4ef436a363e29f3612a1bef070eb443d27540
3
  size 497774208
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1a6a08657ba030890c32eb5d5eabdd191ce627dd251c567d5a58c2297ee89f0
3
  size 497774208
special_tokens_map.json CHANGED
@@ -1,30 +1,6 @@
1
  {
2
- "bos_token": {
3
- "content": "<|endoftext|>",
4
- "lstrip": false,
5
- "normalized": true,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
- "eos_token": {
10
- "content": "<|endoftext|>",
11
- "lstrip": false,
12
- "normalized": true,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "pad_token": {
17
- "content": "<|endoftext|>",
18
- "lstrip": false,
19
- "normalized": true,
20
- "rstrip": false,
21
- "single_word": false
22
- },
23
- "unk_token": {
24
- "content": "<|endoftext|>",
25
- "lstrip": false,
26
- "normalized": true,
27
- "rstrip": false,
28
- "single_word": false
29
- }
30
  }
 
1
  {
2
+ "bos_token": "<|endoftext|>",
3
+ "eos_token": "<|endoftext|>",
4
+ "pad_token": "<|endoftext|>",
5
+ "unk_token": "<|endoftext|>"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6
  }
train_configs.json CHANGED
@@ -2,7 +2,8 @@
2
  "dataset_name": "nbtpj/summ_ds_train",
3
  "dataset_config_name": null,
4
  "train_split_name": "merge36_cnndmsamsumxsum",
5
- "text_col": "text",
 
6
  "freeze_role2": false,
7
  "only_train_role1": false,
8
  "model_name_or_path": "gpt2",
@@ -34,7 +35,7 @@
34
  "constraint_type": "kl",
35
  "clamp_update": false,
36
  "rl_w": 1.0,
37
- "lm_w": 0.0,
38
  "n_generate": 4,
39
  "n_augment": 0,
40
  "gradient_checkpoint": false,
@@ -51,11 +52,11 @@
51
  "max_new_tokens": 250
52
  },
53
  "rollout_config": {
54
- "accuracy_w": 60.07249475906205,
55
  "len_pen": 1.0,
56
- "accuracy_w2": 1.2229065947034368,
57
  "len_pen2": 1.0,
58
- "threshold": 0.006750312521595928,
59
  "similarity_fn": "rouge"
60
  },
61
  "ent_coef": 0.0001,
 
2
  "dataset_name": "nbtpj/summ_ds_train",
3
  "dataset_config_name": null,
4
  "train_split_name": "merge36_cnndmsamsumxsum",
5
+ "text_template": "{text}\nTL;DR: {summary}",
6
+ "label_col": "summary",
7
  "freeze_role2": false,
8
  "only_train_role1": false,
9
  "model_name_or_path": "gpt2",
 
35
  "constraint_type": "kl",
36
  "clamp_update": false,
37
  "rl_w": 1.0,
38
+ "lm_w": 1.0,
39
  "n_generate": 4,
40
  "n_augment": 0,
41
  "gradient_checkpoint": false,
 
52
  "max_new_tokens": 250
53
  },
54
  "rollout_config": {
55
+ "accuracy_w": 12.960656597279739,
56
  "len_pen": 1.0,
57
+ "accuracy_w2": 30.20289640158668,
58
  "len_pen2": 1.0,
59
+ "threshold": 0.09062263471261954,
60
  "similarity_fn": "rouge"
61
  },
62
  "ent_coef": 0.0001,