vicclab committed on
Commit
6aa6133
·
1 Parent(s): 832117f

End of training

Browse files
Files changed (40) hide show
  1. .gitignore +1 -0
  2. config.json +39 -0
  3. generation_config.json +6 -0
  4. merges.txt +0 -0
  5. pytorch_model.bin +3 -0
  6. runs/Feb27_08-26-30_fc60717d9ef2/1677486429.5043063/events.out.tfevents.1677486429.fc60717d9ef2.681.1 +3 -0
  7. runs/Feb27_08-26-30_fc60717d9ef2/1677487228.6652255/events.out.tfevents.1677487228.fc60717d9ef2.681.3 +3 -0
  8. runs/Feb27_08-26-30_fc60717d9ef2/events.out.tfevents.1677486429.fc60717d9ef2.681.0 +3 -0
  9. runs/Feb27_08-26-30_fc60717d9ef2/events.out.tfevents.1677487228.fc60717d9ef2.681.2 +3 -0
  10. runs/Feb27_08-41-08_fc60717d9ef2/1677487289.7801874/events.out.tfevents.1677487289.fc60717d9ef2.681.5 +3 -0
  11. runs/Feb27_08-41-08_fc60717d9ef2/events.out.tfevents.1677487289.fc60717d9ef2.681.4 +3 -0
  12. runs/Feb27_08-49-52_fc60717d9ef2/1677487809.8054178/events.out.tfevents.1677487809.fc60717d9ef2.681.7 +3 -0
  13. runs/Feb27_08-49-52_fc60717d9ef2/events.out.tfevents.1677487809.fc60717d9ef2.681.6 +3 -0
  14. runs/Feb27_08-51-39_fc60717d9ef2/1677487914.218362/events.out.tfevents.1677487914.fc60717d9ef2.681.9 +3 -0
  15. runs/Feb27_08-51-39_fc60717d9ef2/1677487969.808486/events.out.tfevents.1677487969.fc60717d9ef2.681.10 +3 -0
  16. runs/Feb27_08-51-39_fc60717d9ef2/1677488013.3413498/events.out.tfevents.1677488013.fc60717d9ef2.681.11 +3 -0
  17. runs/Feb27_08-51-39_fc60717d9ef2/events.out.tfevents.1677487914.fc60717d9ef2.681.8 +3 -0
  18. runs/Feb27_08-55-09_fc60717d9ef2/1677488290.8080983/events.out.tfevents.1677488290.fc60717d9ef2.681.13 +3 -0
  19. runs/Feb27_08-55-09_fc60717d9ef2/events.out.tfevents.1677488290.fc60717d9ef2.681.12 +3 -0
  20. runs/Feb27_09-00-26_fc60717d9ef2/1677488451.4369497/events.out.tfevents.1677488451.fc60717d9ef2.681.15 +3 -0
  21. runs/Feb27_09-00-26_fc60717d9ef2/1677488463.118922/events.out.tfevents.1677488463.fc60717d9ef2.681.16 +3 -0
  22. runs/Feb27_09-00-26_fc60717d9ef2/1677488522.5581338/events.out.tfevents.1677488522.fc60717d9ef2.681.17 +3 -0
  23. runs/Feb27_09-00-26_fc60717d9ef2/events.out.tfevents.1677488451.fc60717d9ef2.681.14 +3 -0
  24. runs/Feb27_09-05-35_fc60717d9ef2/1677488764.8892996/events.out.tfevents.1677488764.fc60717d9ef2.11912.1 +3 -0
  25. runs/Feb27_09-05-35_fc60717d9ef2/events.out.tfevents.1677488764.fc60717d9ef2.11912.0 +3 -0
  26. runs/Feb27_09-09-26_fc60717d9ef2/1677489002.5988908/events.out.tfevents.1677489002.fc60717d9ef2.12943.1 +3 -0
  27. runs/Feb27_09-09-26_fc60717d9ef2/events.out.tfevents.1677489002.fc60717d9ef2.12943.0 +3 -0
  28. runs/Feb27_09-10-39_fc60717d9ef2/1677489065.4838176/events.out.tfevents.1677489065.fc60717d9ef2.12943.3 +3 -0
  29. runs/Feb27_09-10-39_fc60717d9ef2/events.out.tfevents.1677489065.fc60717d9ef2.12943.2 +3 -0
  30. runs/Feb27_09-11-22_fc60717d9ef2/1677489105.6450863/events.out.tfevents.1677489105.fc60717d9ef2.12943.5 +3 -0
  31. runs/Feb27_09-11-22_fc60717d9ef2/events.out.tfevents.1677489105.fc60717d9ef2.12943.4 +3 -0
  32. runs/Feb27_09-16-35_fc60717d9ef2/1677489421.8902442/events.out.tfevents.1677489421.fc60717d9ef2.14971.1 +3 -0
  33. runs/Feb27_09-16-35_fc60717d9ef2/events.out.tfevents.1677489421.fc60717d9ef2.14971.0 +3 -0
  34. runs/Feb27_09-26-54_fc60717d9ef2/1677490045.1964664/events.out.tfevents.1677490045.fc60717d9ef2.17454.1 +3 -0
  35. runs/Feb27_09-26-54_fc60717d9ef2/events.out.tfevents.1677490045.fc60717d9ef2.17454.0 +3 -0
  36. special_tokens_map.json +6 -0
  37. tokenizer.json +0 -0
  38. tokenizer_config.json +10 -0
  39. training_args.bin +3 -0
  40. vocab.json +0 -0
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "gpt2",
3
+ "activation_function": "gelu_new",
4
+ "architectures": [
5
+ "GPT2LMHeadModel"
6
+ ],
7
+ "attn_pdrop": 0.1,
8
+ "bos_token_id": 50256,
9
+ "embd_pdrop": 0.1,
10
+ "eos_token_id": 50256,
11
+ "initializer_range": 0.02,
12
+ "layer_norm_epsilon": 1e-05,
13
+ "model_type": "gpt2",
14
+ "n_ctx": 1024,
15
+ "n_embd": 768,
16
+ "n_head": 12,
17
+ "n_inner": null,
18
+ "n_layer": 12,
19
+ "n_positions": 1024,
20
+ "reorder_and_upcast_attn": false,
21
+ "resid_pdrop": 0.1,
22
+ "scale_attn_by_inverse_layer_idx": false,
23
+ "scale_attn_weights": true,
24
+ "summary_activation": null,
25
+ "summary_first_dropout": 0.1,
26
+ "summary_proj_to_labels": true,
27
+ "summary_type": "cls_index",
28
+ "summary_use_proj": true,
29
+ "task_specific_params": {
30
+ "text-generation": {
31
+ "do_sample": true,
32
+ "max_length": 50
33
+ }
34
+ },
35
+ "torch_dtype": "float32",
36
+ "transformers_version": "4.26.1",
37
+ "use_cache": true,
38
+ "vocab_size": 50257
39
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 50256,
4
+ "eos_token_id": 50256,
5
+ "transformers_version": "4.26.1"
6
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2357105a8dd8ea3524652ddfbcc9bf85fce050c7c9cac77845c303fb4cfa3ffb
3
+ size 510398013
runs/Feb27_08-26-30_fc60717d9ef2/1677486429.5043063/events.out.tfevents.1677486429.fc60717d9ef2.681.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1bcd4002518aa6048d45861686e5b8bed451f580912bd37131a2bda43bb3be9d
3
+ size 5634
runs/Feb27_08-26-30_fc60717d9ef2/1677487228.6652255/events.out.tfevents.1677487228.fc60717d9ef2.681.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fcf3c7969d940833f63f8d4e2bc25b2571681056c060845af01ff02723843e54
3
+ size 5634
runs/Feb27_08-26-30_fc60717d9ef2/events.out.tfevents.1677486429.fc60717d9ef2.681.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:939863da68bd4f5807ff0666125729c118fe418507051aca4aa8d8045fe8106b
3
+ size 4121
runs/Feb27_08-26-30_fc60717d9ef2/events.out.tfevents.1677487228.fc60717d9ef2.681.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f327dd1b5be906a6c6319c070f9d647a8b18328389d9d680fe827ff2514cab5c
3
+ size 4121
runs/Feb27_08-41-08_fc60717d9ef2/1677487289.7801874/events.out.tfevents.1677487289.fc60717d9ef2.681.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5230dd43e65e9d727682cff516070b6a8c95ff5592643172d316c4ccf9a73508
3
+ size 5631
runs/Feb27_08-41-08_fc60717d9ef2/events.out.tfevents.1677487289.fc60717d9ef2.681.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46786d8cff5cf387048fd93a1b14ca4bcf5d8b7fcb20c3351d7b31b302c7cd8a
3
+ size 4119
runs/Feb27_08-49-52_fc60717d9ef2/1677487809.8054178/events.out.tfevents.1677487809.fc60717d9ef2.681.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a5cd14b0e5c3ccf647535590c7d8ec817c4dacc37b39229f0f2cf573cb03945
3
+ size 5641
runs/Feb27_08-49-52_fc60717d9ef2/events.out.tfevents.1677487809.fc60717d9ef2.681.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9e0a6f32a973afd8c049e2414ed559321677249825bb3e5296cbbe9d8fd888f
3
+ size 4129
runs/Feb27_08-51-39_fc60717d9ef2/1677487914.218362/events.out.tfevents.1677487914.fc60717d9ef2.681.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e98d178e76db9c30aa36b4f195fd11536461089e4b367acc05edf023293b3a3e
3
+ size 5641
runs/Feb27_08-51-39_fc60717d9ef2/1677487969.808486/events.out.tfevents.1677487969.fc60717d9ef2.681.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:630e528193e45aea021a766e386c1a4cadd7bcc905d2ddea3a9cac952e76f3e1
3
+ size 5641
runs/Feb27_08-51-39_fc60717d9ef2/1677488013.3413498/events.out.tfevents.1677488013.fc60717d9ef2.681.11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aaa1c975210c064abcd40ce9024823802f0569a430369929f494d8fcb4b9f55d
3
+ size 5641
runs/Feb27_08-51-39_fc60717d9ef2/events.out.tfevents.1677487914.fc60717d9ef2.681.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d34fdf7ad210de29eaa801935145bfecdf928de720a0db39d9bbb92420042c84
3
+ size 12307
runs/Feb27_08-55-09_fc60717d9ef2/1677488290.8080983/events.out.tfevents.1677488290.fc60717d9ef2.681.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fb89c2058e03c18fa0b7c765597552b3908b2c1fcb0bfa889e73e467d86c8b48
3
+ size 5641
runs/Feb27_08-55-09_fc60717d9ef2/events.out.tfevents.1677488290.fc60717d9ef2.681.12 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8489f3a1c4371ecd7bdd669ee7bcd2b20edaf3ba7c10e0ec2c046f741a68d698
3
+ size 4127
runs/Feb27_09-00-26_fc60717d9ef2/1677488451.4369497/events.out.tfevents.1677488451.fc60717d9ef2.681.15 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:862a7ff9d277fdb26903455074371c85a064a4bd0c762f9b1298c5936f2d8f54
3
+ size 5641
runs/Feb27_09-00-26_fc60717d9ef2/1677488463.118922/events.out.tfevents.1677488463.fc60717d9ef2.681.16 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a0fa5235d7172ce354cf97de2b1024e9cafcda3d22f025ca1a3bbd684a4d63c1
3
+ size 5641
runs/Feb27_09-00-26_fc60717d9ef2/1677488522.5581338/events.out.tfevents.1677488522.fc60717d9ef2.681.17 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa358dfa789cc54aee0e279b77524673abf04b1ba5a644b1d557a28b3851a981
3
+ size 5641
runs/Feb27_09-00-26_fc60717d9ef2/events.out.tfevents.1677488451.fc60717d9ef2.681.14 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11e07151e93393e16d8e8b2ee4186379c154c4dc04f9e7f58eae8002e0ca11d7
3
+ size 12301
runs/Feb27_09-05-35_fc60717d9ef2/1677488764.8892996/events.out.tfevents.1677488764.fc60717d9ef2.11912.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4995e2bb6887190648c485d2fa2e90fa92559ac67c3ba34ccbdfe442b144e0ec
3
+ size 5641
runs/Feb27_09-05-35_fc60717d9ef2/events.out.tfevents.1677488764.fc60717d9ef2.11912.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91b5b6c51fedb651d9adc4dbe9a903091a01eb4c116754cee83ef2c1f140d4d2
3
+ size 4127
runs/Feb27_09-09-26_fc60717d9ef2/1677489002.5988908/events.out.tfevents.1677489002.fc60717d9ef2.12943.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39c02215581c411ee3ec87d97672cead39093bfce34f88e9bb70c497caf0718a
3
+ size 5641
runs/Feb27_09-09-26_fc60717d9ef2/events.out.tfevents.1677489002.fc60717d9ef2.12943.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:055bb60caee07c4ec45177bead279a0c62a08dc4e4b6ccd891170195ce2efaf1
3
+ size 4024
runs/Feb27_09-10-39_fc60717d9ef2/1677489065.4838176/events.out.tfevents.1677489065.fc60717d9ef2.12943.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eaf0c65ae8fa8ec54a4f433a186f396ca26a30d33b8bf9af4d6297b5f79210e4
3
+ size 5641
runs/Feb27_09-10-39_fc60717d9ef2/events.out.tfevents.1677489065.fc60717d9ef2.12943.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72729ef1e9cda5d86b9167e8c1977101bc8745f50a0dccb588259a829e49a2fe
3
+ size 4024
runs/Feb27_09-11-22_fc60717d9ef2/1677489105.6450863/events.out.tfevents.1677489105.fc60717d9ef2.12943.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c47b95885b002cc092eba23b48d7b334b0b528adccd5de53c67e4517e6e973d
3
+ size 5641
runs/Feb27_09-11-22_fc60717d9ef2/events.out.tfevents.1677489105.fc60717d9ef2.12943.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c53f0b0f88e30c5549e07c675cfd946c918f9656c6e4f92ad4969fc3a0a7ebfd
3
+ size 4024
runs/Feb27_09-16-35_fc60717d9ef2/1677489421.8902442/events.out.tfevents.1677489421.fc60717d9ef2.14971.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:446a8908dac4d2f41fcafc8bb4ad310d3de2e3a4bbf7bc90c43ec08f254db286
3
+ size 5641
runs/Feb27_09-16-35_fc60717d9ef2/events.out.tfevents.1677489421.fc60717d9ef2.14971.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd09de7267d311dc64c459dbee53ccf2a832575816025868efbd59b61523fe9f
3
+ size 4024
runs/Feb27_09-26-54_fc60717d9ef2/1677490045.1964664/events.out.tfevents.1677490045.fc60717d9ef2.17454.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f80205d07f662911ce4ffb2cf34824fc07e7338c27570314f65c1d9ef9a7dc0
3
+ size 5641
runs/Feb27_09-26-54_fc60717d9ef2/events.out.tfevents.1677490045.fc60717d9ef2.17454.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a7d58758131b49afe91b0902345ca2c36da4b4f4303a985f958a613fb17ec10
3
+ size 4378
special_tokens_map.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<|endoftext|>",
3
+ "eos_token": "<|endoftext|>",
4
+ "pad_token": "<|endoftext|>",
5
+ "unk_token": "<|endoftext|>"
6
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "bos_token": "<|endoftext|>",
4
+ "eos_token": "<|endoftext|>",
5
+ "model_max_length": 1024,
6
+ "name_or_path": "gpt2",
7
+ "special_tokens_map_file": null,
8
+ "tokenizer_class": "GPT2Tokenizer",
9
+ "unk_token": "<|endoftext|>"
10
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:445af2c43883203fddd84831824a8856b1b29d64a08ebb609d6bf26332120419
3
+ size 3451
vocab.json ADDED
The diff for this file is too large to render. See raw diff