adamthekiwi committed on
Commit
169da58
·
1 Parent(s): a62a268

Training in progress, step 500

Browse files
Files changed (26) hide show
  1. .gitignore +1 -0
  2. config.json +39 -0
  3. pytorch_model.bin +3 -0
  4. runs/May05_16-17-31_96105270ada3/1683303460.7343614/events.out.tfevents.1683303460.96105270ada3.197.1 +3 -0
  5. runs/May05_16-17-31_96105270ada3/events.out.tfevents.1683303460.96105270ada3.197.0 +3 -0
  6. runs/May05_16-17-54_96105270ada3/1683303476.6078959/events.out.tfevents.1683303476.96105270ada3.197.3 +3 -0
  7. runs/May05_16-17-54_96105270ada3/events.out.tfevents.1683303476.96105270ada3.197.2 +3 -0
  8. runs/May05_16-23-35_96105270ada3/1683303817.637306/events.out.tfevents.1683303817.96105270ada3.197.5 +3 -0
  9. runs/May05_16-23-35_96105270ada3/events.out.tfevents.1683303817.96105270ada3.197.4 +3 -0
  10. runs/May05_16-27-15_96105270ada3/1683304038.6563365/events.out.tfevents.1683304038.96105270ada3.197.7 +3 -0
  11. runs/May05_16-27-15_96105270ada3/events.out.tfevents.1683304038.96105270ada3.197.6 +3 -0
  12. runs/May05_16-32-37_96105270ada3/1683304360.2422013/events.out.tfevents.1683304360.96105270ada3.197.9 +3 -0
  13. runs/May05_16-32-37_96105270ada3/events.out.tfevents.1683304360.96105270ada3.197.8 +3 -0
  14. runs/May05_16-36-18_96105270ada3/1683304580.5996478/events.out.tfevents.1683304580.96105270ada3.197.11 +3 -0
  15. runs/May05_16-36-18_96105270ada3/events.out.tfevents.1683304580.96105270ada3.197.10 +3 -0
  16. runs/May05_16-42-03_96105270ada3/1683304926.0094068/events.out.tfevents.1683304926.96105270ada3.197.13 +3 -0
  17. runs/May05_16-42-03_96105270ada3/events.out.tfevents.1683304926.96105270ada3.197.12 +3 -0
  18. runs/May05_16-44-00_96105270ada3/1683305042.750123/events.out.tfevents.1683305042.96105270ada3.197.15 +3 -0
  19. runs/May05_16-44-00_96105270ada3/events.out.tfevents.1683305042.96105270ada3.197.14 +3 -0
  20. runs/May05_16-46-25_96105270ada3/1683305188.038199/events.out.tfevents.1683305188.96105270ada3.197.17 +3 -0
  21. runs/May05_16-46-25_96105270ada3/events.out.tfevents.1683305188.96105270ada3.197.16 +3 -0
  22. runs/May05_16-49-49_96105270ada3/1683305391.6651833/events.out.tfevents.1683305391.96105270ada3.197.19 +3 -0
  23. runs/May05_16-49-49_96105270ada3/events.out.tfevents.1683305391.96105270ada3.197.18 +3 -0
  24. runs/May05_16-54-15_96105270ada3/1683305660.27987/events.out.tfevents.1683305660.96105270ada3.11088.1 +3 -0
  25. runs/May05_16-54-15_96105270ada3/events.out.tfevents.1683305660.96105270ada3.11088.0 +3 -0
  26. training_args.bin +3 -0
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
config.json ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "vicgalle/gpt2-alpaca-gpt4",
3
+ "activation_function": "gelu_new",
4
+ "architectures": [
5
+ "GPT2LMHeadModel"
6
+ ],
7
+ "attn_pdrop": 0.1,
8
+ "bos_token_id": 50256,
9
+ "embd_pdrop": 0.1,
10
+ "eos_token_id": 50256,
11
+ "initializer_range": 0.02,
12
+ "layer_norm_epsilon": 1e-05,
13
+ "model_type": "gpt2",
14
+ "n_ctx": 1024,
15
+ "n_embd": 768,
16
+ "n_head": 12,
17
+ "n_inner": null,
18
+ "n_layer": 12,
19
+ "n_positions": 1024,
20
+ "reorder_and_upcast_attn": false,
21
+ "resid_pdrop": 0.1,
22
+ "scale_attn_by_inverse_layer_idx": false,
23
+ "scale_attn_weights": true,
24
+ "summary_activation": null,
25
+ "summary_first_dropout": 0.1,
26
+ "summary_proj_to_labels": true,
27
+ "summary_type": "cls_index",
28
+ "summary_use_proj": true,
29
+ "task_specific_params": {
30
+ "text-generation": {
31
+ "do_sample": true,
32
+ "max_length": 50
33
+ }
34
+ },
35
+ "torch_dtype": "float32",
36
+ "transformers_version": "4.28.1",
37
+ "use_cache": false,
38
+ "vocab_size": 50260
39
+ }
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25a5f0ec2876590c2cca852e26f3ee202202e1abcad4b3ee96ab74f443a8bee0
3
+ size 510407229
runs/May05_16-17-31_96105270ada3/1683303460.7343614/events.out.tfevents.1683303460.96105270ada3.197.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7c89b87aa6c19a13f030885b184a55b71ba401d1d48fefcd1b4ef16daa7db5a
3
+ size 5870
runs/May05_16-17-31_96105270ada3/events.out.tfevents.1683303460.96105270ada3.197.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9114d02e74ced463d5627545112c388198efeb2d1d709a4c8270d12e227d2ede
3
+ size 4274
runs/May05_16-17-54_96105270ada3/1683303476.6078959/events.out.tfevents.1683303476.96105270ada3.197.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05704e005a2cd0b6d86793fd1aaa9047e3e227ca806265c582e69d251c180f89
3
+ size 5870
runs/May05_16-17-54_96105270ada3/events.out.tfevents.1683303476.96105270ada3.197.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e16608aaa596b2cb67e4f08ed3acb9420558fa65f215ba22b9f78a2abeb4536
3
+ size 4274
runs/May05_16-23-35_96105270ada3/1683303817.637306/events.out.tfevents.1683303817.96105270ada3.197.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:437f3e7f86ff41ce12e6ade1526b312af8e4351c86af9bfaf58527f40e9a201e
3
+ size 5870
runs/May05_16-23-35_96105270ada3/events.out.tfevents.1683303817.96105270ada3.197.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aa0eb77052a16821bfb80e6e5ff8d7b7975ef53ccc948a1328e272f76daa9217
3
+ size 4274
runs/May05_16-27-15_96105270ada3/1683304038.6563365/events.out.tfevents.1683304038.96105270ada3.197.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22eb3dc5b926d1b348d1cbb188a0dffb0e6c12b8681dd3bc9cf8141be0f55a22
3
+ size 5870
runs/May05_16-27-15_96105270ada3/events.out.tfevents.1683304038.96105270ada3.197.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea8367094adafe7b8928ebd7f9265302e89d0b77f8d376d82d76c94f0b3bd6cb
3
+ size 4274
runs/May05_16-32-37_96105270ada3/1683304360.2422013/events.out.tfevents.1683304360.96105270ada3.197.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2677d7f73df4d2d06dd88739b93508be3337fb27df52cbd29b3ec623bf6f7b07
3
+ size 5870
runs/May05_16-32-37_96105270ada3/events.out.tfevents.1683304360.96105270ada3.197.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:626d4105661cef3cd31226fa22167f32b5f31ddeaa3e4413d4f4a28e4bd61ed9
3
+ size 4274
runs/May05_16-36-18_96105270ada3/1683304580.5996478/events.out.tfevents.1683304580.96105270ada3.197.11 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1101b2339e9bdd1f21cd5ddb78520d6b0cd5dc72a9ad40b23d4770b66050ec1e
3
+ size 5870
runs/May05_16-36-18_96105270ada3/events.out.tfevents.1683304580.96105270ada3.197.10 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35f213ee496f09f2ce510267ad337e482e5745b0d777feb0f5e117a87d59e6c0
3
+ size 4274
runs/May05_16-42-03_96105270ada3/1683304926.0094068/events.out.tfevents.1683304926.96105270ada3.197.13 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:003c28a42675af0410f8624922fabd7e7bf7e1dd492fafe1e95354e9bee2ced2
3
+ size 5870
runs/May05_16-42-03_96105270ada3/events.out.tfevents.1683304926.96105270ada3.197.12 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2500c7a6225a128a56fe8621655b0a0811b865d3514d51d3af1bdba8f9ab395e
3
+ size 4274
runs/May05_16-44-00_96105270ada3/1683305042.750123/events.out.tfevents.1683305042.96105270ada3.197.15 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b742fbc51239a7b4f440ed934533562897a6340cfdc6cea53a5c5daded5e3a03
3
+ size 5870
runs/May05_16-44-00_96105270ada3/events.out.tfevents.1683305042.96105270ada3.197.14 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:378069f953c925d46986866a8b2a5750b17df626fde6bfd3783c20b0a9995ab0
3
+ size 4274
runs/May05_16-46-25_96105270ada3/1683305188.038199/events.out.tfevents.1683305188.96105270ada3.197.17 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed2cd305954c1b6d751589350ef913293e0b71140e50794ee9d6c4fdaa16f9a5
3
+ size 5870
runs/May05_16-46-25_96105270ada3/events.out.tfevents.1683305188.96105270ada3.197.16 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e647ae6f160e00857a082538ff61ff3befb8f47ffdab79ecf6c457a165644c5
3
+ size 4274
runs/May05_16-49-49_96105270ada3/1683305391.6651833/events.out.tfevents.1683305391.96105270ada3.197.19 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b54bd4603d86985d12e6c5e9bd340c92189e5960f0dd04786a4299462f99c73
3
+ size 5870
runs/May05_16-49-49_96105270ada3/events.out.tfevents.1683305391.96105270ada3.197.18 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8194e56ad81f16a9c2b613cbad51b527ca0777f6e8dea0246777811da47f39d9
3
+ size 4184
runs/May05_16-54-15_96105270ada3/1683305660.27987/events.out.tfevents.1683305660.96105270ada3.11088.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f936cfcf6e67920b539215c00ea51596f69e5108b0015f841e688aedd8c9584
3
+ size 5870
runs/May05_16-54-15_96105270ada3/events.out.tfevents.1683305660.96105270ada3.11088.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:346635c30617865aebc76cc1bbc907acf06b28940d3cbbce61ea5c74c190c2fa
3
+ size 4431
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ba4411cb8a08cd03ebba7e6a99690d7f897a666e5ff0268a59ee707213d551c
3
+ size 3579