Commit ·
169da58
1
Parent(s): a62a268
Training in progress, step 500
Browse files- .gitignore +1 -0
- config.json +39 -0
- pytorch_model.bin +3 -0
- runs/May05_16-17-31_96105270ada3/1683303460.7343614/events.out.tfevents.1683303460.96105270ada3.197.1 +3 -0
- runs/May05_16-17-31_96105270ada3/events.out.tfevents.1683303460.96105270ada3.197.0 +3 -0
- runs/May05_16-17-54_96105270ada3/1683303476.6078959/events.out.tfevents.1683303476.96105270ada3.197.3 +3 -0
- runs/May05_16-17-54_96105270ada3/events.out.tfevents.1683303476.96105270ada3.197.2 +3 -0
- runs/May05_16-23-35_96105270ada3/1683303817.637306/events.out.tfevents.1683303817.96105270ada3.197.5 +3 -0
- runs/May05_16-23-35_96105270ada3/events.out.tfevents.1683303817.96105270ada3.197.4 +3 -0
- runs/May05_16-27-15_96105270ada3/1683304038.6563365/events.out.tfevents.1683304038.96105270ada3.197.7 +3 -0
- runs/May05_16-27-15_96105270ada3/events.out.tfevents.1683304038.96105270ada3.197.6 +3 -0
- runs/May05_16-32-37_96105270ada3/1683304360.2422013/events.out.tfevents.1683304360.96105270ada3.197.9 +3 -0
- runs/May05_16-32-37_96105270ada3/events.out.tfevents.1683304360.96105270ada3.197.8 +3 -0
- runs/May05_16-36-18_96105270ada3/1683304580.5996478/events.out.tfevents.1683304580.96105270ada3.197.11 +3 -0
- runs/May05_16-36-18_96105270ada3/events.out.tfevents.1683304580.96105270ada3.197.10 +3 -0
- runs/May05_16-42-03_96105270ada3/1683304926.0094068/events.out.tfevents.1683304926.96105270ada3.197.13 +3 -0
- runs/May05_16-42-03_96105270ada3/events.out.tfevents.1683304926.96105270ada3.197.12 +3 -0
- runs/May05_16-44-00_96105270ada3/1683305042.750123/events.out.tfevents.1683305042.96105270ada3.197.15 +3 -0
- runs/May05_16-44-00_96105270ada3/events.out.tfevents.1683305042.96105270ada3.197.14 +3 -0
- runs/May05_16-46-25_96105270ada3/1683305188.038199/events.out.tfevents.1683305188.96105270ada3.197.17 +3 -0
- runs/May05_16-46-25_96105270ada3/events.out.tfevents.1683305188.96105270ada3.197.16 +3 -0
- runs/May05_16-49-49_96105270ada3/1683305391.6651833/events.out.tfevents.1683305391.96105270ada3.197.19 +3 -0
- runs/May05_16-49-49_96105270ada3/events.out.tfevents.1683305391.96105270ada3.197.18 +3 -0
- runs/May05_16-54-15_96105270ada3/1683305660.27987/events.out.tfevents.1683305660.96105270ada3.11088.1 +3 -0
- runs/May05_16-54-15_96105270ada3/events.out.tfevents.1683305660.96105270ada3.11088.0 +3 -0
- training_args.bin +3 -0
.gitignore
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
checkpoint-*/
|
config.json
ADDED
|
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_name_or_path": "vicgalle/gpt2-alpaca-gpt4",
|
| 3 |
+
"activation_function": "gelu_new",
|
| 4 |
+
"architectures": [
|
| 5 |
+
"GPT2LMHeadModel"
|
| 6 |
+
],
|
| 7 |
+
"attn_pdrop": 0.1,
|
| 8 |
+
"bos_token_id": 50256,
|
| 9 |
+
"embd_pdrop": 0.1,
|
| 10 |
+
"eos_token_id": 50256,
|
| 11 |
+
"initializer_range": 0.02,
|
| 12 |
+
"layer_norm_epsilon": 1e-05,
|
| 13 |
+
"model_type": "gpt2",
|
| 14 |
+
"n_ctx": 1024,
|
| 15 |
+
"n_embd": 768,
|
| 16 |
+
"n_head": 12,
|
| 17 |
+
"n_inner": null,
|
| 18 |
+
"n_layer": 12,
|
| 19 |
+
"n_positions": 1024,
|
| 20 |
+
"reorder_and_upcast_attn": false,
|
| 21 |
+
"resid_pdrop": 0.1,
|
| 22 |
+
"scale_attn_by_inverse_layer_idx": false,
|
| 23 |
+
"scale_attn_weights": true,
|
| 24 |
+
"summary_activation": null,
|
| 25 |
+
"summary_first_dropout": 0.1,
|
| 26 |
+
"summary_proj_to_labels": true,
|
| 27 |
+
"summary_type": "cls_index",
|
| 28 |
+
"summary_use_proj": true,
|
| 29 |
+
"task_specific_params": {
|
| 30 |
+
"text-generation": {
|
| 31 |
+
"do_sample": true,
|
| 32 |
+
"max_length": 50
|
| 33 |
+
}
|
| 34 |
+
},
|
| 35 |
+
"torch_dtype": "float32",
|
| 36 |
+
"transformers_version": "4.28.1",
|
| 37 |
+
"use_cache": false,
|
| 38 |
+
"vocab_size": 50260
|
| 39 |
+
}
|
pytorch_model.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:25a5f0ec2876590c2cca852e26f3ee202202e1abcad4b3ee96ab74f443a8bee0
|
| 3 |
+
size 510407229
|
runs/May05_16-17-31_96105270ada3/1683303460.7343614/events.out.tfevents.1683303460.96105270ada3.197.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d7c89b87aa6c19a13f030885b184a55b71ba401d1d48fefcd1b4ef16daa7db5a
|
| 3 |
+
size 5870
|
runs/May05_16-17-31_96105270ada3/events.out.tfevents.1683303460.96105270ada3.197.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9114d02e74ced463d5627545112c388198efeb2d1d709a4c8270d12e227d2ede
|
| 3 |
+
size 4274
|
runs/May05_16-17-54_96105270ada3/1683303476.6078959/events.out.tfevents.1683303476.96105270ada3.197.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:05704e005a2cd0b6d86793fd1aaa9047e3e227ca806265c582e69d251c180f89
|
| 3 |
+
size 5870
|
runs/May05_16-17-54_96105270ada3/events.out.tfevents.1683303476.96105270ada3.197.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e16608aaa596b2cb67e4f08ed3acb9420558fa65f215ba22b9f78a2abeb4536
|
| 3 |
+
size 4274
|
runs/May05_16-23-35_96105270ada3/1683303817.637306/events.out.tfevents.1683303817.96105270ada3.197.5
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:437f3e7f86ff41ce12e6ade1526b312af8e4351c86af9bfaf58527f40e9a201e
|
| 3 |
+
size 5870
|
runs/May05_16-23-35_96105270ada3/events.out.tfevents.1683303817.96105270ada3.197.4
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa0eb77052a16821bfb80e6e5ff8d7b7975ef53ccc948a1328e272f76daa9217
|
| 3 |
+
size 4274
|
runs/May05_16-27-15_96105270ada3/1683304038.6563365/events.out.tfevents.1683304038.96105270ada3.197.7
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22eb3dc5b926d1b348d1cbb188a0dffb0e6c12b8681dd3bc9cf8141be0f55a22
|
| 3 |
+
size 5870
|
runs/May05_16-27-15_96105270ada3/events.out.tfevents.1683304038.96105270ada3.197.6
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea8367094adafe7b8928ebd7f9265302e89d0b77f8d376d82d76c94f0b3bd6cb
|
| 3 |
+
size 4274
|
runs/May05_16-32-37_96105270ada3/1683304360.2422013/events.out.tfevents.1683304360.96105270ada3.197.9
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2677d7f73df4d2d06dd88739b93508be3337fb27df52cbd29b3ec623bf6f7b07
|
| 3 |
+
size 5870
|
runs/May05_16-32-37_96105270ada3/events.out.tfevents.1683304360.96105270ada3.197.8
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:626d4105661cef3cd31226fa22167f32b5f31ddeaa3e4413d4f4a28e4bd61ed9
|
| 3 |
+
size 4274
|
runs/May05_16-36-18_96105270ada3/1683304580.5996478/events.out.tfevents.1683304580.96105270ada3.197.11
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1101b2339e9bdd1f21cd5ddb78520d6b0cd5dc72a9ad40b23d4770b66050ec1e
|
| 3 |
+
size 5870
|
runs/May05_16-36-18_96105270ada3/events.out.tfevents.1683304580.96105270ada3.197.10
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35f213ee496f09f2ce510267ad337e482e5745b0d777feb0f5e117a87d59e6c0
|
| 3 |
+
size 4274
|
runs/May05_16-42-03_96105270ada3/1683304926.0094068/events.out.tfevents.1683304926.96105270ada3.197.13
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:003c28a42675af0410f8624922fabd7e7bf7e1dd492fafe1e95354e9bee2ced2
|
| 3 |
+
size 5870
|
runs/May05_16-42-03_96105270ada3/events.out.tfevents.1683304926.96105270ada3.197.12
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2500c7a6225a128a56fe8621655b0a0811b865d3514d51d3af1bdba8f9ab395e
|
| 3 |
+
size 4274
|
runs/May05_16-44-00_96105270ada3/1683305042.750123/events.out.tfevents.1683305042.96105270ada3.197.15
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b742fbc51239a7b4f440ed934533562897a6340cfdc6cea53a5c5daded5e3a03
|
| 3 |
+
size 5870
|
runs/May05_16-44-00_96105270ada3/events.out.tfevents.1683305042.96105270ada3.197.14
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:378069f953c925d46986866a8b2a5750b17df626fde6bfd3783c20b0a9995ab0
|
| 3 |
+
size 4274
|
runs/May05_16-46-25_96105270ada3/1683305188.038199/events.out.tfevents.1683305188.96105270ada3.197.17
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed2cd305954c1b6d751589350ef913293e0b71140e50794ee9d6c4fdaa16f9a5
|
| 3 |
+
size 5870
|
runs/May05_16-46-25_96105270ada3/events.out.tfevents.1683305188.96105270ada3.197.16
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7e647ae6f160e00857a082538ff61ff3befb8f47ffdab79ecf6c457a165644c5
|
| 3 |
+
size 4274
|
runs/May05_16-49-49_96105270ada3/1683305391.6651833/events.out.tfevents.1683305391.96105270ada3.197.19
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5b54bd4603d86985d12e6c5e9bd340c92189e5960f0dd04786a4299462f99c73
|
| 3 |
+
size 5870
|
runs/May05_16-49-49_96105270ada3/events.out.tfevents.1683305391.96105270ada3.197.18
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8194e56ad81f16a9c2b613cbad51b527ca0777f6e8dea0246777811da47f39d9
|
| 3 |
+
size 4184
|
runs/May05_16-54-15_96105270ada3/1683305660.27987/events.out.tfevents.1683305660.96105270ada3.11088.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f936cfcf6e67920b539215c00ea51596f69e5108b0015f841e688aedd8c9584
|
| 3 |
+
size 5870
|
runs/May05_16-54-15_96105270ada3/events.out.tfevents.1683305660.96105270ada3.11088.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:346635c30617865aebc76cc1bbc907acf06b28940d3cbbce61ea5c74c190c2fa
|
| 3 |
+
size 4431
|
training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9ba4411cb8a08cd03ebba7e6a99690d7f897a666e5ff0268a59ee707213d551c
|
| 3 |
+
size 3579
|