cciboglu commited on
Commit
08f8d26
·
verified ·
1 Parent(s): 84ee0ad

Training in progress, epoch 1

Browse files
Files changed (31) hide show
  1. added_tokens.json +3 -0
  2. config.json +48 -0
  3. merges.txt +0 -0
  4. model.safetensors +3 -0
  5. runs/Jan07_20-16-00_halle.cli.ito.cit.tum.de/events.out.tfevents.1736277363.halle.cli.ito.cit.tum.de.4004027.0 +3 -0
  6. runs/Jan07_20-19-30_halle.cli.ito.cit.tum.de/events.out.tfevents.1736277579.halle.cli.ito.cit.tum.de.4010916.0 +3 -0
  7. runs/Jan07_23-01-49_halle.cli.ito.cit.tum.de/events.out.tfevents.1736287309.halle.cli.ito.cit.tum.de.4010916.1 +3 -0
  8. runs/Jan07_23-49-14_halle.cli.ito.cit.tum.de/events.out.tfevents.1736290155.halle.cli.ito.cit.tum.de.4010916.2 +3 -0
  9. runs/Jan08_00-50-06_halle.cli.ito.cit.tum.de/events.out.tfevents.1736293807.halle.cli.ito.cit.tum.de.4010916.3 +3 -0
  10. runs/Jan08_05-20-22_halle.cli.ito.cit.tum.de/events.out.tfevents.1736310023.halle.cli.ito.cit.tum.de.4010916.4 +3 -0
  11. runs/Jan08_08-30-55_halle.cli.ito.cit.tum.de/events.out.tfevents.1736321455.halle.cli.ito.cit.tum.de.4010916.5 +3 -0
  12. runs/Jan08_11-27-18_halle.cli.ito.cit.tum.de/events.out.tfevents.1736332039.halle.cli.ito.cit.tum.de.4010916.6 +3 -0
  13. runs/Jan08_12-45-05_halle.cli.ito.cit.tum.de/events.out.tfevents.1736336706.halle.cli.ito.cit.tum.de.4010916.7 +3 -0
  14. runs/Jan08_14-31-14_halle.cli.ito.cit.tum.de/events.out.tfevents.1736343075.halle.cli.ito.cit.tum.de.4010916.8 +3 -0
  15. runs/Jan08_17-47-36_halle.cli.ito.cit.tum.de/events.out.tfevents.1736354856.halle.cli.ito.cit.tum.de.4010916.9 +3 -0
  16. runs/Jan08_20-48-43_halle.cli.ito.cit.tum.de/events.out.tfevents.1736365724.halle.cli.ito.cit.tum.de.2306818.0 +3 -0
  17. runs/Jan08_21-49-45_halle.cli.ito.cit.tum.de/events.out.tfevents.1736369386.halle.cli.ito.cit.tum.de.2306818.1 +3 -0
  18. runs/Jan08_23-18-57_halle.cli.ito.cit.tum.de/events.out.tfevents.1736374738.halle.cli.ito.cit.tum.de.2306818.2 +3 -0
  19. runs/Jan09_04-55-19_halle.cli.ito.cit.tum.de/events.out.tfevents.1736394920.halle.cli.ito.cit.tum.de.2306818.3 +3 -0
  20. runs/Jan09_07-49-20_halle.cli.ito.cit.tum.de/events.out.tfevents.1736405360.halle.cli.ito.cit.tum.de.2306818.4 +3 -0
  21. runs/Jan09_10-14-32_halle.cli.ito.cit.tum.de/events.out.tfevents.1736414074.halle.cli.ito.cit.tum.de.2306818.5 +3 -0
  22. runs/Jan09_11-27-26_halle.cli.ito.cit.tum.de/events.out.tfevents.1736418447.halle.cli.ito.cit.tum.de.2306818.6 +3 -0
  23. runs/Jan09_13-45-31_halle.cli.ito.cit.tum.de/events.out.tfevents.1736426732.halle.cli.ito.cit.tum.de.3948144.0 +3 -0
  24. runs/Jan09_14-12-06_halle.cli.ito.cit.tum.de/events.out.tfevents.1736428327.halle.cli.ito.cit.tum.de.4003704.0 +3 -0
  25. runs/Jan09_17-39-26_halle.cli.ito.cit.tum.de/events.out.tfevents.1736440767.halle.cli.ito.cit.tum.de.4003704.1 +3 -0
  26. special_tokens_map.json +12 -0
  27. tokenizer.json +0 -0
  28. tokenizer_config.json +29 -0
  29. training_args.bin +3 -0
  30. vocab.json +0 -0
  31. vocab.txt +0 -0
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "[PAD]": 50257
3
+ }
config.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "openai-community/gpt2",
3
+ "activation_function": "gelu_new",
4
+ "architectures": [
5
+ "GPT2ForSequenceClassification"
6
+ ],
7
+ "attn_pdrop": 0.1,
8
+ "bos_token_id": 50256,
9
+ "embd_pdrop": 0.1,
10
+ "eos_token_id": 50256,
11
+ "id2label": {
12
+ "0": "NEGATIVE",
13
+ "1": "POSITIVE"
14
+ },
15
+ "initializer_range": 0.02,
16
+ "label2id": {
17
+ "NEGATIVE": 0,
18
+ "POSITIVE": 1
19
+ },
20
+ "layer_norm_epsilon": 1e-05,
21
+ "model_type": "gpt2",
22
+ "n_ctx": 1024,
23
+ "n_embd": 768,
24
+ "n_head": 12,
25
+ "n_inner": null,
26
+ "n_layer": 12,
27
+ "n_positions": 1024,
28
+ "problem_type": "single_label_classification",
29
+ "reorder_and_upcast_attn": false,
30
+ "resid_pdrop": 0.1,
31
+ "scale_attn_by_inverse_layer_idx": false,
32
+ "scale_attn_weights": true,
33
+ "summary_activation": null,
34
+ "summary_first_dropout": 0.1,
35
+ "summary_proj_to_labels": true,
36
+ "summary_type": "cls_index",
37
+ "summary_use_proj": true,
38
+ "task_specific_params": {
39
+ "text-generation": {
40
+ "do_sample": true,
41
+ "max_length": 50
42
+ }
43
+ },
44
+ "torch_dtype": "float32",
45
+ "transformers_version": "4.47.1",
46
+ "use_cache": true,
47
+ "vocab_size": 50258
48
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40ba0c831a02a2ab7aca6956a7dbef41aad9a5021a9d57d676dba543063c041e
3
+ size 497783504
runs/Jan07_20-16-00_halle.cli.ito.cit.tum.de/events.out.tfevents.1736277363.halle.cli.ito.cit.tum.de.4004027.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8e6c5d4d25934109e9a614f6fa2c103cb93f0e8fa37cd47776958c7aff5fc4c
3
+ size 5764
runs/Jan07_20-19-30_halle.cli.ito.cit.tum.de/events.out.tfevents.1736277579.halle.cli.ito.cit.tum.de.4010916.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da78695da9c4bb1f153f59e037932c356991c6416f8d2d89a6a8833acc5680bb
3
+ size 19325
runs/Jan07_23-01-49_halle.cli.ito.cit.tum.de/events.out.tfevents.1736287309.halle.cli.ito.cit.tum.de.4010916.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5c22b7ad316b5b4908385412fee5b022d119794014a671fb94fda8d1c11e96c
3
+ size 19236
runs/Jan07_23-49-14_halle.cli.ito.cit.tum.de/events.out.tfevents.1736290155.halle.cli.ito.cit.tum.de.4010916.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cd6b97319054ef62c74557c19df05552023e83a758633c41596a2ec09f163c0
3
+ size 19193
runs/Jan08_00-50-06_halle.cli.ito.cit.tum.de/events.out.tfevents.1736293807.halle.cli.ito.cit.tum.de.4010916.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf34e5aaabfc03c9982b00b2bb712e8d3e150f6f32dad9054f3b0879977f6ec0
3
+ size 19913
runs/Jan08_05-20-22_halle.cli.ito.cit.tum.de/events.out.tfevents.1736310023.halle.cli.ito.cit.tum.de.4010916.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d817b625e4fd78a9ca1faf404d4838c91083ebbf019cd38ff19a921e59b8b9d0
3
+ size 19324
runs/Jan08_08-30-55_halle.cli.ito.cit.tum.de/events.out.tfevents.1736321455.halle.cli.ito.cit.tum.de.4010916.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fd8f5a87fe334e759a8e6231d93a80036ed06326f910eaf1c4f09e2c1d3282a
3
+ size 19087
runs/Jan08_11-27-18_halle.cli.ito.cit.tum.de/events.out.tfevents.1736332039.halle.cli.ito.cit.tum.de.4010916.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:365533f175611ccde9925ffa081b76b510f213cdeb32496b664a65a490b4db1c
3
+ size 18970
runs/Jan08_12-45-05_halle.cli.ito.cit.tum.de/events.out.tfevents.1736336706.halle.cli.ito.cit.tum.de.4010916.7 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5a8cea5457a5e5bbc38c08795cdc9e919653568984b08a21ce28dee23ca3a420
3
+ size 19077
runs/Jan08_14-31-14_halle.cli.ito.cit.tum.de/events.out.tfevents.1736343075.halle.cli.ito.cit.tum.de.4010916.8 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8bdaf6f32003834183f5980e62e5a325e3f0e79ec87f2c2c51303e4cbcbb61b
3
+ size 22555
runs/Jan08_17-47-36_halle.cli.ito.cit.tum.de/events.out.tfevents.1736354856.halle.cli.ito.cit.tum.de.4010916.9 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6387a42e205ed3104d955cdd306c22faf9b12eef6ab665c046f4ab881661d474
3
+ size 10406
runs/Jan08_20-48-43_halle.cli.ito.cit.tum.de/events.out.tfevents.1736365724.halle.cli.ito.cit.tum.de.2306818.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f7770b87540b22c1481b2dc45fdf7a714133b2ffd5d1c64575bdc5142c10a96
3
+ size 22466
runs/Jan08_21-49-45_halle.cli.ito.cit.tum.de/events.out.tfevents.1736369386.halle.cli.ito.cit.tum.de.2306818.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27b27ecd4499216871d40d00e46ab5c692213b0cc71c046a03a0c2fd05dcd302
3
+ size 22423
runs/Jan08_23-18-57_halle.cli.ito.cit.tum.de/events.out.tfevents.1736374738.halle.cli.ito.cit.tum.de.2306818.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56a3ad3fc4e22dcc40e9989d280bbfdad96d9a85b0ff8381a8b64ed90e372473
3
+ size 23143
runs/Jan09_04-55-19_halle.cli.ito.cit.tum.de/events.out.tfevents.1736394920.halle.cli.ito.cit.tum.de.2306818.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2614a3e3e05206cebe9d8253f6002be69b814ca80b451494c733cae56e711c0
3
+ size 22554
runs/Jan09_07-49-20_halle.cli.ito.cit.tum.de/events.out.tfevents.1736405360.halle.cli.ito.cit.tum.de.2306818.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3cd8bd4dacb2aafb8328502dcffd9f5f3cad667671981b66cf1ff6d4908fea29
3
+ size 22317
runs/Jan09_10-14-32_halle.cli.ito.cit.tum.de/events.out.tfevents.1736414074.halle.cli.ito.cit.tum.de.2306818.5 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25e80ece145134cf7df13bf84024d0587c4b7ca77906e347d90aa73464403c33
3
+ size 22200
runs/Jan09_11-27-26_halle.cli.ito.cit.tum.de/events.out.tfevents.1736418447.halle.cli.ito.cit.tum.de.2306818.6 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:099b92fd83d4f7d1ca6cc165c61439ae891ffc555f5dc2be7692fe116dc9e8ef
3
+ size 16296
runs/Jan09_13-45-31_halle.cli.ito.cit.tum.de/events.out.tfevents.1736426732.halle.cli.ito.cit.tum.de.3948144.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8e0fb8d7ef156fd12ed7e5d8c5ebe12c52d8b21a8e2c100788743fb95c34a795
3
+ size 5429
runs/Jan09_14-12-06_halle.cli.ito.cit.tum.de/events.out.tfevents.1736428327.halle.cli.ito.cit.tum.de.4003704.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bef185a99ab5a36e3f418866760685c29a4532e2240a0527e3390fa3e6a5111
3
+ size 22307
runs/Jan09_17-39-26_halle.cli.ito.cit.tum.de/events.out.tfevents.1736440767.halle.cli.ito.cit.tum.de.4003704.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9dd39df767dbef6fce783e117720b5ccbb0ec4fffee1905bb3c81d179c1cf0bb
3
+ size 12452
special_tokens_map.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<|endoftext|>",
3
+ "eos_token": "<|endoftext|>",
4
+ "pad_token": {
5
+ "content": "[PAD]",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false
10
+ },
11
+ "unk_token": "<|endoftext|>"
12
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "50256": {
5
+ "content": "<|endoftext|>",
6
+ "lstrip": false,
7
+ "normalized": true,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "50257": {
13
+ "content": "[PAD]",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ }
20
+ },
21
+ "bos_token": "<|endoftext|>",
22
+ "clean_up_tokenization_spaces": false,
23
+ "eos_token": "<|endoftext|>",
24
+ "extra_special_tokens": {},
25
+ "model_max_length": 1024,
26
+ "pad_token": "[PAD]",
27
+ "tokenizer_class": "GPT2Tokenizer",
28
+ "unk_token": "<|endoftext|>"
29
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b7acf1afa75a1756746b7fda58410fc01f6b8afde8cce274c3dabe2c17835ad
3
+ size 5432
vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
vocab.txt ADDED
The diff for this file is too large to render. See raw diff