cciboglu committed on
Commit
9477d3d
·
verified ·
1 Parent(s): 406b88e

Training in progress, epoch 1

Browse files
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "[PAD]": 50257
3
+ }
config.json ADDED
@@ -0,0 +1,52 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "xlnet/xlnet-base-cased",
3
+ "architectures": [
4
+ "XLNetForSequenceClassification"
5
+ ],
6
+ "attn_type": "bi",
7
+ "bi_data": false,
8
+ "bos_token_id": 1,
9
+ "clamp_len": -1,
10
+ "d_head": 64,
11
+ "d_inner": 3072,
12
+ "d_model": 768,
13
+ "dropout": 0.1,
14
+ "end_n_top": 5,
15
+ "eos_token_id": 2,
16
+ "ff_activation": "gelu",
17
+ "id2label": {
18
+ "0": "NEGATIVE",
19
+ "1": "POSITIVE"
20
+ },
21
+ "initializer_range": 0.02,
22
+ "label2id": {
23
+ "NEGATIVE": 0,
24
+ "POSITIVE": 1
25
+ },
26
+ "layer_norm_eps": 1e-12,
27
+ "mem_len": null,
28
+ "model_type": "xlnet",
29
+ "n_head": 12,
30
+ "n_layer": 12,
31
+ "pad_token_id": 5,
32
+ "problem_type": "single_label_classification",
33
+ "reuse_len": null,
34
+ "same_length": false,
35
+ "start_n_top": 5,
36
+ "summary_activation": "tanh",
37
+ "summary_last_dropout": 0.1,
38
+ "summary_type": "last",
39
+ "summary_use_proj": true,
40
+ "task_specific_params": {
41
+ "text-generation": {
42
+ "do_sample": true,
43
+ "max_length": 250
44
+ }
45
+ },
46
+ "torch_dtype": "float32",
47
+ "transformers_version": "4.47.1",
48
+ "untie_r": true,
49
+ "use_mems_eval": true,
50
+ "use_mems_train": false,
51
+ "vocab_size": 32000
52
+ }
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:968b368a981f068a1d6ff52e5de60bff258bca36fd19c12fbec830c803cb12d7
3
+ size 469264592
runs/Jan07_20-16-00_halle.cli.ito.cit.tum.de/events.out.tfevents.1736277363.halle.cli.ito.cit.tum.de.4004027.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e8e6c5d4d25934109e9a614f6fa2c103cb93f0e8fa37cd47776958c7aff5fc4c
3
+ size 5764
runs/Jan07_20-19-30_halle.cli.ito.cit.tum.de/events.out.tfevents.1736277579.halle.cli.ito.cit.tum.de.4010916.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da78695da9c4bb1f153f59e037932c356991c6416f8d2d89a6a8833acc5680bb
3
+ size 19325
runs/Jan07_23-01-49_halle.cli.ito.cit.tum.de/events.out.tfevents.1736287309.halle.cli.ito.cit.tum.de.4010916.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5c22b7ad316b5b4908385412fee5b022d119794014a671fb94fda8d1c11e96c
3
+ size 19236
runs/Jan07_23-49-14_halle.cli.ito.cit.tum.de/events.out.tfevents.1736290155.halle.cli.ito.cit.tum.de.4010916.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9cd6b97319054ef62c74557c19df05552023e83a758633c41596a2ec09f163c0
3
+ size 19193
runs/Jan08_00-50-06_halle.cli.ito.cit.tum.de/events.out.tfevents.1736293807.halle.cli.ito.cit.tum.de.4010916.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf34e5aaabfc03c9982b00b2bb712e8d3e150f6f32dad9054f3b0879977f6ec0
3
+ size 19913
runs/Jan08_05-20-22_halle.cli.ito.cit.tum.de/events.out.tfevents.1736310023.halle.cli.ito.cit.tum.de.4010916.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07bb7d6a54dfc88ea8872b22722ff457fa749f25d4a48a65df10016e5ca2b50a
3
+ size 12031
special_tokens_map.json ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<eop>",
4
+ "<eod>"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<cls>",
8
+ "eos_token": "</s>",
9
+ "mask_token": {
10
+ "content": "<mask>",
11
+ "lstrip": true,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ },
16
+ "pad_token": "<pad>",
17
+ "sep_token": "<sep>",
18
+ "unk_token": "<unk>"
19
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,94 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<unk>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<s>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "</s>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "<cls>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "4": {
36
+ "content": "<sep>",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ },
43
+ "5": {
44
+ "content": "<pad>",
45
+ "lstrip": false,
46
+ "normalized": false,
47
+ "rstrip": false,
48
+ "single_word": false,
49
+ "special": true
50
+ },
51
+ "6": {
52
+ "content": "<mask>",
53
+ "lstrip": true,
54
+ "normalized": false,
55
+ "rstrip": false,
56
+ "single_word": false,
57
+ "special": true
58
+ },
59
+ "7": {
60
+ "content": "<eod>",
61
+ "lstrip": false,
62
+ "normalized": false,
63
+ "rstrip": false,
64
+ "single_word": false,
65
+ "special": true
66
+ },
67
+ "8": {
68
+ "content": "<eop>",
69
+ "lstrip": false,
70
+ "normalized": false,
71
+ "rstrip": false,
72
+ "single_word": false,
73
+ "special": true
74
+ }
75
+ },
76
+ "additional_special_tokens": [
77
+ "<eop>",
78
+ "<eod>"
79
+ ],
80
+ "bos_token": "<s>",
81
+ "clean_up_tokenization_spaces": false,
82
+ "cls_token": "<cls>",
83
+ "do_lower_case": false,
84
+ "eos_token": "</s>",
85
+ "extra_special_tokens": {},
86
+ "keep_accents": false,
87
+ "mask_token": "<mask>",
88
+ "model_max_length": 1000000000000000019884624838656,
89
+ "pad_token": "<pad>",
90
+ "remove_space": true,
91
+ "sep_token": "<sep>",
92
+ "tokenizer_class": "XLNetTokenizer",
93
+ "unk_token": "<unk>"
94
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdc0262c12b6c6e7aa28b326da6e03b41dca262a550504d825eea0c08a1b9981
3
+ size 5432
vocab.json ADDED
The diff for this file is too large to render. See raw diff
 
vocab.txt ADDED
The diff for this file is too large to render. See raw diff