mokcho commited on
Commit
b079a61
·
verified ·
1 Parent(s): 35c041c

Delete Gallo_Italian-DEP/Generalize/UD_French-ParTUT-UD_Italian-MarkIT

Browse files
Generalize/UD_French-ParTUT-UD_Italian-MarkIT/all_results.json DELETED
@@ -1,8 +0,0 @@
1
- {
2
- "epoch": 20.0,
3
- "total_flos": 5526978466959360.0,
4
- "train_loss": 274.4749375,
5
- "train_runtime": 632.4869,
6
- "train_samples_per_second": 50.404,
7
- "train_steps_per_second": 0.791
8
- }
 
 
 
 
 
 
 
 
 
Generalize/UD_French-ParTUT-UD_Italian-MarkIT/config.json DELETED
@@ -1,187 +0,0 @@
1
- {
2
- "_name_or_path": "bert-base-multilingual-cased",
3
- "adapters": {
4
- "adapters": {},
5
- "config_map": {},
6
- "fusion_config_map": {},
7
- "fusion_name_map": {},
8
- "fusions": {}
9
- },
10
- "architectures": [
11
- "BertAdapterGeneralizeModel"
12
- ],
13
- "attention_probs_dropout_prob": 0.1,
14
- "classifier_dropout": null,
15
- "directionality": "bidi",
16
- "hidden_act": "gelu",
17
- "hidden_dropout_prob": 0.1,
18
- "hidden_size": 768,
19
- "id2label": {
20
- "0": "_",
21
- "1": "acl",
22
- "2": "advcl",
23
- "3": "advmod",
24
- "4": "amod",
25
- "5": "appos",
26
- "6": "aux",
27
- "7": "case",
28
- "8": "cc",
29
- "9": "ccomp",
30
- "10": "clf",
31
- "11": "compound",
32
- "12": "conj",
33
- "13": "cop",
34
- "14": "csubj",
35
- "15": "dep",
36
- "16": "det",
37
- "17": "discourse",
38
- "18": "dislocated",
39
- "19": "expl",
40
- "20": "fixed",
41
- "21": "flat",
42
- "22": "goeswith",
43
- "23": "iobj",
44
- "24": "list",
45
- "25": "mark",
46
- "26": "nmod",
47
- "27": "nsubj",
48
- "28": "nummod",
49
- "29": "obj",
50
- "30": "obl",
51
- "31": "orphan",
52
- "32": "parataxis",
53
- "33": "punct",
54
- "34": "reparandum",
55
- "35": "root",
56
- "36": "vocative",
57
- "37": "xcomp",
58
- "38": "dup",
59
- "39": "mwe",
60
- "40": "name",
61
- "41": "remnant"
62
- },
63
- "initializer_range": 0.02,
64
- "intermediate_size": 3072,
65
- "label2id": {
66
- "_": 0,
67
- "acl": 1,
68
- "advcl": 2,
69
- "advmod": 3,
70
- "amod": 4,
71
- "appos": 5,
72
- "aux": 6,
73
- "case": 7,
74
- "cc": 8,
75
- "ccomp": 9,
76
- "clf": 10,
77
- "compound": 11,
78
- "conj": 12,
79
- "cop": 13,
80
- "csubj": 14,
81
- "dep": 15,
82
- "det": 16,
83
- "discourse": 17,
84
- "dislocated": 18,
85
- "dup": 38,
86
- "expl": 19,
87
- "fixed": 20,
88
- "flat": 21,
89
- "goeswith": 22,
90
- "iobj": 23,
91
- "list": 24,
92
- "mark": 25,
93
- "mwe": 39,
94
- "name": 40,
95
- "nmod": 26,
96
- "nsubj": 27,
97
- "nummod": 28,
98
- "obj": 29,
99
- "obl": 30,
100
- "orphan": 31,
101
- "parataxis": 32,
102
- "punct": 33,
103
- "remnant": 41,
104
- "reparandum": 34,
105
- "root": 35,
106
- "vocative": 36,
107
- "xcomp": 37
108
- },
109
- "layer_norm_eps": 1e-12,
110
- "max_position_embeddings": 512,
111
- "model_type": "bert",
112
- "num_attention_heads": 12,
113
- "num_hidden_layers": 12,
114
- "pad_token_id": 0,
115
- "pooler_fc_size": 768,
116
- "pooler_num_attention_heads": 12,
117
- "pooler_num_fc_layers": 3,
118
- "pooler_size_per_head": 128,
119
- "pooler_type": "first_token_transform",
120
- "position_embedding_type": "absolute",
121
- "prediction_heads": {
122
- "default": {
123
- "activation_function": "gelu",
124
- "bias": true,
125
- "embedding_size": 768,
126
- "head_type": "masked_lm",
127
- "label2id": null,
128
- "layer_norm": true,
129
- "layers": 2,
130
- "shift_labels": false,
131
- "vocab_size": 119547
132
- },
133
- "ud_Italian-MarkIT": {
134
- "head_type": "dependency_parsing",
135
- "label2id": {
136
- "_": 0,
137
- "acl": 1,
138
- "advcl": 2,
139
- "advmod": 3,
140
- "amod": 4,
141
- "appos": 5,
142
- "aux": 6,
143
- "case": 7,
144
- "cc": 8,
145
- "ccomp": 9,
146
- "clf": 10,
147
- "compound": 11,
148
- "conj": 12,
149
- "cop": 13,
150
- "csubj": 14,
151
- "dep": 15,
152
- "det": 16,
153
- "discourse": 17,
154
- "dislocated": 18,
155
- "dup": 38,
156
- "expl": 19,
157
- "fixed": 20,
158
- "flat": 21,
159
- "goeswith": 22,
160
- "iobj": 23,
161
- "list": 24,
162
- "mark": 25,
163
- "mwe": 39,
164
- "name": 40,
165
- "nmod": 26,
166
- "nsubj": 27,
167
- "nummod": 28,
168
- "obj": 29,
169
- "obl": 30,
170
- "orphan": 31,
171
- "parataxis": 32,
172
- "punct": 33,
173
- "remnant": 41,
174
- "reparandum": 34,
175
- "root": 35,
176
- "vocative": 36,
177
- "xcomp": 37
178
- },
179
- "num_labels": 42
180
- }
181
- },
182
- "torch_dtype": "float32",
183
- "transformers_version": "4.47.1",
184
- "type_vocab_size": 2,
185
- "use_cache": true,
186
- "vocab_size": 119547
187
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Generalize/UD_French-ParTUT-UD_Italian-MarkIT/model.safetensors DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:83333756e0c9bbf24e54eac8225004b43cd218ee2c459be38182dd9da12bff28
3
- size 820332780
 
 
 
 
Generalize/UD_French-ParTUT-UD_Italian-MarkIT/train_results.json DELETED
@@ -1,8 +0,0 @@
1
- {
2
- "epoch": 20.0,
3
- "total_flos": 5526978466959360.0,
4
- "train_loss": 274.4749375,
5
- "train_runtime": 632.4869,
6
- "train_samples_per_second": 50.404,
7
- "train_steps_per_second": 0.791
8
- }
 
 
 
 
 
 
 
 
 
Generalize/UD_French-ParTUT-UD_Italian-MarkIT/trainer_state.json DELETED
@@ -1,189 +0,0 @@
1
- {
2
- "best_metric": null,
3
- "best_model_checkpoint": null,
4
- "epoch": 20.0,
5
- "eval_steps": 500,
6
- "global_step": 500,
7
- "is_hyper_param_search": false,
8
- "is_local_process_zero": true,
9
- "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 1.0,
13
- "eval_loss": 0.8605439912441165,
14
- "las": 78.37542254921456,
15
- "step": 25,
16
- "uas": 83.10797375223703
17
- },
18
- {
19
- "epoch": 2.0,
20
- "eval_loss": 0.8715260832808739,
21
- "las": 81.23881487373235,
22
- "step": 50,
23
- "uas": 85.99125074567509
24
- },
25
- {
26
- "epoch": 3.0,
27
- "eval_loss": 0.7943321466445923,
28
- "las": 82.9389540664148,
29
- "step": 75,
30
- "uas": 87.19427321535096
31
- },
32
- {
33
- "epoch": 4.0,
34
- "eval_loss": 0.8268451780773872,
35
- "las": 83.53549413402267,
36
- "step": 100,
37
- "uas": 87.75104394511831
38
- },
39
- {
40
- "epoch": 5.0,
41
- "eval_loss": 0.8672095509462578,
42
- "las": 83.65480214754425,
43
- "step": 125,
44
- "uas": 87.64167826605687
45
- },
46
- {
47
- "epoch": 6.0,
48
- "eval_loss": 0.8780410338279813,
49
- "las": 83.60509047524359,
50
- "step": 150,
51
- "uas": 87.72121694173792
52
- },
53
- {
54
- "epoch": 7.0,
55
- "eval_loss": 0.8944749922253364,
56
- "las": 83.82382183336648,
57
- "step": 175,
58
- "uas": 87.8405249552595
59
- },
60
- {
61
- "epoch": 8.0,
62
- "eval_loss": 0.8979702058226563,
63
- "las": 83.98289918472858,
64
- "step": 200,
65
- "uas": 87.9697753032412
66
- },
67
- {
68
- "epoch": 9.0,
69
- "eval_loss": 0.9090941423593566,
70
- "las": 84.12209186717041,
71
- "step": 225,
72
- "uas": 88.08908331676277
73
- },
74
- {
75
- "epoch": 10.0,
76
- "eval_loss": 0.9286551801271217,
77
- "las": 83.95307218134818,
78
- "step": 250,
79
- "uas": 87.9399482998608
80
- },
81
- {
82
- "epoch": 11.0,
83
- "eval_loss": 0.9500270187854767,
84
- "las": 82.96878106979518,
85
- "step": 275,
86
- "uas": 87.57208192483596
87
- },
88
- {
89
- "epoch": 12.0,
90
- "eval_loss": 0.9293884170609851,
91
- "las": 81.50725790415589,
92
- "step": 300,
93
- "uas": 86.23980910717836
94
- },
95
- {
96
- "epoch": 13.0,
97
- "eval_loss": 1.0011215362437935,
98
- "las": 83.35653211374031,
99
- "step": 325,
100
- "uas": 87.64167826605687
101
- },
102
- {
103
- "epoch": 14.0,
104
- "eval_loss": 0.9906252109727194,
105
- "las": 83.59514814078346,
106
- "step": 350,
107
- "uas": 87.91012129648041
108
- },
109
- {
110
- "epoch": 15.0,
111
- "eval_loss": 1.0156649240227633,
112
- "las": 83.59514814078346,
113
- "step": 375,
114
- "uas": 87.76098627957845
115
- },
116
- {
117
- "epoch": 16.0,
118
- "eval_loss": 1.0199621541555537,
119
- "las": 83.8337641678266,
120
- "step": 400,
121
- "uas": 88.0990256512229
122
- },
123
- {
124
- "epoch": 17.0,
125
- "eval_loss": 1.0884958824446036,
126
- "las": 83.82382183336648,
127
- "step": 425,
128
- "uas": 87.9697753032412
129
- },
130
- {
131
- "epoch": 18.0,
132
- "eval_loss": 1.0988125412963157,
133
- "las": 83.99284151918872,
134
- "step": 450,
135
- "uas": 88.18850666136409
136
- },
137
- {
138
- "epoch": 19.0,
139
- "eval_loss": 1.105759042640065,
140
- "las": 83.96301451580831,
141
- "step": 475,
142
- "uas": 88.19844899582422
143
- },
144
- {
145
- "epoch": 20.0,
146
- "grad_norm": 81.63844299316406,
147
- "learning_rate": 0.0,
148
- "loss": 274.4749,
149
- "step": 500
150
- },
151
- {
152
- "epoch": 20.0,
153
- "eval_loss": 1.1056630902512128,
154
- "las": 83.95307218134818,
155
- "step": 500,
156
- "uas": 88.18850666136409
157
- },
158
- {
159
- "epoch": 20.0,
160
- "step": 500,
161
- "total_flos": 5526978466959360.0,
162
- "train_loss": 274.4749375,
163
- "train_runtime": 632.4869,
164
- "train_samples_per_second": 50.404,
165
- "train_steps_per_second": 0.791
166
- }
167
- ],
168
- "logging_steps": 500,
169
- "max_steps": 500,
170
- "num_input_tokens_seen": 0,
171
- "num_train_epochs": 20,
172
- "save_steps": 500,
173
- "stateful_callbacks": {
174
- "TrainerControl": {
175
- "args": {
176
- "should_epoch_stop": false,
177
- "should_evaluate": false,
178
- "should_log": false,
179
- "should_save": true,
180
- "should_training_stop": true
181
- },
182
- "attributes": {}
183
- }
184
- },
185
- "total_flos": 5526978466959360.0,
186
- "train_batch_size": 64,
187
- "trial_name": null,
188
- "trial_params": null
189
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
Generalize/UD_French-ParTUT-UD_Italian-MarkIT/training_args.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:590fd532282ffc222acd6fbbf4ccb0c95501199d8d127bc40aefe06a2b091a04
3
- size 5432