Yova committed on
Commit
6ac4300
·
1 Parent(s): 1c8294b

Training in progress, step 800

Browse files
added_tokens.json CHANGED
@@ -1,20 +1,17 @@
1
  {
2
- "<1>": 50,
3
- "<2>": 58,
4
- "<3>": 63,
5
- "<COND>": 57,
6
- "<FUT>": 51,
7
- "<IMP>": 52,
8
- "<IND>": 61,
9
- "<IPFV>": 56,
10
- "<NFIN>": 53,
11
- "<NOM>": 62,
12
- "<PFV>": 59,
13
- "<PL>": 54,
14
- "<POS>": 60,
15
- "<PRS>": 46,
16
- "<PST>": 49,
17
- "<SBJV>": 47,
18
- "<SG>": 55,
19
- "<V>": 48
20
  }
 
1
  {
2
+ "<1>": 51,
3
+ "<2>": 50,
4
+ "<3>": 38,
5
+ "<4>": 48,
6
+ "<GRPL>": 43,
7
+ "<IND>": 45,
8
+ "<IPFV>": 49,
9
+ "<ITER>": 37,
10
+ "<NOM>": 46,
11
+ "<OPT>": 41,
12
+ "<PFV>": 47,
13
+ "<PL>": 44,
14
+ "<PROSP>": 42,
15
+ "<SG>": 40,
16
+ "<V>": 39
 
 
 
17
  }
config.json CHANGED
@@ -8,7 +8,7 @@
8
  "d_model": 256,
9
  "decoder_start_token_id": 1,
10
  "dense_act_fn": "relu",
11
- "dropout_rate": 0.2,
12
  "eos_token_id": 1,
13
  "feed_forward_proj": "relu",
14
  "initializer_factor": 1.0,
@@ -25,5 +25,5 @@
25
  "torch_dtype": "float32",
26
  "transformers_version": "4.35.2",
27
  "use_cache": true,
28
- "vocab_size": 64
29
  }
 
8
  "d_model": 256,
9
  "decoder_start_token_id": 1,
10
  "dense_act_fn": "relu",
11
+ "dropout_rate": 0.3,
12
  "eos_token_id": 1,
13
  "feed_forward_proj": "relu",
14
  "initializer_factor": 1.0,
 
25
  "torch_dtype": "float32",
26
  "transformers_version": "4.35.2",
27
  "use_cache": true,
28
+ "vocab_size": 52
29
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3ac0323be0f2e4a5b3b0acf00201a3946492d0d25189d77fe8ba26bc06fb1466
3
- size 29459544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:002881796d1b6745d1f31eccbe70512b959892f672ae1c6edf81e146c92f575b
3
+ size 29447256
special_tokens_map.json CHANGED
@@ -1,23 +1,20 @@
1
  {
2
  "additional_special_tokens": [
3
- "<PRS>",
4
- "<SBJV>",
5
  "<V>",
6
- "<PST>",
7
- "<1>",
8
- "<FUT>",
9
- "<IMP>",
10
- "<NFIN>",
11
- "<PL>",
12
  "<SG>",
13
- "<IPFV>",
14
- "<COND>",
15
- "<2>",
16
- "<PFV>",
17
- "<POS>",
18
  "<IND>",
19
  "<NOM>",
20
- "<3>"
 
 
 
 
21
  ],
22
  "bos_token": {
23
  "content": "<s>",
 
1
  {
2
  "additional_special_tokens": [
3
+ "<ITER>",
4
+ "<3>",
5
  "<V>",
 
 
 
 
 
 
6
  "<SG>",
7
+ "<OPT>",
8
+ "<PROSP>",
9
+ "<GRPL>",
10
+ "<PL>",
 
11
  "<IND>",
12
  "<NOM>",
13
+ "<PFV>",
14
+ "<4>",
15
+ "<IPFV>",
16
+ "<2>",
17
+ "<1>"
18
  ],
19
  "bos_token": {
20
  "content": "<s>",
tokenizer_config.json CHANGED
@@ -32,23 +32,23 @@
32
  "single_word": false,
33
  "special": true
34
  },
35
- "46": {
36
- "content": "<PRS>",
37
  "lstrip": false,
38
  "normalized": false,
39
  "rstrip": false,
40
  "single_word": false,
41
  "special": true
42
  },
43
- "47": {
44
- "content": "<SBJV>",
45
  "lstrip": false,
46
  "normalized": false,
47
  "rstrip": false,
48
  "single_word": false,
49
  "special": true
50
  },
51
- "48": {
52
  "content": "<V>",
53
  "lstrip": false,
54
  "normalized": false,
@@ -56,47 +56,39 @@
56
  "single_word": false,
57
  "special": true
58
  },
59
- "49": {
60
- "content": "<PST>",
61
- "lstrip": false,
62
- "normalized": false,
63
- "rstrip": false,
64
- "single_word": false,
65
- "special": true
66
- },
67
- "50": {
68
- "content": "<1>",
69
  "lstrip": false,
70
  "normalized": false,
71
  "rstrip": false,
72
  "single_word": false,
73
  "special": true
74
  },
75
- "51": {
76
- "content": "<FUT>",
77
  "lstrip": false,
78
  "normalized": false,
79
  "rstrip": false,
80
  "single_word": false,
81
  "special": true
82
  },
83
- "52": {
84
- "content": "<IMP>",
85
  "lstrip": false,
86
  "normalized": false,
87
  "rstrip": false,
88
  "single_word": false,
89
  "special": true
90
  },
91
- "53": {
92
- "content": "<NFIN>",
93
  "lstrip": false,
94
  "normalized": false,
95
  "rstrip": false,
96
  "single_word": false,
97
  "special": true
98
  },
99
- "54": {
100
  "content": "<PL>",
101
  "lstrip": false,
102
  "normalized": false,
@@ -104,39 +96,23 @@
104
  "single_word": false,
105
  "special": true
106
  },
107
- "55": {
108
- "content": "<SG>",
109
- "lstrip": false,
110
- "normalized": false,
111
- "rstrip": false,
112
- "single_word": false,
113
- "special": true
114
- },
115
- "56": {
116
- "content": "<IPFV>",
117
- "lstrip": false,
118
- "normalized": false,
119
- "rstrip": false,
120
- "single_word": false,
121
- "special": true
122
- },
123
- "57": {
124
- "content": "<COND>",
125
  "lstrip": false,
126
  "normalized": false,
127
  "rstrip": false,
128
  "single_word": false,
129
  "special": true
130
  },
131
- "58": {
132
- "content": "<2>",
133
  "lstrip": false,
134
  "normalized": false,
135
  "rstrip": false,
136
  "single_word": false,
137
  "special": true
138
  },
139
- "59": {
140
  "content": "<PFV>",
141
  "lstrip": false,
142
  "normalized": false,
@@ -144,32 +120,32 @@
144
  "single_word": false,
145
  "special": true
146
  },
147
- "60": {
148
- "content": "<POS>",
149
  "lstrip": false,
150
  "normalized": false,
151
  "rstrip": false,
152
  "single_word": false,
153
  "special": true
154
  },
155
- "61": {
156
- "content": "<IND>",
157
  "lstrip": false,
158
  "normalized": false,
159
  "rstrip": false,
160
  "single_word": false,
161
  "special": true
162
  },
163
- "62": {
164
- "content": "<NOM>",
165
  "lstrip": false,
166
  "normalized": false,
167
  "rstrip": false,
168
  "single_word": false,
169
  "special": true
170
  },
171
- "63": {
172
- "content": "<3>",
173
  "lstrip": false,
174
  "normalized": false,
175
  "rstrip": false,
@@ -178,24 +154,21 @@
178
  }
179
  },
180
  "additional_special_tokens": [
181
- "<PRS>",
182
- "<SBJV>",
183
  "<V>",
184
- "<PST>",
185
- "<1>",
186
- "<FUT>",
187
- "<IMP>",
188
- "<NFIN>",
189
- "<PL>",
190
  "<SG>",
191
- "<IPFV>",
192
- "<COND>",
193
- "<2>",
194
- "<PFV>",
195
- "<POS>",
196
  "<IND>",
197
  "<NOM>",
198
- "<3>"
 
 
 
 
199
  ],
200
  "bos_token": "<s>",
201
  "clean_up_tokenization_spaces": true,
 
32
  "single_word": false,
33
  "special": true
34
  },
35
+ "37": {
36
+ "content": "<ITER>",
37
  "lstrip": false,
38
  "normalized": false,
39
  "rstrip": false,
40
  "single_word": false,
41
  "special": true
42
  },
43
+ "38": {
44
+ "content": "<3>",
45
  "lstrip": false,
46
  "normalized": false,
47
  "rstrip": false,
48
  "single_word": false,
49
  "special": true
50
  },
51
+ "39": {
52
  "content": "<V>",
53
  "lstrip": false,
54
  "normalized": false,
 
56
  "single_word": false,
57
  "special": true
58
  },
59
+ "40": {
60
+ "content": "<SG>",
 
 
 
 
 
 
 
 
61
  "lstrip": false,
62
  "normalized": false,
63
  "rstrip": false,
64
  "single_word": false,
65
  "special": true
66
  },
67
+ "41": {
68
+ "content": "<OPT>",
69
  "lstrip": false,
70
  "normalized": false,
71
  "rstrip": false,
72
  "single_word": false,
73
  "special": true
74
  },
75
+ "42": {
76
+ "content": "<PROSP>",
77
  "lstrip": false,
78
  "normalized": false,
79
  "rstrip": false,
80
  "single_word": false,
81
  "special": true
82
  },
83
+ "43": {
84
+ "content": "<GRPL>",
85
  "lstrip": false,
86
  "normalized": false,
87
  "rstrip": false,
88
  "single_word": false,
89
  "special": true
90
  },
91
+ "44": {
92
  "content": "<PL>",
93
  "lstrip": false,
94
  "normalized": false,
 
96
  "single_word": false,
97
  "special": true
98
  },
99
+ "45": {
100
+ "content": "<IND>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
101
  "lstrip": false,
102
  "normalized": false,
103
  "rstrip": false,
104
  "single_word": false,
105
  "special": true
106
  },
107
+ "46": {
108
+ "content": "<NOM>",
109
  "lstrip": false,
110
  "normalized": false,
111
  "rstrip": false,
112
  "single_word": false,
113
  "special": true
114
  },
115
+ "47": {
116
  "content": "<PFV>",
117
  "lstrip": false,
118
  "normalized": false,
 
120
  "single_word": false,
121
  "special": true
122
  },
123
+ "48": {
124
+ "content": "<4>",
125
  "lstrip": false,
126
  "normalized": false,
127
  "rstrip": false,
128
  "single_word": false,
129
  "special": true
130
  },
131
+ "49": {
132
+ "content": "<IPFV>",
133
  "lstrip": false,
134
  "normalized": false,
135
  "rstrip": false,
136
  "single_word": false,
137
  "special": true
138
  },
139
+ "50": {
140
+ "content": "<2>",
141
  "lstrip": false,
142
  "normalized": false,
143
  "rstrip": false,
144
  "single_word": false,
145
  "special": true
146
  },
147
+ "51": {
148
+ "content": "<1>",
149
  "lstrip": false,
150
  "normalized": false,
151
  "rstrip": false,
 
154
  }
155
  },
156
  "additional_special_tokens": [
157
+ "<ITER>",
158
+ "<3>",
159
  "<V>",
 
 
 
 
 
 
160
  "<SG>",
161
+ "<OPT>",
162
+ "<PROSP>",
163
+ "<GRPL>",
164
+ "<PL>",
 
165
  "<IND>",
166
  "<NOM>",
167
+ "<PFV>",
168
+ "<4>",
169
+ "<IPFV>",
170
+ "<2>",
171
+ "<1>"
172
  ],
173
  "bos_token": "<s>",
174
  "clean_up_tokenization_spaces": true,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d43744df5c002561af0767247b7ee3912b584b6b1941caa4d245f60f01e9ca4
3
  size 4728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b96d5142b9173d25c4281529f4958afca5c57cbcdefc2fa89aee9ad7d213700
3
  size 4728
vocab.json CHANGED
@@ -1 +1 @@
1
- {"y": 0, "\u0153": 1, "d": 2, "s": 3, "i": 4, "\u00fb": 5, "\u00e2": 6, "x": 7, "'": 8, "\u00e9": 9, "\u00f4": 10, "m": 11, "e": 12, "g": 13, "\u00e7": 14, "N": 15, "j": 16, " ": 17, "v": 18, "a": 19, "u": 20, "\u00ee": 21, "h": 22, "c": 23, "f": 24, "l": 25, "w": 26, "k": 27, "o": 28, "n": 29, "\u00eb": 30, "\u00ef": 31, "\u00fc": 32, "b": 33, "\u1e63": 34, "\u00e8": 35, "-": 36, "z": 37, "r": 38, "q": 39, "t": 40, "p": 41}
 
1
+ {"\u0105": 0, "z": 1, "y": 2, "s": 3, " ": 4, "m": 5, "k": 6, "l": 7, "\u0119": 8, "i": 9, "b": 10, "j": 11, "n": 12, "d": 13, "\u012f": 14, "\u0301": 15, "w": 16, "t": 17, "\u02bc": 18, "\u01eb": 19, "o": 20, "\u00ed": 21, "a": 22, "c": 23, "h": 24, "\u0142": 25, "g": 26, "\u00f3": 27, "\u0144": 28, "\u00e9": 29, "e": 30, "\u00e1": 31, "x": 32}