Floncer committed on
Commit
fc75e01
·
verified ·
1 Parent(s): 126e0e0

Upload 5 files

Browse files
Files changed (5) hide show
  1. config.json +35 -10
  2. generation_config.json +10 -9
  3. model.safetensors +2 -2
  4. tokenizer.json +2 -266
  5. tokenizer_config.json +12 -12
config.json CHANGED
@@ -1,10 +1,35 @@
1
- {
2
- "vocab_size": 504,
3
- "n_embd": 256,
4
- "n_layer": 2,
5
- "n_head": 4,
6
- "n_positions": 128,
7
- "n_ctx": 128,
8
- "model_type": "gpt2",
9
- "architectures": ["GPT2LMHeadModel"]
10
- }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation_function": "gelu_new",
3
+ "add_cross_attention": false,
4
+ "architectures": [
5
+ "GPT2LMHeadModel"
6
+ ],
7
+ "attn_pdrop": 0.1,
8
+ "bos_token_id": 50256,
9
+ "dtype": "float32",
10
+ "embd_pdrop": 0.1,
11
+ "eos_token_id": 50256,
12
+ "initializer_range": 0.02,
13
+ "layer_norm_epsilon": 1e-05,
14
+ "model_type": "gpt2",
15
+ "n_ctx": 1024,
16
+ "n_embd": 192,
17
+ "n_head": 6,
18
+ "n_inner": 768,
19
+ "n_layer": 6,
20
+ "n_positions": 1024,
21
+ "pad_token_id": 50256,
22
+ "reorder_and_upcast_attn": false,
23
+ "resid_pdrop": 0.1,
24
+ "scale_attn_by_inverse_layer_idx": false,
25
+ "scale_attn_weights": true,
26
+ "summary_activation": null,
27
+ "summary_first_dropout": 0.1,
28
+ "summary_proj_to_labels": true,
29
+ "summary_type": "cls_index",
30
+ "summary_use_proj": true,
31
+ "tie_word_embeddings": true,
32
+ "transformers_version": "5.1.0",
33
+ "use_cache": true,
34
+ "vocab_size": 50257
35
+ }
generation_config.json CHANGED
@@ -1,9 +1,10 @@
1
- {
2
- "_from_model_config": true,
3
- "bos_token_id": 50256,
4
- "eos_token_id": 50256,
5
- "output_attentions": false,
6
- "output_hidden_states": false,
7
- "transformers_version": "5.0.0",
8
- "use_cache": true
9
- }
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 50256,
4
+ "eos_token_id": 50256,
5
+ "output_attentions": false,
6
+ "output_hidden_states": false,
7
+ "pad_token_id": 50256,
8
+ "transformers_version": "5.1.0",
9
+ "use_cache": true
10
+ }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edb4644bf494930130be80b5286f72dfa172d700843179eb22ca989d1c5d3f08
3
- size 57945776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a56202162e5f5f086634e65e6b20e716dd72d518009047e64b33e2dfa4e75978
3
+ size 50069480
tokenizer.json CHANGED
@@ -1,19 +1,7 @@
1
  {
2
  "version": "1.0",
3
- "truncation": {
4
- "direction": "Right",
5
- "max_length": 16,
6
- "strategy": "LongestFirst",
7
- "stride": 0
8
- },
9
- "padding": {
10
- "strategy": "BatchLongest",
11
- "direction": "Right",
12
- "pad_to_multiple_of": null,
13
- "pad_id": 50284,
14
- "pad_type_id": 0,
15
- "pad_token": "[PAD]"
16
- },
17
  "added_tokens": [
18
  {
19
  "id": 50256,
@@ -23,258 +11,6 @@
23
  "rstrip": false,
24
  "normalized": true,
25
  "special": true
26
- },
27
- {
28
- "id": 50257,
29
- "content": "когда",
30
- "single_word": false,
31
- "lstrip": false,
32
- "rstrip": false,
33
- "normalized": true,
34
- "special": false
35
- },
36
- {
37
- "id": 50258,
38
- "content": "человек",
39
- "single_word": false,
40
- "lstrip": false,
41
- "rstrip": false,
42
- "normalized": true,
43
- "special": false
44
- },
45
- {
46
- "id": 50259,
47
- "content": "они",
48
- "single_word": false,
49
- "lstrip": false,
50
- "rstrip": false,
51
- "normalized": true,
52
- "special": false
53
- },
54
- {
55
- "id": 50260,
56
- "content": "дом",
57
- "single_word": false,
58
- "lstrip": false,
59
- "rstrip": false,
60
- "normalized": true,
61
- "special": false
62
- },
63
- {
64
- "id": 50261,
65
- "content": "мы",
66
- "single_word": false,
67
- "lstrip": false,
68
- "rstrip": false,
69
- "normalized": true,
70
- "special": false
71
- },
72
- {
73
- "id": 50262,
74
- "content": "кот",
75
- "single_word": false,
76
- "lstrip": false,
77
- "rstrip": false,
78
- "normalized": true,
79
- "special": false
80
- },
81
- {
82
- "id": 50263,
83
- "content": "как",
84
- "single_word": false,
85
- "lstrip": false,
86
- "rstrip": false,
87
- "normalized": true,
88
- "special": false
89
- },
90
- {
91
- "id": 50264,
92
- "content": "дела",
93
- "single_word": false,
94
- "lstrip": false,
95
- "rstrip": false,
96
- "normalized": true,
97
- "special": false
98
- },
99
- {
100
- "id": 50265,
101
- "content": "солнце",
102
- "single_word": false,
103
- "lstrip": false,
104
- "rstrip": false,
105
- "normalized": true,
106
- "special": false
107
- },
108
- {
109
- "id": 50266,
110
- "content": "вы",
111
- "single_word": false,
112
- "lstrip": false,
113
- "rstrip": false,
114
- "normalized": true,
115
- "special": false
116
- },
117
- {
118
- "id": 50267,
119
- "content": "привет",
120
- "single_word": false,
121
- "lstrip": false,
122
- "rstrip": false,
123
- "normalized": true,
124
- "special": false
125
- },
126
- {
127
- "id": 50268,
128
- "content": "да",
129
- "single_word": false,
130
- "lstrip": false,
131
- "rstrip": false,
132
- "normalized": true,
133
- "special": false
134
- },
135
- {
136
- "id": 50269,
137
- "content": "что",
138
- "single_word": false,
139
- "lstrip": false,
140
- "rstrip": false,
141
- "normalized": true,
142
- "special": false
143
- },
144
- {
145
- "id": 50270,
146
- "content": "она",
147
- "single_word": false,
148
- "lstrip": false,
149
- "rstrip": false,
150
- "normalized": true,
151
- "special": false
152
- },
153
- {
154
- "id": 50271,
155
- "content": "друг",
156
- "single_word": false,
157
- "lstrip": false,
158
- "rstrip": false,
159
- "normalized": true,
160
- "special": false
161
- },
162
- {
163
- "id": 50272,
164
- "content": "ты",
165
- "single_word": false,
166
- "lstrip": false,
167
- "rstrip": false,
168
- "normalized": true,
169
- "special": false
170
- },
171
- {
172
- "id": 50273,
173
- "content": "плохо",
174
- "single_word": false,
175
- "lstrip": false,
176
- "rstrip": false,
177
- "normalized": true,
178
- "special": false
179
- },
180
- {
181
- "id": 50274,
182
- "content": "любовь",
183
- "single_word": false,
184
- "lstrip": false,
185
- "rstrip": false,
186
- "normalized": true,
187
- "special": false
188
- },
189
- {
190
- "id": 50275,
191
- "content": "где",
192
- "single_word": false,
193
- "lstrip": false,
194
- "rstrip": false,
195
- "normalized": true,
196
- "special": false
197
- },
198
- {
199
- "id": 50276,
200
- "content": "собака",
201
- "single_word": false,
202
- "lstrip": false,
203
- "rstrip": false,
204
- "normalized": true,
205
- "special": false
206
- },
207
- {
208
- "id": 50277,
209
- "content": "кто",
210
- "single_word": false,
211
- "lstrip": false,
212
- "rstrip": false,
213
- "normalized": true,
214
- "special": false
215
- },
216
- {
217
- "id": 50278,
218
- "content": "он",
219
- "single_word": false,
220
- "lstrip": false,
221
- "rstrip": false,
222
- "normalized": true,
223
- "special": false
224
- },
225
- {
226
- "id": 50279,
227
- "content": "хорошо",
228
- "single_word": false,
229
- "lstrip": false,
230
- "rstrip": false,
231
- "normalized": true,
232
- "special": false
233
- },
234
- {
235
- "id": 50280,
236
- "content": "нет",
237
- "single_word": false,
238
- "lstrip": false,
239
- "rstrip": false,
240
- "normalized": true,
241
- "special": false
242
- },
243
- {
244
- "id": 50281,
245
- "content": "я",
246
- "single_word": false,
247
- "lstrip": false,
248
- "rstrip": false,
249
- "normalized": true,
250
- "special": false
251
- },
252
- {
253
- "id": 50282,
254
- "content": "пока",
255
- "single_word": false,
256
- "lstrip": false,
257
- "rstrip": false,
258
- "normalized": true,
259
- "special": false
260
- },
261
- {
262
- "id": 50283,
263
- "content": "мир",
264
- "single_word": false,
265
- "lstrip": false,
266
- "rstrip": false,
267
- "normalized": true,
268
- "special": false
269
- },
270
- {
271
- "id": 50284,
272
- "content": "[PAD]",
273
- "single_word": false,
274
- "lstrip": false,
275
- "rstrip": false,
276
- "normalized": false,
277
- "special": true
278
  }
279
  ],
280
  "normalizer": null,
 
1
  {
2
  "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
 
 
 
 
 
 
 
 
 
 
 
 
5
  "added_tokens": [
6
  {
7
  "id": 50256,
 
11
  "rstrip": false,
12
  "normalized": true,
13
  "special": true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
14
  }
15
  ],
16
  "normalizer": null,
tokenizer_config.json CHANGED
@@ -1,12 +1,12 @@
1
- {
2
- "add_prefix_space": false,
3
- "backend": "tokenizers",
4
- "bos_token": "<|endoftext|>",
5
- "eos_token": "<|endoftext|>",
6
- "errors": "replace",
7
- "is_local": false,
8
- "model_max_length": 1024,
9
- "pad_token": "[PAD]",
10
- "tokenizer_class": "GPT2Tokenizer",
11
- "unk_token": "<|endoftext|>"
12
- }
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "backend": "tokenizers",
4
+ "bos_token": "<|endoftext|>",
5
+ "eos_token": "<|endoftext|>",
6
+ "errors": "replace",
7
+ "is_local": false,
8
+ "model_max_length": 1024,
9
+ "pad_token": "<|endoftext|>",
10
+ "tokenizer_class": "GPT2Tokenizer",
11
+ "unk_token": "<|endoftext|>"
12
+ }