np-cr committed on
Commit
73ec8b6
·
verified ·
1 Parent(s): 494d7cb

Upload folder using huggingface_hub

Browse files
config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_sliding_window_pattern": 6,
3
+ "architectures": [
4
+ "Gemma3ForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "attn_logit_softcapping": null,
9
+ "bos_token_id": 2,
10
+ "cache_implementation": "hybrid",
11
+ "dtype": "bfloat16",
12
+ "eos_token_id": [
13
+ 1,
14
+ 106
15
+ ],
16
+ "final_logit_softcapping": null,
17
+ "head_dim": 16,
18
+ "hidden_activation": "gelu_pytorch_tanh",
19
+ "hidden_size": 64,
20
+ "initializer_range": 0.02,
21
+ "intermediate_size": 128,
22
+ "layer_types": [
23
+ "sliding_attention",
24
+ "full_attention"
25
+ ],
26
+ "max_position_embeddings": 32768,
27
+ "model_type": "gemma3_text",
28
+ "num_attention_heads": 4,
29
+ "num_hidden_layers": 2,
30
+ "num_key_value_heads": 1,
31
+ "pad_token_id": 0,
32
+ "query_pre_attn_scalar": 256,
33
+ "rms_norm_eps": 1e-06,
34
+ "rope_local_base_freq": 10000,
35
+ "rope_scaling": null,
36
+ "rope_theta": 1000000,
37
+ "sliding_window": 512,
38
+ "sliding_window_pattern": 6,
39
+ "transformers_version": "4.57.6",
40
+ "use_bidirectional_attention": false,
41
+ "use_cache": true,
42
+ "vocab_size": 51
43
+ }
generation_config.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 2,
4
+ "cache_implementation": "hybrid",
5
+ "eos_token_id": [
6
+ 1,
7
+ 106
8
+ ],
9
+ "pad_token_id": 0,
10
+ "transformers_version": "4.57.6"
11
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f08266076a1c2c2647aaf00f08b9dca60af72a05923ccf5443d22d7d93f23375
3
+ size 149976
special_tokens_map.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<bos>",
3
+ "eos_token": "<eos>",
4
+ "pad_token": "<pad>",
5
+ "unk_token": "<unk>"
6
+ }
tokenizer.json ADDED
@@ -0,0 +1,237 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "1.0",
3
+ "truncation": null,
4
+ "padding": null,
5
+ "added_tokens": [
6
+ {
7
+ "id": 0,
8
+ "content": "<pad>",
9
+ "single_word": false,
10
+ "lstrip": false,
11
+ "rstrip": false,
12
+ "normalized": false,
13
+ "special": true
14
+ },
15
+ {
16
+ "id": 1,
17
+ "content": "<eos>",
18
+ "single_word": false,
19
+ "lstrip": false,
20
+ "rstrip": false,
21
+ "normalized": false,
22
+ "special": true
23
+ },
24
+ {
25
+ "id": 2,
26
+ "content": "<bos>",
27
+ "single_word": false,
28
+ "lstrip": false,
29
+ "rstrip": false,
30
+ "normalized": false,
31
+ "special": true
32
+ },
33
+ {
34
+ "id": 3,
35
+ "content": "<unk>",
36
+ "single_word": false,
37
+ "lstrip": false,
38
+ "rstrip": false,
39
+ "normalized": false,
40
+ "special": true
41
+ }
42
+ ],
43
+ "normalizer": null,
44
+ "pre_tokenizer": {
45
+ "type": "ByteLevel",
46
+ "add_prefix_space": false,
47
+ "trim_offsets": true,
48
+ "use_regex": true
49
+ },
50
+ "post_processor": null,
51
+ "decoder": null,
52
+ "model": {
53
+ "type": "BPE",
54
+ "dropout": null,
55
+ "unk_token": null,
56
+ "continuing_subword_prefix": null,
57
+ "end_of_word_suffix": null,
58
+ "fuse_unk": false,
59
+ "byte_fallback": false,
60
+ "ignore_merges": false,
61
+ "vocab": {
62
+ "<pad>": 0,
63
+ "<eos>": 1,
64
+ "<bos>": 2,
65
+ "<unk>": 3,
66
+ "a": 4,
67
+ "d": 5,
68
+ "e": 6,
69
+ "f": 7,
70
+ "h": 8,
71
+ "i": 9,
72
+ "k": 10,
73
+ "l": 11,
74
+ "n": 12,
75
+ "o": 13,
76
+ "r": 14,
77
+ "s": 15,
78
+ "t": 16,
79
+ "w": 17,
80
+ "y": 18,
81
+ "z": 19,
82
+ "Ġ": 20,
83
+ "Ġt": 21,
84
+ "or": 22,
85
+ "at": 23,
86
+ "dat": 24,
87
+ "el": 25,
88
+ "en": 26,
89
+ "er": 27,
90
+ "es": 28,
91
+ "for": 29,
92
+ "hel": 30,
93
+ "in": 31,
94
+ "iz": 32,
95
+ "ken": 33,
96
+ "ld": 34,
97
+ "lo": 35,
98
+ "oken": 36,
99
+ "wor": 37,
100
+ "Ġdat": 38,
101
+ "Ġfor": 39,
102
+ "Ġwor": 40,
103
+ "Ġtes": 41,
104
+ "Ġtin": 42,
105
+ "Ġtoken": 43,
106
+ "hello": 44,
107
+ "izer": 45,
108
+ "Ġdata": 46,
109
+ "Ġworld": 47,
110
+ "Ġtest": 48,
111
+ "Ġtiny": 49,
112
+ "Ġtokenizer": 50
113
+ },
114
+ "merges": [
115
+ [
116
+ "Ġ",
117
+ "t"
118
+ ],
119
+ [
120
+ "o",
121
+ "r"
122
+ ],
123
+ [
124
+ "a",
125
+ "t"
126
+ ],
127
+ [
128
+ "d",
129
+ "at"
130
+ ],
131
+ [
132
+ "e",
133
+ "l"
134
+ ],
135
+ [
136
+ "e",
137
+ "n"
138
+ ],
139
+ [
140
+ "e",
141
+ "r"
142
+ ],
143
+ [
144
+ "e",
145
+ "s"
146
+ ],
147
+ [
148
+ "f",
149
+ "or"
150
+ ],
151
+ [
152
+ "h",
153
+ "el"
154
+ ],
155
+ [
156
+ "i",
157
+ "n"
158
+ ],
159
+ [
160
+ "i",
161
+ "z"
162
+ ],
163
+ [
164
+ "k",
165
+ "en"
166
+ ],
167
+ [
168
+ "l",
169
+ "d"
170
+ ],
171
+ [
172
+ "l",
173
+ "o"
174
+ ],
175
+ [
176
+ "o",
177
+ "ken"
178
+ ],
179
+ [
180
+ "w",
181
+ "or"
182
+ ],
183
+ [
184
+ "Ġ",
185
+ "dat"
186
+ ],
187
+ [
188
+ "Ġ",
189
+ "for"
190
+ ],
191
+ [
192
+ "Ġ",
193
+ "wor"
194
+ ],
195
+ [
196
+ "Ġt",
197
+ "es"
198
+ ],
199
+ [
200
+ "Ġt",
201
+ "in"
202
+ ],
203
+ [
204
+ "Ġt",
205
+ "oken"
206
+ ],
207
+ [
208
+ "hel",
209
+ "lo"
210
+ ],
211
+ [
212
+ "iz",
213
+ "er"
214
+ ],
215
+ [
216
+ "Ġdat",
217
+ "a"
218
+ ],
219
+ [
220
+ "Ġwor",
221
+ "ld"
222
+ ],
223
+ [
224
+ "Ġtes",
225
+ "t"
226
+ ],
227
+ [
228
+ "Ġtin",
229
+ "y"
230
+ ],
231
+ [
232
+ "Ġtoken",
233
+ "izer"
234
+ ]
235
+ ]
236
+ }
237
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "<pad>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "1": {
12
+ "content": "<eos>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "2": {
20
+ "content": "<bos>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "3": {
28
+ "content": "<unk>",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ }
35
+ },
36
+ "bos_token": "<bos>",
37
+ "clean_up_tokenization_spaces": false,
38
+ "eos_token": "<eos>",
39
+ "extra_special_tokens": {},
40
+ "model_max_length": 1000000000000000019884624838656,
41
+ "pad_token": "<pad>",
42
+ "tokenizer_class": "PreTrainedTokenizerFast",
43
+ "unk_token": "<unk>"
44
+ }