ULFBERTO committed on
Commit
9e2facb
·
verified ·
1 Parent(s): 8fc9655

Upload folder using huggingface_hub

Browse files
Files changed (5) hide show
  1. .gitattributes +1 -0
  2. README.md +47 -0
  3. config.json +9 -0
  4. model.keras +3 -0
  5. vocab.json +448 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ model.keras filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ language: es
3
+ tags:
4
+ - text-generation
5
+ - gpt
6
+ - tensorflow
7
+ - don-quijote
8
+ license: mit
9
+ ---
10
+
11
+ # GPT OxideLLM_5M
12
+
13
+ Modelo de lenguaje tipo GPT entrenado desde cero con el texto de Don Quijote de la Mancha.
14
+
15
+ ## Configuración del modelo
16
+
17
+ - **Vocabulario**: 221 caracteres
18
+ - **Dimensión del modelo (d_model)**: 256
19
+ - **Número de cabezas de atención**: 4
20
+ - **Dimensión feedforward (dff)**: 512
21
+ - **Número de capas**: 4
22
+ - **Longitud máxima de secuencia**: 128
23
+
24
+ ## Uso
25
+
26
+ ```python
27
+ from huggingface_hub import snapshot_download
28
+ import tensorflow as tf
29
+ import json
30
+
31
+ # Descargar modelo
32
+ model_path = snapshot_download(repo_id="ULFBERTO/OxideLLM_5M")
33
+
34
+ # Cargar vocabulario
35
+ with open(f"{model_path}/vocab.json", "r", encoding="utf-8") as f:
36
+     vocab_data = json.load(f)
37
+
38
+ char2idx = vocab_data["char2idx"]
39
+ idx2char = {int(k): v for k, v in vocab_data["idx2char"].items()}
40
+
41
+ # Cargar modelo
42
+ model = tf.keras.models.load_model(f"{model_path}/model.keras")
43
+ ```
44
+
45
+ ## Entrenamiento
46
+
47
+ Entrenado con TensorFlow 2.x usando arquitectura Transformer (decoder-only).
config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "vocab_size": 221,
3
+ "d_model": 256,
4
+ "num_heads": 4,
5
+ "dff": 512,
6
+ "num_layers": 4,
7
+ "max_len": 128,
8
+ "dropout": 0.1
9
+ }
model.keras ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f950d22dc92e1e46b8709f5b4fcdb8b2ba1016c30a9dbfb1c219e30345ec6c2
3
+ size 65170584
vocab.json ADDED
@@ -0,0 +1,448 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "char2idx": {
3
+ "\n": 0,
4
+ " ": 1,
5
+ "!": 2,
6
+ "\"": 3,
7
+ "#": 4,
8
+ "$": 5,
9
+ "%": 6,
10
+ "&": 7,
11
+ "'": 8,
12
+ "(": 9,
13
+ ")": 10,
14
+ "*": 11,
15
+ "+": 12,
16
+ ",": 13,
17
+ "-": 14,
18
+ ".": 15,
19
+ "/": 16,
20
+ "0": 17,
21
+ "1": 18,
22
+ "2": 19,
23
+ "3": 20,
24
+ "4": 21,
25
+ "5": 22,
26
+ "6": 23,
27
+ "7": 24,
28
+ "8": 25,
29
+ "9": 26,
30
+ ":": 27,
31
+ ";": 28,
32
+ "<": 29,
33
+ "=": 30,
34
+ ">": 31,
35
+ "?": 32,
36
+ "A": 33,
37
+ "B": 34,
38
+ "C": 35,
39
+ "D": 36,
40
+ "E": 37,
41
+ "F": 38,
42
+ "G": 39,
43
+ "H": 40,
44
+ "I": 41,
45
+ "J": 42,
46
+ "K": 43,
47
+ "L": 44,
48
+ "M": 45,
49
+ "N": 46,
50
+ "O": 47,
51
+ "P": 48,
52
+ "Q": 49,
53
+ "R": 50,
54
+ "S": 51,
55
+ "T": 52,
56
+ "U": 53,
57
+ "V": 54,
58
+ "W": 55,
59
+ "X": 56,
60
+ "Y": 57,
61
+ "Z": 58,
62
+ "[": 59,
63
+ "]": 60,
64
+ "^": 61,
65
+ "_": 62,
66
+ "a": 63,
67
+ "b": 64,
68
+ "c": 65,
69
+ "d": 66,
70
+ "e": 67,
71
+ "f": 68,
72
+ "g": 69,
73
+ "h": 70,
74
+ "i": 71,
75
+ "j": 72,
76
+ "k": 73,
77
+ "l": 74,
78
+ "m": 75,
79
+ "n": 76,
80
+ "o": 77,
81
+ "p": 78,
82
+ "q": 79,
83
+ "r": 80,
84
+ "s": 81,
85
+ "t": 82,
86
+ "u": 83,
87
+ "v": 84,
88
+ "w": 85,
89
+ "x": 86,
90
+ "y": 87,
91
+ "z": 88,
92
+ "|": 89,
93
+ "}": 90,
94
+ "¡": 91,
95
+ "£": 92,
96
+ "§": 93,
97
+ "©": 94,
98
+ "ª": 95,
99
+ "«": 96,
100
+ "°": 97,
101
+ "´": 98,
102
+ "·": 99,
103
+ "º": 100,
104
+ "»": 101,
105
+ "½": 102,
106
+ "¾": 103,
107
+ "¿": 104,
108
+ "Á": 105,
109
+ "Â": 106,
110
+ "Æ": 107,
111
+ "Ç": 108,
112
+ "È": 109,
113
+ "É": 110,
114
+ "Ê": 111,
115
+ "Í": 112,
116
+ "Î": 113,
117
+ "Ñ": 114,
118
+ "Ó": 115,
119
+ "Ú": 116,
120
+ "Ü": 117,
121
+ "à": 118,
122
+ "á": 119,
123
+ "â": 120,
124
+ "ä": 121,
125
+ "æ": 122,
126
+ "ç": 123,
127
+ "è": 124,
128
+ "é": 125,
129
+ "ê": 126,
130
+ "ë": 127,
131
+ "ì": 128,
132
+ "í": 129,
133
+ "î": 130,
134
+ "ï": 131,
135
+ "ñ": 132,
136
+ "ò": 133,
137
+ "ó": 134,
138
+ "ô": 135,
139
+ "ö": 136,
140
+ "ù": 137,
141
+ "ú": 138,
142
+ "û": 139,
143
+ "ü": 140,
144
+ "ā": 141,
145
+ "ē": 142,
146
+ "ě": 143,
147
+ "ī": 144,
148
+ "ō": 145,
149
+ "Œ": 146,
150
+ "œ": 147,
151
+ "̃": 148,
152
+ "Δ": 149,
153
+ "Ο": 150,
154
+ "Π": 151,
155
+ "Τ": 152,
156
+ "Φ": 153,
157
+ "ά": 154,
158
+ "έ": 155,
159
+ "ί": 156,
160
+ "α": 157,
161
+ "β": 158,
162
+ "γ": 159,
163
+ "δ": 160,
164
+ "ε": 161,
165
+ "η": 162,
166
+ "θ": 163,
167
+ "ι": 164,
168
+ "κ": 165,
169
+ "λ": 166,
170
+ "μ": 167,
171
+ "ν": 168,
172
+ "ξ": 169,
173
+ "ο": 170,
174
+ "π": 171,
175
+ "ρ": 172,
176
+ "ς": 173,
177
+ "σ": 174,
178
+ "τ": 175,
179
+ "υ": 176,
180
+ "χ": 177,
181
+ "ω": 178,
182
+ "ό": 179,
183
+ "ύ": 180,
184
+ "ώ": 181,
185
+ "ἀ": 182,
186
+ "ἄ": 183,
187
+ "ἐ": 184,
188
+ "ἔ": 185,
189
+ "ἠ": 186,
190
+ "ἡ": 187,
191
+ "ἤ": 188,
192
+ "ἦ": 189,
193
+ "ἰ": 190,
194
+ "ἵ": 191,
195
+ "ἶ": 192,
196
+ "ὁ": 193,
197
+ "ὄ": 194,
198
+ "ὅ": 195,
199
+ "ὐ": 196,
200
+ "ὑ": 197,
201
+ "ὰ": 198,
202
+ "ὲ": 199,
203
+ "ὴ": 200,
204
+ "ὶ": 201,
205
+ "ὸ": 202,
206
+ "ὺ": 203,
207
+ "ᾶ": 204,
208
+ "᾽": 205,
209
+ "ῆ": 206,
210
+ "ῖ": 207,
211
+ "ῦ": 208,
212
+ "ῶ": 209,
213
+ " ": 210,
214
+ "–": 211,
215
+ "—": 212,
216
+ "‘": 213,
217
+ "’": 214,
218
+ "“": 215,
219
+ "”": 216,
220
+ "′": 217,
221
+ "⅓": 218,
222
+ "○": 219,
223
+ "●": 220
224
+ },
225
+ "idx2char": {
226
+ "0": "\n",
227
+ "1": " ",
228
+ "2": "!",
229
+ "3": "\"",
230
+ "4": "#",
231
+ "5": "$",
232
+ "6": "%",
233
+ "7": "&",
234
+ "8": "'",
235
+ "9": "(",
236
+ "10": ")",
237
+ "11": "*",
238
+ "12": "+",
239
+ "13": ",",
240
+ "14": "-",
241
+ "15": ".",
242
+ "16": "/",
243
+ "17": "0",
244
+ "18": "1",
245
+ "19": "2",
246
+ "20": "3",
247
+ "21": "4",
248
+ "22": "5",
249
+ "23": "6",
250
+ "24": "7",
251
+ "25": "8",
252
+ "26": "9",
253
+ "27": ":",
254
+ "28": ";",
255
+ "29": "<",
256
+ "30": "=",
257
+ "31": ">",
258
+ "32": "?",
259
+ "33": "A",
260
+ "34": "B",
261
+ "35": "C",
262
+ "36": "D",
263
+ "37": "E",
264
+ "38": "F",
265
+ "39": "G",
266
+ "40": "H",
267
+ "41": "I",
268
+ "42": "J",
269
+ "43": "K",
270
+ "44": "L",
271
+ "45": "M",
272
+ "46": "N",
273
+ "47": "O",
274
+ "48": "P",
275
+ "49": "Q",
276
+ "50": "R",
277
+ "51": "S",
278
+ "52": "T",
279
+ "53": "U",
280
+ "54": "V",
281
+ "55": "W",
282
+ "56": "X",
283
+ "57": "Y",
284
+ "58": "Z",
285
+ "59": "[",
286
+ "60": "]",
287
+ "61": "^",
288
+ "62": "_",
289
+ "63": "a",
290
+ "64": "b",
291
+ "65": "c",
292
+ "66": "d",
293
+ "67": "e",
294
+ "68": "f",
295
+ "69": "g",
296
+ "70": "h",
297
+ "71": "i",
298
+ "72": "j",
299
+ "73": "k",
300
+ "74": "l",
301
+ "75": "m",
302
+ "76": "n",
303
+ "77": "o",
304
+ "78": "p",
305
+ "79": "q",
306
+ "80": "r",
307
+ "81": "s",
308
+ "82": "t",
309
+ "83": "u",
310
+ "84": "v",
311
+ "85": "w",
312
+ "86": "x",
313
+ "87": "y",
314
+ "88": "z",
315
+ "89": "|",
316
+ "90": "}",
317
+ "91": "¡",
318
+ "92": "£",
319
+ "93": "§",
320
+ "94": "©",
321
+ "95": "ª",
322
+ "96": "«",
323
+ "97": "°",
324
+ "98": "´",
325
+ "99": "·",
326
+ "100": "º",
327
+ "101": "»",
328
+ "102": "½",
329
+ "103": "¾",
330
+ "104": "¿",
331
+ "105": "Á",
332
+ "106": "Â",
333
+ "107": "Æ",
334
+ "108": "Ç",
335
+ "109": "È",
336
+ "110": "É",
337
+ "111": "Ê",
338
+ "112": "Í",
339
+ "113": "Î",
340
+ "114": "Ñ",
341
+ "115": "Ó",
342
+ "116": "Ú",
343
+ "117": "Ü",
344
+ "118": "à",
345
+ "119": "á",
346
+ "120": "â",
347
+ "121": "ä",
348
+ "122": "æ",
349
+ "123": "ç",
350
+ "124": "è",
351
+ "125": "é",
352
+ "126": "ê",
353
+ "127": "ë",
354
+ "128": "ì",
355
+ "129": "í",
356
+ "130": "î",
357
+ "131": "ï",
358
+ "132": "ñ",
359
+ "133": "ò",
360
+ "134": "ó",
361
+ "135": "ô",
362
+ "136": "ö",
363
+ "137": "ù",
364
+ "138": "ú",
365
+ "139": "û",
366
+ "140": "ü",
367
+ "141": "ā",
368
+ "142": "ē",
369
+ "143": "ě",
370
+ "144": "ī",
371
+ "145": "ō",
372
+ "146": "Œ",
373
+ "147": "œ",
374
+ "148": "̃",
375
+ "149": "Δ",
376
+ "150": "Ο",
377
+ "151": "Π",
378
+ "152": "Τ",
379
+ "153": "Φ",
380
+ "154": "ά",
381
+ "155": "έ",
382
+ "156": "ί",
383
+ "157": "α",
384
+ "158": "β",
385
+ "159": "γ",
386
+ "160": "δ",
387
+ "161": "ε",
388
+ "162": "η",
389
+ "163": "θ",
390
+ "164": "ι",
391
+ "165": "κ",
392
+ "166": "λ",
393
+ "167": "μ",
394
+ "168": "ν",
395
+ "169": "ξ",
396
+ "170": "ο",
397
+ "171": "π",
398
+ "172": "ρ",
399
+ "173": "ς",
400
+ "174": "σ",
401
+ "175": "τ",
402
+ "176": "υ",
403
+ "177": "χ",
404
+ "178": "ω",
405
+ "179": "ό",
406
+ "180": "ύ",
407
+ "181": "ώ",
408
+ "182": "ἀ",
409
+ "183": "ἄ",
410
+ "184": "ἐ",
411
+ "185": "ἔ",
412
+ "186": "ἠ",
413
+ "187": "ἡ",
414
+ "188": "ἤ",
415
+ "189": "ἦ",
416
+ "190": "ἰ",
417
+ "191": "ἵ",
418
+ "192": "ἶ",
419
+ "193": "ὁ",
420
+ "194": "ὄ",
421
+ "195": "ὅ",
422
+ "196": "ὐ",
423
+ "197": "ὑ",
424
+ "198": "ὰ",
425
+ "199": "ὲ",
426
+ "200": "ὴ",
427
+ "201": "ὶ",
428
+ "202": "ὸ",
429
+ "203": "ὺ",
430
+ "204": "ᾶ",
431
+ "205": "᾽",
432
+ "206": "ῆ",
433
+ "207": "ῖ",
434
+ "208": "ῦ",
435
+ "209": "ῶ",
436
+ "210": " ",
437
+ "211": "–",
438
+ "212": "—",
439
+ "213": "‘",
440
+ "214": "’",
441
+ "215": "“",
442
+ "216": "”",
443
+ "217": "′",
444
+ "218": "⅓",
445
+ "219": "○",
446
+ "220": "●"
447
+ }
448
+ }