First model
Browse files
- config.json +27 -0
- merges.txt +65 -0
- pytorch_model.bin +3 -0
- training_args.bin +3 -0
- vocab.json +1 -0
config.json
ADDED
|
@@ -0,0 +1,27 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"architectures": [
|
| 3 |
+
"RobertaForMaskedLM"
|
| 4 |
+
],
|
| 5 |
+
"attention_probs_dropout_prob": 0.1,
|
| 6 |
+
"bos_token_id": 0,
|
| 7 |
+
"classifier_dropout": null,
|
| 8 |
+
"eos_token_id": 2,
|
| 9 |
+
"hidden_act": "gelu",
|
| 10 |
+
"hidden_dropout_prob": 0.1,
|
| 11 |
+
"hidden_size": 768,
|
| 12 |
+
"initializer_range": 0.02,
|
| 13 |
+
"intermediate_size": 3072,
|
| 14 |
+
"layer_norm_eps": 1e-12,
|
| 15 |
+
"max_position_embeddings": 256,
|
| 16 |
+
"model_type": "roberta",
|
| 17 |
+
"num_attention_heads": 12,
|
| 18 |
+
"num_hidden_layer": 6,
|
| 19 |
+
"num_hidden_layers": 12,
|
| 20 |
+
"pad_token_id": 1,
|
| 21 |
+
"position_embedding_type": "absolute",
|
| 22 |
+
"torch_dtype": "float32",
|
| 23 |
+
"transformers_version": "4.25.1",
|
| 24 |
+
"type_vocab_size": 1,
|
| 25 |
+
"use_cache": true,
|
| 26 |
+
"vocab_size": 52000
|
| 27 |
+
}
|
merges.txt
ADDED
|
@@ -0,0 +1,65 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
#version: 0.2 - Trained by `huggingface/tokenizers`
|
| 2 |
+
Ġ E
|
| 3 |
+
Ġ N
|
| 4 |
+
Ġ A
|
| 5 |
+
Ġ I
|
| 6 |
+
Ġ G
|
| 7 |
+
ĠE U
|
| 8 |
+
Ġ D
|
| 9 |
+
Ġ S
|
| 10 |
+
ĠE O
|
| 11 |
+
Ġ O
|
| 12 |
+
Ġ i
|
| 13 |
+
Ġ J
|
| 14 |
+
ĠN G
|
| 15 |
+
Ġ R
|
| 16 |
+
Ġ L
|
| 17 |
+
Ġ U
|
| 18 |
+
Ġ M
|
| 19 |
+
Ġ H
|
| 20 |
+
E O
|
| 21 |
+
Ġ B
|
| 22 |
+
Ġi EO
|
| 23 |
+
Ġ o
|
| 24 |
+
u I
|
| 25 |
+
C H
|
| 26 |
+
CH h
|
| 27 |
+
Ġ t
|
| 28 |
+
Ġ CHh
|
| 29 |
+
Ġ k
|
| 30 |
+
Ġo A
|
| 31 |
+
e uI
|
| 32 |
+
Ġ euI
|
| 33 |
+
ĠD D
|
| 34 |
+
T h
|
| 35 |
+
Ġ Th
|
| 36 |
+
P h
|
| 37 |
+
Ġ Ph
|
| 38 |
+
Ġo E
|
| 39 |
+
K h
|
| 40 |
+
Ġ Kh
|
| 41 |
+
ĠG G
|
| 42 |
+
ĠS S
|
| 43 |
+
Ġi O
|
| 44 |
+
Ġ p
|
| 45 |
+
Ġi U
|
| 46 |
+
ĠJ J
|
| 47 |
+
u EO
|
| 48 |
+
Ġ uEO
|
| 49 |
+
Ġi A
|
| 50 |
+
Ġ uI
|
| 51 |
+
Ġi E
|
| 52 |
+
ĠB B
|
| 53 |
+
i EO
|
| 54 |
+
i U
|
| 55 |
+
i A
|
| 56 |
+
o E
|
| 57 |
+
D D
|
| 58 |
+
i O
|
| 59 |
+
i E
|
| 60 |
+
E U
|
| 61 |
+
G G
|
| 62 |
+
o A
|
| 63 |
+
S S
|
| 64 |
+
B B
|
| 65 |
+
J J
|
pytorch_model.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1785cd19176c71889bf63127694e3167925609ae84627ac3d74345c180bbfed
|
| 3 |
+
size 503402873
|
training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c541bdf6d274e5ced5c1706204468bff371a90f37d2670b7e834f651d4d28d95
|
| 3 |
+
size 3387
|
vocab.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"<s>":0,"<pad>":1,"</s>":2,"<unk>":3,"<mask>":4,"!":5,"\"":6,"#":7,"$":8,"%":9,"&":10,"'":11,"(":12,")":13,"*":14,"+":15,",":16,"-":17,".":18,"/":19,"0":20,"1":21,"2":22,"3":23,"4":24,"5":25,"6":26,"7":27,"8":28,"9":29,":":30,";":31,"<":32,"=":33,">":34,"?":35,"@":36,"A":37,"B":38,"C":39,"D":40,"E":41,"F":42,"G":43,"H":44,"I":45,"J":46,"K":47,"L":48,"M":49,"N":50,"O":51,"P":52,"Q":53,"R":54,"S":55,"T":56,"U":57,"V":58,"W":59,"X":60,"Y":61,"Z":62,"[":63,"\\":64,"]":65,"^":66,"_":67,"`":68,"a":69,"b":70,"c":71,"d":72,"e":73,"f":74,"g":75,"h":76,"i":77,"j":78,"k":79,"l":80,"m":81,"n":82,"o":83,"p":84,"q":85,"r":86,"s":87,"t":88,"u":89,"v":90,"w":91,"x":92,"y":93,"z":94,"{":95,"|":96,"}":97,"~":98,"¡":99,"¢":100,"£":101,"¤":102,"¥":103,"¦":104,"§":105,"¨":106,"©":107,"ª":108,"«":109,"¬":110,"®":111,"¯":112,"°":113,"±":114,"²":115,"³":116,"´":117,"µ":118,"¶":119,"·":120,"¸":121,"¹":122,"º":123,"»":124,"¼":125,"½":126,"¾":127,"¿":128,"À":129,"Á":130,"Â":131,"Ã":132,"Ä":133,"Å":134,"Æ":135,"Ç":136,"È":137,"É":138,"Ê":139,"Ë":140,"Ì":141,"Í":142,"Î":143,"Ï":144,"Ð":145,"Ñ":146,"Ò":147,"Ó":148,"Ô":149,"Õ":150,"Ö":151,"×":152,"Ø":153,"Ù":154,"Ú":155,"Û":156,"Ü":157,"Ý":158,"Þ":159,"ß":160,"à":161,"á":162,"â":163,"ã":164,"ä":165,"å":166,"æ":167,"ç":168,"è":169,"é":170,"ê":171,"ë":172,"ì":173,"í":174,"î":175,"ï":176,"ð":177,"ñ":178,"ò":179,"ó":180,"ô":181,"õ":182,"ö":183,"÷":184,"ø":185,"ù":186,"ú":187,"û":188,"ü":189,"ý":190,"þ":191,"ÿ":192,"Ā":193,"ā":194,"Ă":195,"ă":196,"Ą":197,"ą":198,"Ć":199,"ć":200,"Ĉ":201,"ĉ":202,"Ċ":203,"ċ":204,"Č":205,"č":206,"Ď":207,"ď":208,"Đ":209,"đ":210,"Ē":211,"ē":212,"Ĕ":213,"ĕ":214,"Ė":215,"ė":216,"Ę":217,"ę":218,"Ě":219,"ě":220,"Ĝ":221,"ĝ":222,"Ğ":223,"ğ":224,"Ġ":225,"ġ":226,"Ģ":227,"ģ":228,"Ĥ":229,"ĥ":230,"Ħ":231,"ħ":232,"Ĩ":233,"ĩ":234,"Ī":235,"ī":236,"Ĭ":237,"ĭ":238,"Į":239,"į":240,"İ":241,"ı":242,"Ĳ":243,"ĳ":244,"Ĵ":245,"ĵ":246,"Ķ":247,"ķ":248,"ĸ":249,"Ĺ":250,"ĺ":251,"Ļ":252,"ļ":253,"Ľ":254,"ľ":255,"Ŀ":256,"ŀ":257,"Ł":258,"ł":259,"Ń":260
,"ĠE":261,"ĠN":262,"ĠA":263,"ĠI":264,"ĠG":265,"ĠEU":266,"ĠD":267,"ĠS":268,"ĠEO":269,"ĠO":270,"Ġi":271,"ĠJ":272,"ĠNG":273,"ĠR":274,"ĠL":275,"ĠU":276,"ĠM":277,"ĠH":278,"EO":279,"ĠB":280,"ĠiEO":281,"Ġo":282,"uI":283,"CH":284,"CHh":285,"Ġt":286,"ĠCHh":287,"Ġk":288,"ĠoA":289,"euI":290,"ĠeuI":291,"ĠDD":292,"Th":293,"ĠTh":294,"Ph":295,"ĠPh":296,"ĠoE":297,"Kh":298,"ĠKh":299,"ĠGG":300,"ĠSS":301,"ĠiO":302,"Ġp":303,"ĠiU":304,"ĠJJ":305,"uEO":306,"ĠuEO":307,"ĠiA":308,"ĠuI":309,"ĠiE":310,"ĠBB":311,"iEO":312,"iU":313,"iA":314,"oE":315,"DD":316,"iO":317,"iE":318,"EU":319,"GG":320,"oA":321,"SS":322,"BB":323,"JJ":324}
|