BETO_3d / config.json
ismaelardo's picture
se sube el primer modelo
191d237
{
"_name_or_path": "dccuchile/bert-base-spanish-wwm-uncased",
"architectures": [
"BertForSequenceClassification"
],
"attention_probs_dropout_prob": 0.1,
"classifier_dropout": null,
"gradient_checkpointing": false,
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": 121,
"1": 122,
"2": 132,
"3": 133,
"4": 134,
"5": 141,
"6": 142,
"7": 214,
"8": 215,
"9": 216,
"10": 221,
"11": 222,
"12": 224,
"13": 231,
"14": 233,
"15": 234,
"16": 235,
"17": 241,
"18": 242,
"19": 243,
"20": 251,
"21": 252,
"22": 263,
"23": 311,
"24": 312,
"25": 322,
"26": 325,
"27": 331,
"28": 332,
"29": 333,
"30": 334,
"31": 343,
"32": 351,
"33": 361,
"34": 411,
"35": 421,
"36": 422,
"37": 431,
"38": 432,
"39": 441,
"40": 512,
"41": 522,
"42": 523,
"43": 524,
"44": 541,
"45": 712,
"46": 723,
"47": 741,
"48": 742,
"49": 818,
"50": 832,
"51": 833,
"52": 834,
"53": 911,
"54": 932,
"55": 933,
"56": 941,
"57": 962
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"LABEL_0": 0,
"LABEL_1": 1,
"LABEL_10": 10,
"LABEL_11": 11,
"LABEL_12": 12,
"LABEL_13": 13,
"LABEL_14": 14,
"LABEL_15": 15,
"LABEL_16": 16,
"LABEL_17": 17,
"LABEL_18": 18,
"LABEL_19": 19,
"LABEL_2": 2,
"LABEL_20": 20,
"LABEL_21": 21,
"LABEL_22": 22,
"LABEL_23": 23,
"LABEL_24": 24,
"LABEL_25": 25,
"LABEL_26": 26,
"LABEL_27": 27,
"LABEL_28": 28,
"LABEL_29": 29,
"LABEL_3": 3,
"LABEL_30": 30,
"LABEL_31": 31,
"LABEL_32": 32,
"LABEL_33": 33,
"LABEL_34": 34,
"LABEL_35": 35,
"LABEL_36": 36,
"LABEL_37": 37,
"LABEL_38": 38,
"LABEL_39": 39,
"LABEL_4": 4,
"LABEL_40": 40,
"LABEL_41": 41,
"LABEL_42": 42,
"LABEL_43": 43,
"LABEL_44": 44,
"LABEL_45": 45,
"LABEL_46": 46,
"LABEL_47": 47,
"LABEL_48": 48,
"LABEL_49": 49,
"LABEL_5": 5,
"LABEL_50": 50,
"LABEL_51": 51,
"LABEL_52": 52,
"LABEL_53": 53,
"LABEL_54": 54,
"LABEL_55": 55,
"LABEL_56": 56,
"LABEL_57": 57,
"LABEL_6": 6,
"LABEL_7": 7,
"LABEL_8": 8,
"LABEL_9": 9
},
"layer_norm_eps": 1e-12,
"max_position_embeddings": 512,
"model_type": "bert",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"output_past": true,
"pad_token_id": 1,
"position_embedding_type": "absolute",
"problem_type": "single_label_classification",
"torch_dtype": "float32",
"transformers_version": "4.11.0.dev0",
"type_vocab_size": 2,
"use_cache": true,
"vocab_size": 31002
}