cca-distilbert / config.json
lgsilvaesilva's picture
Upload BertForSequenceClassification
9405d5b verified
{
"architectures": [
"BertForSequenceClassification"
],
"attention_probs_dropout_prob": 0.1,
"classifier_dropout": null,
"directionality": "bidi",
"dtype": "float32",
"hidden_act": "gelu",
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "1.1.1",
"1": "1.1.2",
"2": "1.1.3",
"3": "1.1.4",
"4": "1.1.5",
"5": "1.1.6",
"6": "1.1.7",
"7": "1.2.1",
"8": "1.2.2",
"9": "1.2.3",
"10": "1.2.4",
"11": "1.2.5",
"12": "1.2.6",
"13": "1.2.7",
"14": "1.2.8",
"15": "1.2.9",
"16": "1.3.1",
"17": "1.3.2",
"18": "1.3.3",
"19": "1.4.1",
"20": "1.4.2",
"21": "1.4.3",
"22": "1.4.4",
"23": "1.5.1",
"24": "2.1.1",
"25": "2.1.2",
"26": "2.2.1",
"27": "2.2.2",
"28": "2.3.1",
"29": "2.3.2",
"30": "2.3.3",
"31": "2.3.4",
"32": "2.4.1",
"33": "2.4.2",
"34": "2.4.3",
"35": "2.4.4",
"36": "2.4.5",
"37": "2.5.1",
"38": "2.5.2",
"39": "3.1.1",
"40": "3.1.2",
"41": "3.1.3",
"42": "3.2.1",
"43": "3.2.2",
"44": "3.3.1",
"45": "3.3.2",
"46": "3.3.3",
"47": "3.3.4",
"48": "3.4.1",
"49": "3.4.2",
"50": "4.1.1",
"51": "4.1.2",
"52": "4.1.3",
"53": "4.2.1",
"54": "4.2.2",
"55": "4.3.1",
"56": "4.3.2",
"57": "4.3.3",
"58": "4.3.4",
"59": "4.4.1",
"60": "4.4.2",
"61": "5.1.1",
"62": "5.1.2",
"63": "5.1.3",
"64": "5.1.4",
"65": "5.1.5",
"66": "5.2.1",
"67": "5.2.2",
"68": "5.2.3",
"69": "5.2.4",
"70": "5.2.5",
"71": "6.1.1",
"72": "6.1.2",
"73": "6.1.3",
"74": "6.1.4",
"75": "6.2.1",
"76": "6.3.1",
"77": "6.3.2",
"78": "6.3.3",
"79": "6.3.4",
"80": "6.3.5",
"81": "6.4.1",
"82": "6.4.2",
"83": "6.4.3",
"84": "6.5.1",
"85": "6.5.2",
"86": "6.5.3",
"87": "6.5.4",
"88": "6.5.5",
"89": "6.5.6",
"90": "6.6.1",
"91": "6.6.2",
"92": "6.6.3",
"93": "6.6.4",
"94": "6.6.5"
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"1.1.1": 0,
"1.1.2": 1,
"1.1.3": 2,
"1.1.4": 3,
"1.1.5": 4,
"1.1.6": 5,
"1.1.7": 6,
"1.2.1": 7,
"1.2.2": 8,
"1.2.3": 9,
"1.2.4": 10,
"1.2.5": 11,
"1.2.6": 12,
"1.2.7": 13,
"1.2.8": 14,
"1.2.9": 15,
"1.3.1": 16,
"1.3.2": 17,
"1.3.3": 18,
"1.4.1": 19,
"1.4.2": 20,
"1.4.3": 21,
"1.4.4": 22,
"1.5.1": 23,
"2.1.1": 24,
"2.1.2": 25,
"2.2.1": 26,
"2.2.2": 27,
"2.3.1": 28,
"2.3.2": 29,
"2.3.3": 30,
"2.3.4": 31,
"2.4.1": 32,
"2.4.2": 33,
"2.4.3": 34,
"2.4.4": 35,
"2.4.5": 36,
"2.5.1": 37,
"2.5.2": 38,
"3.1.1": 39,
"3.1.2": 40,
"3.1.3": 41,
"3.2.1": 42,
"3.2.2": 43,
"3.3.1": 44,
"3.3.2": 45,
"3.3.3": 46,
"3.3.4": 47,
"3.4.1": 48,
"3.4.2": 49,
"4.1.1": 50,
"4.1.2": 51,
"4.1.3": 52,
"4.2.1": 53,
"4.2.2": 54,
"4.3.1": 55,
"4.3.2": 56,
"4.3.3": 57,
"4.3.4": 58,
"4.4.1": 59,
"4.4.2": 60,
"5.1.1": 61,
"5.1.2": 62,
"5.1.3": 63,
"5.1.4": 64,
"5.1.5": 65,
"5.2.1": 66,
"5.2.2": 67,
"5.2.3": 68,
"5.2.4": 69,
"5.2.5": 70,
"6.1.1": 71,
"6.1.2": 72,
"6.1.3": 73,
"6.1.4": 74,
"6.2.1": 75,
"6.3.1": 76,
"6.3.2": 77,
"6.3.3": 78,
"6.3.4": 79,
"6.3.5": 80,
"6.4.1": 81,
"6.4.2": 82,
"6.4.3": 83,
"6.5.1": 84,
"6.5.2": 85,
"6.5.3": 86,
"6.5.4": 87,
"6.5.5": 88,
"6.5.6": 89,
"6.6.1": 90,
"6.6.2": 91,
"6.6.3": 92,
"6.6.4": 93,
"6.6.5": 94
},
"layer_norm_eps": 1e-12,
"max_position_embeddings": 512,
"model_type": "bert",
"num_attention_heads": 12,
"num_hidden_layers": 12,
"pad_token_id": 0,
"pooler_fc_size": 768,
"pooler_num_attention_heads": 12,
"pooler_num_fc_layers": 3,
"pooler_size_per_head": 128,
"pooler_type": "first_token_transform",
"position_embedding_type": "absolute",
"problem_type": "multi_label_classification",
"transformers_version": "4.57.1",
"type_vocab_size": 2,
"use_cache": true,
"vocab_size": 105879
}