{ "_name_or_path": "bert-base-cased-skill-mlm", "architectures": [ "BertForTokenClassification" ], "attention_probs_dropout_prob": 0.1, "classifier_dropout": null, "gradient_checkpointing": false, "hidden_act": "gelu", "hidden_dropout_prob": 0.1, "hidden_size": 768, "id2label": { "0": "B-19", "1": "I-7", "2": "B-0", "3": "I-20", "4": "I-10", "5": "B-2", "6": "I-14", "7": "I-19", "8": "B-12", "9": "B-11", "10": "I-17", "11": "I-11", "12": "B-15", "13": "B-5", "14": "B-4", "15": "B-17", "16": "B-16", "17": "B-1", "18": "I-3", "19": "B-10", "20": "I-16", "21": "I-18", "22": "I-0", "23": "B-20", "24": "B-6", "25": "I-1", "26": "B-9", "27": "I-9", "28": "O", "29": "I-6", "30": "I-5", "31": "I-12", "32": "B-3", "33": "B-13", "34": "B-8", "35": "I-13", "36": "I-4", "37": "I-15", "38": "B-18", "39": "B-7", "40": "B-14", "41": "I-2", "42": "I-8" }, "initializer_range": 0.02, "intermediate_size": 3072, "label2id": { "B-0": 2, "B-1": 17, "B-10": 19, "B-11": 9, "B-12": 8, "B-13": 33, "B-14": 40, "B-15": 12, "B-16": 16, "B-17": 15, "B-18": 38, "B-19": 0, "B-2": 5, "B-20": 23, "B-3": 32, "B-4": 14, "B-5": 13, "B-6": 24, "B-7": 39, "B-8": 34, "B-9": 26, "I-0": 22, "I-1": 25, "I-10": 4, "I-11": 11, "I-12": 31, "I-13": 35, "I-14": 6, "I-15": 37, "I-16": 20, "I-17": 10, "I-18": 21, "I-19": 7, "I-2": 41, "I-20": 3, "I-3": 18, "I-4": 36, "I-5": 30, "I-6": 29, "I-7": 1, "I-8": 42, "I-9": 27, "O": 28 }, "layer_norm_eps": 1e-12, "max_position_embeddings": 512, "model_type": "bert", "num_attention_heads": 12, "num_hidden_layers": 12, "pad_token_id": 0, "position_embedding_type": "absolute", "torch_dtype": "float32", "transformers_version": "4.16.2", "type_vocab_size": 2, "use_cache": true, "vocab_size": 28996 }