oleg-potichnyi
/

ModernBERT-code-classifier

Model card Files Files and versions

ModernBERT-code-classifier / config.json

oleg-potichnyi's picture

Training in progress, epoch 1

4811d64 verified 7 months ago

history blame contribute delete

2.81 kB

	{
	"architectures": [
	"ModernBertForSequenceClassification"
	],
	"attention_bias": false,
	"attention_dropout": 0.0,
	"bos_token_id": 50281,
	"classifier_activation": "gelu",
	"classifier_bias": false,
	"classifier_dropout": 0.0,
	"classifier_pooling": "mean",
	"cls_token_id": 50281,
	"decoder_bias": true,
	"deterministic_flash_attn": false,
	"embedding_dropout": 0.0,
	"eos_token_id": 50282,
	"global_attn_every_n_layers": 3,
	"global_rope_theta": 160000.0,
	"gradient_checkpointing": false,
	"hidden_activation": "gelu",
	"hidden_size": 768,
	"id2label": {
	"0": 0,
	"1": 1,
	"10": 10,
	"11": 11,
	"12": 12,
	"13": 13,
	"14": 14,
	"15": 15,
	"16": 16,
	"17": 17,
	"18": 18,
	"19": 19,
	"2": 2,
	"20": 20,
	"21": 21,
	"22": 22,
	"23": 23,
	"24": 24,
	"25": 25,
	"26": 26,
	"27": 27,
	"28": 28,
	"29": 29,
	"3": 3,
	"30": 30,
	"31": 31,
	"32": 32,
	"33": 33,
	"34": 34,
	"35": 35,
	"36": 36,
	"37": 37,
	"38": 38,
	"39": 39,
	"4": 4,
	"40": 40,
	"41": 41,
	"42": 42,
	"43": 43,
	"44": 44,
	"45": 45,
	"46": 46,
	"47": 47,
	"48": 48,
	"49": 49,
	"5": 5,
	"50": 50,
	"6": 6,
	"7": 7,
	"8": 8,
	"9": 9
	},
	"initializer_cutoff_factor": 2.0,
	"initializer_range": 0.02,
	"intermediate_size": 1152,
	"label2id": {
	"0": 0,
	"1": 1,
	"2": 2,
	"3": 3,
	"4": 4,
	"5": 5,
	"6": 6,
	"7": 7,
	"8": 8,
	"9": 9,
	"10": 10,
	"11": 11,
	"12": 12,
	"13": 13,
	"14": 14,
	"15": 15,
	"16": 16,
	"17": 17,
	"18": 18,
	"19": 19,
	"20": 20,
	"21": 21,
	"22": 22,
	"23": 23,
	"24": 24,
	"25": 25,
	"26": 26,
	"27": 27,
	"28": 28,
	"29": 29,
	"30": 30,
	"31": 31,
	"32": 32,
	"33": 33,
	"34": 34,
	"35": 35,
	"36": 36,
	"37": 37,
	"38": 38,
	"39": 39,
	"40": 40,
	"41": 41,
	"42": 42,
	"43": 43,
	"44": 44,
	"45": 45,
	"46": 46,
	"47": 47,
	"48": 48,
	"49": 49,
	"50": 50
	},
	"layer_norm_eps": 1e-05,
	"local_attention": 128,
	"local_rope_theta": 10000.0,
	"max_position_embeddings": 8192,
	"mlp_bias": false,
	"mlp_dropout": 0.0,
	"model_type": "modernbert",
	"norm_bias": false,
	"norm_eps": 1e-05,
	"num_attention_heads": 12,
	"num_hidden_layers": 22,
	"pad_token_id": 50283,
	"position_embedding_type": "absolute",
	"problem_type": "single_label_classification",
	"repad_logits_with_grad": false,
	"sep_token_id": 50282,
	"sparse_pred_ignore_index": -100,
	"sparse_prediction": false,
	"torch_dtype": "float32",
	"transformers_version": "4.55.2",
	"vocab_size": 50368
	}