djsull's picture
djsull/sent_classification
7db1edf verified
{
"architectures": [
"ModernBertForSequenceClassification"
],
"attention_bias": false,
"attention_dropout": 0.0,
"bos_token_id": 0,
"classifier_activation": "gelu",
"classifier_bias": false,
"classifier_dropout": 0.0,
"classifier_pooling": "mean",
"cls_token_id": 0,
"decoder_bias": true,
"deterministic_flash_attn": false,
"dtype": "float32",
"embedding_dropout": 0.0,
"eos_token_id": 1,
"global_attn_every_n_layers": 3,
"global_rope_theta": 160000,
"gradient_checkpointing": false,
"hidden_activation": "gelu",
"hidden_size": 768,
"id2label": {
"0": "\ud575\uc2ec\uc9c8\ubb38",
"1": "\uc11c\ube0c\uc9c8\ubb38",
"2": "\ubc30\uacbd/\uc0c1\ud669",
"3": "\uc2dc\ub3c4/\ud574\ubcf8\uac83",
"4": "\uc624\ub958/\uc99d\uc0c1",
"5": "\ud575\uc2ec\ub2f5\ubcc0/\uacb0\ub860",
"6": "\uc778\uc6a9/\ucc38\uc870",
"7": "\uadfc\uac70/\uc124\uba85",
"8": "\uc808\ucc28/\ubc29\ubc95",
"9": "\uc8fc\uc758/\ud55c\uacc4",
"10": "\ub300\uc548/\ube44\uad50",
"11": "\ucd94\uac00\uc815\ubcf4\uc694\uccad",
"12": "\uc778\uc0ac/\uac10\uc0ac/\uc751\uc6d0",
"13": "\ucd94\ucc9c/\ubcf4\uc0c1\uc720\ub3c4",
"14": "\uc608\uc2dc\ub370\uc774\ud130/\uc99d\ube59",
"15": "\uc758\ubbf8/\ud574\ub2f9\uc0ac\ud56d\uc5c6\uc74c"
},
"initializer_cutoff_factor": 2.0,
"initializer_range": 0.02,
"intermediate_size": 1152,
"label2id": {
"\uadfc\uac70/\uc124\uba85": 7,
"\ub300\uc548/\ube44\uad50": 10,
"\ubc30\uacbd/\uc0c1\ud669": 2,
"\uc11c\ube0c\uc9c8\ubb38": 1,
"\uc2dc\ub3c4/\ud574\ubcf8\uac83": 3,
"\uc608\uc2dc\ub370\uc774\ud130/\uc99d\ube59": 14,
"\uc624\ub958/\uc99d\uc0c1": 4,
"\uc758\ubbf8/\ud574\ub2f9\uc0ac\ud56d\uc5c6\uc74c": 15,
"\uc778\uc0ac/\uac10\uc0ac/\uc751\uc6d0": 12,
"\uc778\uc6a9/\ucc38\uc870": 6,
"\uc808\ucc28/\ubc29\ubc95": 8,
"\uc8fc\uc758/\ud55c\uacc4": 9,
"\ucd94\uac00\uc815\ubcf4\uc694\uccad": 11,
"\ucd94\ucc9c/\ubcf4\uc0c1\uc720\ub3c4": 13,
"\ud575\uc2ec\ub2f5\ubcc0/\uacb0\ub860": 5,
"\ud575\uc2ec\uc9c8\ubb38": 0
},
"layer_norm_eps": 1e-05,
"local_attention": 128,
"local_rope_theta": 10000.0,
"max_position_embeddings": 16384,
"mlp_bias": false,
"mlp_dropout": 0.0,
"model_type": "modernbert",
"norm_bias": false,
"norm_eps": 1e-05,
"num_attention_heads": 12,
"num_hidden_layers": 22,
"pad_token_id": 49999,
"position_embedding_type": "absolute",
"problem_type": "single_label_classification",
"repad_logits_with_grad": false,
"sep_token_id": 1,
"sparse_pred_ignore_index": -100,
"sparse_prediction": false,
"transformers_version": "4.56.1",
"vocab_size": 50000
}