Text Classification
Safetensors
English
modernbert
File size: 4,720 Bytes
6f6a301
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
{
  "architectures": [
    "ModernBertForSequenceClassification"
  ],
  "attention_bias": false,
  "attention_dropout": 0.0,
  "bos_token_id": null,
  "causal_mask": false,
  "classifier_activation": "gelu",
  "classifier_bias": false,
  "classifier_dropout": 0.0,
  "classifier_pooling": "mean",
  "cls_token_id": 50281,
  "decoder_bias": true,
  "deterministic_flash_attn": false,
  "dtype": "float32",
  "embedding_dropout": 0.0,
  "eos_token_id": null,
  "global_attn_every_n_layers": 3,
  "global_rope_theta": 160000.0,
  "gradient_checkpointing": false,
  "hidden_activation": "gelu",
  "hidden_size": 384,
  "id2label": {
    "0": "aerospace",
    "1": "agronomy",
    "2": "artistic",
    "3": "astronomy",
    "4": "atmospheric_science",
    "5": "automotive",
    "6": "beauty",
    "7": "biology",
    "8": "celebrity",
    "9": "chemistry",
    "10": "civil_engineering",
    "11": "communication_engineering",
    "12": "computer_science_and_technology",
    "13": "design",
    "14": "drama_and_film",
    "15": "economics",
    "16": "electronic_science",
    "17": "entertainment",
    "18": "environmental_science",
    "19": "fashion",
    "20": "finance",
    "21": "food",
    "22": "gamble",
    "23": "game",
    "24": "geography",
    "25": "health",
    "26": "history",
    "27": "hobby",
    "28": "hydraulic_engineering",
    "29": "instrument_science",
    "30": "journalism_and_media_communication",
    "31": "landscape_architecture",
    "32": "law",
    "33": "library",
    "34": "literature",
    "35": "materials_science",
    "36": "mathematics",
    "37": "mechanical_engineering",
    "38": "medical",
    "39": "mining_engineering",
    "40": "movie",
    "41": "music_and_dance",
    "42": "news",
    "43": "nuclear_science",
    "44": "ocean_science",
    "45": "optical_engineering",
    "46": "painting",
    "47": "pet",
    "48": "petroleum_and_natural_gas_engineering",
    "49": "philosophy",
    "50": "photo",
    "51": "physics",
    "52": "politics",
    "53": "psychology",
    "54": "public_administration",
    "55": "relationship",
    "56": "religion",
    "57": "sociology",
    "58": "sports",
    "59": "statistics",
    "60": "systems_science",
    "61": "textile_science",
    "62": "topicality",
    "63": "transportation_engineering",
    "64": "travel",
    "65": "urban_planning",
    "66": "vulgar_language"
  },
  "initializer_cutoff_factor": 2.0,
  "initializer_range": 0.02,
  "intermediate_size": 576,
  "is_causal": false,
  "label2id": {
    "aerospace": 0,
    "agronomy": 1,
    "artistic": 2,
    "astronomy": 3,
    "atmospheric_science": 4,
    "automotive": 5,
    "beauty": 6,
    "biology": 7,
    "celebrity": 8,
    "chemistry": 9,
    "civil_engineering": 10,
    "communication_engineering": 11,
    "computer_science_and_technology": 12,
    "design": 13,
    "drama_and_film": 14,
    "economics": 15,
    "electronic_science": 16,
    "entertainment": 17,
    "environmental_science": 18,
    "fashion": 19,
    "finance": 20,
    "food": 21,
    "gamble": 22,
    "game": 23,
    "geography": 24,
    "health": 25,
    "history": 26,
    "hobby": 27,
    "hydraulic_engineering": 28,
    "instrument_science": 29,
    "journalism_and_media_communication": 30,
    "landscape_architecture": 31,
    "law": 32,
    "library": 33,
    "literature": 34,
    "materials_science": 35,
    "mathematics": 36,
    "mechanical_engineering": 37,
    "medical": 38,
    "mining_engineering": 39,
    "movie": 40,
    "music_and_dance": 41,
    "news": 42,
    "nuclear_science": 43,
    "ocean_science": 44,
    "optical_engineering": 45,
    "painting": 46,
    "pet": 47,
    "petroleum_and_natural_gas_engineering": 48,
    "philosophy": 49,
    "photo": 50,
    "physics": 51,
    "politics": 52,
    "psychology": 53,
    "public_administration": 54,
    "relationship": 55,
    "religion": 56,
    "sociology": 57,
    "sports": 58,
    "statistics": 59,
    "systems_science": 60,
    "textile_science": 61,
    "topicality": 62,
    "transportation_engineering": 63,
    "travel": 64,
    "urban_planning": 65,
    "vulgar_language": 66
  },
  "layer_norm_eps": 1e-05,
  "local_attention": 128,
  "local_rope_theta": 160000.0,
  "max_position_embeddings": 7999,
  "mlp_bias": false,
  "mlp_dropout": 0.0,
  "model_type": "modernbert",
  "norm_bias": false,
  "norm_eps": 1e-05,
  "num_attention_heads": 6,
  "num_hidden_layers": 10,
  "pad_token_id": 50283,
  "position_embedding_type": "sans_pos",
  "problem_type": "single_label_classification",
  "repad_logits_with_grad": false,
  "sep_token_id": 50282,
  "sparse_pred_ignore_index": -100,
  "sparse_prediction": false,
  "transformers_version": "4.57.6",
  "vocab_size": 50368
}