monsimas committed on
Commit
305aeb6
·
verified ·
1 Parent(s): c91026c

Upload ModernBertForSequenceClassification

Browse files
Files changed (2) hide show
  1. config.json +4 -4
  2. model.safetensors +2 -2
config.json CHANGED
@@ -18,14 +18,14 @@
18
  "global_rope_theta": 160000.0,
19
  "gradient_checkpointing": false,
20
  "hidden_activation": "gelu",
21
- "hidden_size": 1024,
22
  "id2label": {
23
  "0": "Small language model",
24
  "1": "Large language model"
25
  },
26
  "initializer_cutoff_factor": 2.0,
27
  "initializer_range": 0.02,
28
- "intermediate_size": 2624,
29
  "label2id": {
30
  "Large language model": 1,
31
  "Small language model": 0
@@ -39,8 +39,8 @@
39
  "model_type": "modernbert",
40
  "norm_bias": false,
41
  "norm_eps": 1e-05,
42
- "num_attention_heads": 16,
43
- "num_hidden_layers": 28,
44
  "pad_token_id": 50283,
45
  "position_embedding_type": "absolute",
46
  "problem_type": "single_label_classification",
 
18
  "global_rope_theta": 160000.0,
19
  "gradient_checkpointing": false,
20
  "hidden_activation": "gelu",
21
+ "hidden_size": 768,
22
  "id2label": {
23
  "0": "Small language model",
24
  "1": "Large language model"
25
  },
26
  "initializer_cutoff_factor": 2.0,
27
  "initializer_range": 0.02,
28
+ "intermediate_size": 1152,
29
  "label2id": {
30
  "Large language model": 1,
31
  "Small language model": 0
 
39
  "model_type": "modernbert",
40
  "norm_bias": false,
41
  "norm_eps": 1e-05,
42
+ "num_attention_heads": 12,
43
+ "num_hidden_layers": 22,
44
  "pad_token_id": 50283,
45
  "position_embedding_type": "absolute",
46
  "problem_type": "single_label_classification",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e849b8fb6f7844463a8547ca6dd9e31d4f132efc476e7ee0aecfa9fc3b041de8
3
- size 1583351632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb8b1142606b7031866f836c2452cf9638f689fed4bbf60ba5fddfcc6e39bea5
3
+ size 598439784