maradsky committed on
Commit
52a75d9
·
verified ·
1 Parent(s): 6e859df

Training in progress, epoch 1

Browse files
Files changed (3) hide show
  1. config.json +4 -4
  2. model.safetensors +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -19,7 +19,7 @@
19
  "global_rope_theta": 160000.0,
20
  "gradient_checkpointing": false,
21
  "hidden_activation": "gelu",
22
- "hidden_size": 1024,
23
  "id2label": {
24
  "0": "LABEL_0",
25
  "1": "LABEL_1",
@@ -29,7 +29,7 @@
29
  },
30
  "initializer_cutoff_factor": 2.0,
31
  "initializer_range": 0.02,
32
- "intermediate_size": 2624,
33
  "label2id": {
34
  "LABEL_0": 0,
35
  "LABEL_1": 1,
@@ -46,8 +46,8 @@
46
  "model_type": "modernbert",
47
  "norm_bias": false,
48
  "norm_eps": 1e-05,
49
- "num_attention_heads": 16,
50
- "num_hidden_layers": 28,
51
  "pad_token_id": 50283,
52
  "position_embedding_type": "absolute",
53
  "repad_logits_with_grad": false,
 
19
  "global_rope_theta": 160000.0,
20
  "gradient_checkpointing": false,
21
  "hidden_activation": "gelu",
22
+ "hidden_size": 768,
23
  "id2label": {
24
  "0": "LABEL_0",
25
  "1": "LABEL_1",
 
29
  },
30
  "initializer_cutoff_factor": 2.0,
31
  "initializer_range": 0.02,
32
+ "intermediate_size": 1152,
33
  "label2id": {
34
  "LABEL_0": 0,
35
  "LABEL_1": 1,
 
46
  "model_type": "modernbert",
47
  "norm_bias": false,
48
  "norm_eps": 1e-05,
49
+ "num_attention_heads": 12,
50
+ "num_hidden_layers": 22,
51
  "pad_token_id": 50283,
52
  "position_embedding_type": "absolute",
53
  "repad_logits_with_grad": false,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14ca347646dcc9c9a9ebadae157e9ef721b5522a1bf3e3c9d2349655ce8cae54
3
- size 1583363940
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72b06aaa781b46eea9666e986770d2b116d30b075a79bca3408a480f37a1036b
3
+ size 598449012
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3359fa1fc4e53c0ded3f111e8b863fe1d2fb1f29ee401122c3df41ecff0414af
3
  size 5496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03f9a050303d280a540f94358ebb062837b15b5fde58ac6fbb161d9fd0901003
3
  size 5496