jnwulff committed on
Commit
637d111
·
verified ·
1 Parent(s): edf7949

Training in progress, step 500

Browse files
Files changed (3) hide show
  1. config.json +4 -4
  2. model.safetensors +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -18,7 +18,7 @@
18
  "global_rope_theta": 160000.0,
19
  "gradient_checkpointing": false,
20
  "hidden_activation": "gelu",
21
- "hidden_size": 768,
22
  "id2label": {
23
  "0": "LABEL_0",
24
  "1": "LABEL_1",
@@ -174,7 +174,7 @@
174
  },
175
  "initializer_cutoff_factor": 2.0,
176
  "initializer_range": 0.02,
177
- "intermediate_size": 1152,
178
  "label2id": {
179
  "LABEL_0": 0,
180
  "LABEL_1": 1,
@@ -337,8 +337,8 @@
337
  "model_type": "modernbert",
338
  "norm_bias": false,
339
  "norm_eps": 1e-05,
340
- "num_attention_heads": 12,
341
- "num_hidden_layers": 22,
342
  "pad_token_id": 50283,
343
  "position_embedding_type": "absolute",
344
  "problem_type": "single_label_classification",
 
18
  "global_rope_theta": 160000.0,
19
  "gradient_checkpointing": false,
20
  "hidden_activation": "gelu",
21
+ "hidden_size": 1024,
22
  "id2label": {
23
  "0": "LABEL_0",
24
  "1": "LABEL_1",
 
174
  },
175
  "initializer_cutoff_factor": 2.0,
176
  "initializer_range": 0.02,
177
+ "intermediate_size": 2624,
178
  "label2id": {
179
  "LABEL_0": 0,
180
  "LABEL_1": 1,
 
337
  "model_type": "modernbert",
338
  "norm_bias": false,
339
  "norm_eps": 1e-05,
340
+ "num_attention_heads": 16,
341
+ "num_hidden_layers": 28,
342
  "pad_token_id": 50283,
343
  "position_embedding_type": "absolute",
344
  "problem_type": "single_label_classification",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c957eba4f99a10527e0109a9fa2d7597a42803103ae7b4cd631d0f23966ad41a
3
- size 598898116
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18e59832b1c70607be80679e27ef64d0883c170e2ba5a4e9fc913ad233593833
3
+ size 1583962548
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ba46382351804384bfb837c33b2895492a910cd05c94f202772010033e16d2f7
3
  size 5713
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae58804986a9c1f0b4fca19d217be86e8661630333ba2d9fad702fd66bba2f7b
3
  size 5713