Training in progress, step 500
Browse files
- config.json +4 -4
- model.safetensors +2 -2
- training_args.bin +1 -1
config.json
CHANGED
|
@@ -18,7 +18,7 @@
|
|
| 18 |
"global_rope_theta": 160000.0,
|
| 19 |
"gradient_checkpointing": false,
|
| 20 |
"hidden_activation": "gelu",
|
| 21 |
-
"hidden_size":
|
| 22 |
"id2label": {
|
| 23 |
"0": "LABEL_0",
|
| 24 |
"1": "LABEL_1",
|
|
@@ -174,7 +174,7 @@
|
|
| 174 |
},
|
| 175 |
"initializer_cutoff_factor": 2.0,
|
| 176 |
"initializer_range": 0.02,
|
| 177 |
-
"intermediate_size":
|
| 178 |
"label2id": {
|
| 179 |
"LABEL_0": 0,
|
| 180 |
"LABEL_1": 1,
|
|
@@ -337,8 +337,8 @@
|
|
| 337 |
"model_type": "modernbert",
|
| 338 |
"norm_bias": false,
|
| 339 |
"norm_eps": 1e-05,
|
| 340 |
-
"num_attention_heads":
|
| 341 |
-
"num_hidden_layers":
|
| 342 |
"pad_token_id": 50283,
|
| 343 |
"position_embedding_type": "absolute",
|
| 344 |
"problem_type": "single_label_classification",
|
|
|
|
| 18 |
"global_rope_theta": 160000.0,
|
| 19 |
"gradient_checkpointing": false,
|
| 20 |
"hidden_activation": "gelu",
|
| 21 |
+
"hidden_size": 1024,
|
| 22 |
"id2label": {
|
| 23 |
"0": "LABEL_0",
|
| 24 |
"1": "LABEL_1",
|
|
|
|
| 174 |
},
|
| 175 |
"initializer_cutoff_factor": 2.0,
|
| 176 |
"initializer_range": 0.02,
|
| 177 |
+
"intermediate_size": 2624,
|
| 178 |
"label2id": {
|
| 179 |
"LABEL_0": 0,
|
| 180 |
"LABEL_1": 1,
|
|
|
|
| 337 |
"model_type": "modernbert",
|
| 338 |
"norm_bias": false,
|
| 339 |
"norm_eps": 1e-05,
|
| 340 |
+
"num_attention_heads": 16,
|
| 341 |
+
"num_hidden_layers": 28,
|
| 342 |
"pad_token_id": 50283,
|
| 343 |
"position_embedding_type": "absolute",
|
| 344 |
"problem_type": "single_label_classification",
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:18e59832b1c70607be80679e27ef64d0883c170e2ba5a4e9fc913ad233593833
|
| 3 |
+
size 1583962548
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5713
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae58804986a9c1f0b4fca19d217be86e8661630333ba2d9fad702fd66bba2f7b
|
| 3 |
size 5713
|