Training in progress, epoch 1
Browse files- config.json +57 -57
- model.safetensors +2 -2
- tokenizer.json +9 -0
- tokenizer_config.json +8 -0
- training_args.bin +1 -1
config.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
"_name_or_path": "answerdotai/ModernBERT-base",
|
| 3 |
"architectures": [
|
| 4 |
-
"
|
| 5 |
],
|
| 6 |
"attention_bias": false,
|
| 7 |
"attention_dropout": 0.0,
|
|
@@ -21,34 +21,34 @@
|
|
| 21 |
"hidden_activation": "gelu",
|
| 22 |
"hidden_size": 768,
|
| 23 |
"id2label": {
|
| 24 |
-
"B-address":
|
| 25 |
-
"B-certificate":
|
| 26 |
-
"B-date":
|
| 27 |
-
"B-degree":
|
| 28 |
-
"B-duration":
|
| 29 |
-
"B-email":
|
| 30 |
-
"B-individual_skill":
|
| 31 |
-
"B-job_role":
|
| 32 |
-
"B-language":
|
| 33 |
-
"B-location":
|
| 34 |
-
"B-name":
|
| 35 |
-
"B-organization":
|
| 36 |
-
"B-phone_number":
|
| 37 |
-
"I-address":
|
| 38 |
-
"I-certificate":
|
| 39 |
-
"I-date":
|
| 40 |
-
"I-degree":
|
| 41 |
-
"I-duration":
|
| 42 |
-
"I-email":
|
| 43 |
-
"I-individual_skill":
|
| 44 |
-
"I-job_role":
|
| 45 |
-
"I-language":
|
| 46 |
-
"I-location":
|
| 47 |
-
"I-name":
|
| 48 |
-
"I-organization":
|
| 49 |
-
"I-phone_number":
|
| 50 |
"O": 0,
|
| 51 |
-
"O-section":
|
| 52 |
"education_description": 33,
|
| 53 |
"education_information": 32,
|
| 54 |
"employment_description": 31,
|
|
@@ -60,34 +60,34 @@
|
|
| 60 |
"initializer_range": 0.02,
|
| 61 |
"intermediate_size": 1152,
|
| 62 |
"label2id": {
|
| 63 |
-
"B-address":
|
| 64 |
-
"B-certificate":
|
| 65 |
-
"B-date":
|
| 66 |
-
"B-degree":
|
| 67 |
-
"B-duration":
|
| 68 |
-
"B-email":
|
| 69 |
-
"B-individual_skill":
|
| 70 |
-
"B-job_role":
|
| 71 |
-
"B-language":
|
| 72 |
-
"B-location":
|
| 73 |
-
"B-name":
|
| 74 |
-
"B-organization":
|
| 75 |
-
"B-phone_number":
|
| 76 |
-
"I-address":
|
| 77 |
-
"I-certificate":
|
| 78 |
-
"I-date":
|
| 79 |
-
"I-degree":
|
| 80 |
-
"I-duration":
|
| 81 |
-
"I-email":
|
| 82 |
-
"I-individual_skill":
|
| 83 |
-
"I-job_role":
|
| 84 |
-
"I-language":
|
| 85 |
-
"I-location":
|
| 86 |
-
"I-name":
|
| 87 |
-
"I-organization":
|
| 88 |
-
"I-phone_number":
|
| 89 |
"O": 0,
|
| 90 |
-
"O-section":
|
| 91 |
"education_description": 33,
|
| 92 |
"education_information": 32,
|
| 93 |
"employment_description": 31,
|
|
@@ -108,12 +108,12 @@
|
|
| 108 |
"num_hidden_layers": 22,
|
| 109 |
"pad_token_id": 50283,
|
| 110 |
"position_embedding_type": "absolute",
|
| 111 |
-
"reference_compile":
|
| 112 |
"repad_logits_with_grad": false,
|
| 113 |
"sep_token_id": 50282,
|
| 114 |
"sparse_pred_ignore_index": -100,
|
| 115 |
"sparse_prediction": false,
|
| 116 |
"torch_dtype": "float32",
|
| 117 |
"transformers_version": "4.49.0",
|
| 118 |
-
"vocab_size":
|
| 119 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"_name_or_path": "answerdotai/ModernBERT-base",
|
| 3 |
"architectures": [
|
| 4 |
+
"DualModernBertForTokenClassification"
|
| 5 |
],
|
| 6 |
"attention_bias": false,
|
| 7 |
"attention_dropout": 0.0,
|
|
|
|
| 21 |
"hidden_activation": "gelu",
|
| 22 |
"hidden_size": 768,
|
| 23 |
"id2label": {
|
| 24 |
+
"B-address": 3,
|
| 25 |
+
"B-certificate": 23,
|
| 26 |
+
"B-date": 13,
|
| 27 |
+
"B-degree": 21,
|
| 28 |
+
"B-duration": 15,
|
| 29 |
+
"B-email": 5,
|
| 30 |
+
"B-individual_skill": 25,
|
| 31 |
+
"B-job_role": 19,
|
| 32 |
+
"B-language": 9,
|
| 33 |
+
"B-location": 11,
|
| 34 |
+
"B-name": 1,
|
| 35 |
+
"B-organization": 17,
|
| 36 |
+
"B-phone_number": 7,
|
| 37 |
+
"I-address": 4,
|
| 38 |
+
"I-certificate": 24,
|
| 39 |
+
"I-date": 14,
|
| 40 |
+
"I-degree": 22,
|
| 41 |
+
"I-duration": 16,
|
| 42 |
+
"I-email": 6,
|
| 43 |
+
"I-individual_skill": 26,
|
| 44 |
+
"I-job_role": 20,
|
| 45 |
+
"I-language": 10,
|
| 46 |
+
"I-location": 12,
|
| 47 |
+
"I-name": 2,
|
| 48 |
+
"I-organization": 18,
|
| 49 |
+
"I-phone_number": 8,
|
| 50 |
"O": 0,
|
| 51 |
+
"O-section": 27,
|
| 52 |
"education_description": 33,
|
| 53 |
"education_information": 32,
|
| 54 |
"employment_description": 31,
|
|
|
|
| 60 |
"initializer_range": 0.02,
|
| 61 |
"intermediate_size": 1152,
|
| 62 |
"label2id": {
|
| 63 |
+
"B-address": 3,
|
| 64 |
+
"B-certificate": 23,
|
| 65 |
+
"B-date": 13,
|
| 66 |
+
"B-degree": 21,
|
| 67 |
+
"B-duration": 15,
|
| 68 |
+
"B-email": 5,
|
| 69 |
+
"B-individual_skill": 25,
|
| 70 |
+
"B-job_role": 19,
|
| 71 |
+
"B-language": 9,
|
| 72 |
+
"B-location": 11,
|
| 73 |
+
"B-name": 1,
|
| 74 |
+
"B-organization": 17,
|
| 75 |
+
"B-phone_number": 7,
|
| 76 |
+
"I-address": 4,
|
| 77 |
+
"I-certificate": 24,
|
| 78 |
+
"I-date": 14,
|
| 79 |
+
"I-degree": 22,
|
| 80 |
+
"I-duration": 16,
|
| 81 |
+
"I-email": 6,
|
| 82 |
+
"I-individual_skill": 26,
|
| 83 |
+
"I-job_role": 20,
|
| 84 |
+
"I-language": 10,
|
| 85 |
+
"I-location": 12,
|
| 86 |
+
"I-name": 2,
|
| 87 |
+
"I-organization": 18,
|
| 88 |
+
"I-phone_number": 8,
|
| 89 |
"O": 0,
|
| 90 |
+
"O-section": 27,
|
| 91 |
"education_description": 33,
|
| 92 |
"education_information": 32,
|
| 93 |
"employment_description": 31,
|
|
|
|
| 108 |
"num_hidden_layers": 22,
|
| 109 |
"pad_token_id": 50283,
|
| 110 |
"position_embedding_type": "absolute",
|
| 111 |
+
"reference_compile": false,
|
| 112 |
"repad_logits_with_grad": false,
|
| 113 |
"sep_token_id": 50282,
|
| 114 |
"sparse_pred_ignore_index": -100,
|
| 115 |
"sparse_prediction": false,
|
| 116 |
"torch_dtype": "float32",
|
| 117 |
"transformers_version": "4.49.0",
|
| 118 |
+
"vocab_size": 50369
|
| 119 |
}
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:66635a1f764636bd9920b9e811936d4c59f7682d68ef81acac1d60d10a2c5855
|
| 3 |
+
size 598541296
|
tokenizer.json
CHANGED
|
@@ -1051,6 +1051,15 @@
|
|
| 1051 |
"rstrip": false,
|
| 1052 |
"normalized": true,
|
| 1053 |
"special": false
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1054 |
}
|
| 1055 |
],
|
| 1056 |
"normalizer": {
|
|
|
|
| 1051 |
"rstrip": false,
|
| 1052 |
"normalized": true,
|
| 1053 |
"special": false
|
| 1054 |
+
},
|
| 1055 |
+
{
|
| 1056 |
+
"id": 50368,
|
| 1057 |
+
"content": "[SECTION]",
|
| 1058 |
+
"single_word": false,
|
| 1059 |
+
"lstrip": false,
|
| 1060 |
+
"rstrip": false,
|
| 1061 |
+
"normalized": true,
|
| 1062 |
+
"special": false
|
| 1063 |
}
|
| 1064 |
],
|
| 1065 |
"normalizer": {
|
tokenizer_config.json
CHANGED
|
@@ -927,6 +927,14 @@
|
|
| 927 |
"rstrip": false,
|
| 928 |
"single_word": false,
|
| 929 |
"special": false
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 930 |
}
|
| 931 |
},
|
| 932 |
"clean_up_tokenization_spaces": true,
|
|
|
|
| 927 |
"rstrip": false,
|
| 928 |
"single_word": false,
|
| 929 |
"special": false
|
| 930 |
+
},
|
| 931 |
+
"50368": {
|
| 932 |
+
"content": "[SECTION]",
|
| 933 |
+
"lstrip": false,
|
| 934 |
+
"normalized": true,
|
| 935 |
+
"rstrip": false,
|
| 936 |
+
"single_word": false,
|
| 937 |
+
"special": false
|
| 938 |
}
|
| 939 |
},
|
| 940 |
"clean_up_tokenization_spaces": true,
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5304
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:44b8732a07251e11935ffb1a06a24458ae0ee2a86b015a29f0fce4c8356e4570
|
| 3 |
size 5304
|