Tommert25 committed on
Commit
a86f3b8
·
1 Parent(s): 56fc050

End of training

Browse files
README.md CHANGED
@@ -1,11 +1,8 @@
1
  ---
2
  license: mit
3
- base_model: pdelobelle/robbert-v2-dutch-base
4
  tags:
5
  - generated_from_trainer
6
- metrics:
7
- - recall
8
- - accuracy
9
  model-index:
10
  - name: robbert_1210seed25
11
  results: []
@@ -16,13 +13,17 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # robbert_1210seed25
18
 
19
- This model is a fine-tuned version of [pdelobelle/robbert-v2-dutch-base](https://huggingface.co/pdelobelle/robbert-v2-dutch-base) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.5154
22
- - Precisions: 0.8282
23
- - Recall: 0.8023
24
- - F-measure: 0.8137
25
- - Accuracy: 0.9157
 
 
 
 
26
 
27
  ## Model description
28
 
@@ -49,26 +50,6 @@ The following hyperparameters were used during training:
49
  - lr_scheduler_type: linear
50
  - num_epochs: 14
51
 
52
- ### Training results
53
-
54
- | Training Loss | Epoch | Step | Validation Loss | Precisions | Recall | F-measure | Accuracy |
55
- |:-------------:|:-----:|:----:|:---------------:|:----------:|:------:|:---------:|:--------:|
56
- | 0.6436 | 1.0 | 236 | 0.4323 | 0.8609 | 0.6660 | 0.6824 | 0.8683 |
57
- | 0.3251 | 2.0 | 472 | 0.3626 | 0.8293 | 0.7298 | 0.7496 | 0.8888 |
58
- | 0.204 | 3.0 | 708 | 0.3922 | 0.7666 | 0.7567 | 0.7456 | 0.8987 |
59
- | 0.1274 | 4.0 | 944 | 0.4473 | 0.7811 | 0.7408 | 0.7446 | 0.9018 |
60
- | 0.0876 | 5.0 | 1180 | 0.4216 | 0.7983 | 0.7892 | 0.7924 | 0.9058 |
61
- | 0.0576 | 6.0 | 1416 | 0.5128 | 0.7782 | 0.7547 | 0.7620 | 0.9019 |
62
- | 0.0406 | 7.0 | 1652 | 0.5051 | 0.8195 | 0.7678 | 0.7855 | 0.9123 |
63
- | 0.026 | 8.0 | 1888 | 0.5467 | 0.8202 | 0.7939 | 0.8056 | 0.9106 |
64
- | 0.0206 | 9.0 | 2124 | 0.5154 | 0.8282 | 0.8023 | 0.8137 | 0.9157 |
65
- | 0.0127 | 10.0 | 2360 | 0.5393 | 0.8190 | 0.7845 | 0.7988 | 0.9155 |
66
- | 0.0082 | 11.0 | 2596 | 0.5627 | 0.8145 | 0.7770 | 0.7886 | 0.9155 |
67
- | 0.0062 | 12.0 | 2832 | 0.5912 | 0.8166 | 0.7936 | 0.8036 | 0.9169 |
68
- | 0.0046 | 13.0 | 3068 | 0.5971 | 0.8090 | 0.7926 | 0.7984 | 0.9154 |
69
- | 0.0035 | 14.0 | 3304 | 0.5914 | 0.8135 | 0.7899 | 0.7995 | 0.9166 |
70
-
71
-
72
  ### Framework versions
73
 
74
  - Transformers 4.34.0
 
1
  ---
2
  license: mit
3
+ base_model: Tommert25/robbert_1210seed25
4
  tags:
5
  - generated_from_trainer
 
 
 
6
  model-index:
7
  - name: robbert_1210seed25
8
  results: []
 
13
 
14
  # robbert_1210seed25
15
 
16
+ This model is a fine-tuned version of [Tommert25/robbert_1210seed25](https://huggingface.co/Tommert25/robbert_1210seed25) on an unknown dataset.
17
  It achieves the following results on the evaluation set:
18
+ - eval_loss: 0.3499
19
+ - eval_precisions: 0.8378
20
+ - eval_recall: 0.8190
21
+ - eval_f-measure: 0.8274
22
+ - eval_accuracy: 0.9431
23
+ - eval_runtime: 9.6837
24
+ - eval_samples_per_second: 83.336
25
+ - eval_steps_per_second: 5.267
26
+ - step: 0
27
 
28
  ## Model description
29
 
 
50
  - lr_scheduler_type: linear
51
  - num_epochs: 14
52
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
53
  ### Framework versions
54
 
55
  - Transformers 4.34.0
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "pdelobelle/robbert-v2-dutch-base",
3
  "architectures": [
4
  "RobertaForTokenClassification"
5
  ],
 
1
  {
2
+ "_name_or_path": "Tommert25/robbert_1210seed25",
3
  "architectures": [
4
  "RobertaForTokenClassification"
5
  ],
special_tokens_map.json CHANGED
@@ -1,4 +1,11 @@
1
  {
 
 
 
 
 
 
 
2
  "bos_token": "<s>",
3
  "cls_token": "<s>",
4
  "eos_token": "</s>",
 
1
  {
2
+ "additional_special_tokens": [
3
+ "<s>",
4
+ "<pad>",
5
+ "</s>",
6
+ "<unk>",
7
+ "<mask>"
8
+ ],
9
  "bos_token": "<s>",
10
  "cls_token": "<s>",
11
  "eos_token": "</s>",
tokenizer_config.json CHANGED
@@ -42,17 +42,30 @@
42
  "special": true
43
  }
44
  },
45
- "additional_special_tokens": [],
 
 
 
 
 
 
46
  "bos_token": "<s>",
47
  "clean_up_tokenization_spaces": true,
48
  "cls_token": "<s>",
49
  "eos_token": "</s>",
50
  "errors": "replace",
51
  "mask_token": "<mask>",
 
52
  "model_max_length": 512,
 
53
  "pad_token": "<pad>",
 
 
54
  "sep_token": "</s>",
 
55
  "tokenizer_class": "RobertaTokenizer",
56
  "trim_offsets": true,
 
 
57
  "unk_token": "<unk>"
58
  }
 
42
  "special": true
43
  }
44
  },
45
+ "additional_special_tokens": [
46
+ "<s>",
47
+ "<pad>",
48
+ "</s>",
49
+ "<unk>",
50
+ "<mask>"
51
+ ],
52
  "bos_token": "<s>",
53
  "clean_up_tokenization_spaces": true,
54
  "cls_token": "<s>",
55
  "eos_token": "</s>",
56
  "errors": "replace",
57
  "mask_token": "<mask>",
58
+ "max_length": 512,
59
  "model_max_length": 512,
60
+ "pad_to_multiple_of": null,
61
  "pad_token": "<pad>",
62
+ "pad_token_type_id": 0,
63
+ "padding_side": "right",
64
  "sep_token": "</s>",
65
+ "stride": 0,
66
  "tokenizer_class": "RobertaTokenizer",
67
  "trim_offsets": true,
68
+ "truncation_side": "right",
69
+ "truncation_strategy": "longest_first",
70
  "unk_token": "<unk>"
71
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dcf7c3eca3372981793478235007377cd7eb65146d4cbff2a4de406dbd295d5c
3
  size 4091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:363c6df123cf97ec8546459e9a7e336777c768ef483ab5397906fbef4741f3f5
3
  size 4091