Sigurdur committed on
Commit
e122083
·
verified ·
1 Parent(s): 4163a99

End of training

Browse files
README.md CHANGED
@@ -20,11 +20,11 @@ should probably proofread and complete it, then remove this comment. -->
20
 
21
  This model is a fine-tuned version of [HuggingFaceTB/SmolVLM-Base](https://huggingface.co/HuggingFaceTB/SmolVLM-Base) on an unknown dataset.
22
  It achieves the following results on the evaluation set:
23
- - Loss: 0.0155
24
- - Wer: 0.4048
25
- - Cer: 0.6082
26
  - Exact Match: 0.0
27
- - Special Char Acc: 0.9960
28
  - Seq Acc 5: 0.0
29
  - Seq Acc 10: 0.0
30
 
@@ -60,38 +60,36 @@ The following hyperparameters were used during training:
60
 
61
  | Training Loss | Epoch | Step | Validation Loss | Wer | Cer | Exact Match | Special Char Acc | Seq Acc 5 | Seq Acc 10 |
62
  |:-------------:|:------:|:----:|:---------------:|:------:|:------:|:-----------:|:----------------:|:---------:|:----------:|
63
- | 0.3933 | 0.0311 | 125 | 0.2240 | 1.1229 | 1.2210 | 0.0 | 0.9518 | 0.0 | 0.0 |
64
- | 0.1975 | 0.0622 | 250 | 0.1529 | 1.0361 | 1.2207 | 0.0 | 0.9719 | 0.0 | 0.0 |
65
- | 0.1483 | 0.0934 | 375 | 0.1266 | 0.9373 | 1.0345 | 0.0 | 0.9639 | 0.0 | 0.0 |
66
- | 0.1336 | 0.1245 | 500 | 0.1059 | 0.8145 | 0.9270 | 0.0 | 0.9839 | 0.0 | 0.0 |
67
- | 0.1171 | 0.1556 | 625 | 0.0915 | 1.0964 | 1.2152 | 0.0 | 0.9920 | 0.0 | 0.0 |
68
- | 0.0949 | 0.1867 | 750 | 0.0667 | 0.6193 | 0.7423 | 0.0 | 1.0 | 0.0 | 0.0 |
69
- | 0.093 | 0.2179 | 875 | 0.0731 | 0.5663 | 0.7168 | 0.0 | 0.9799 | 0.0 | 0.0 |
70
- | 0.0606 | 0.2490 | 1000 | 0.0569 | 0.5904 | 0.8103 | 0.0 | 0.9759 | 0.0 | 0.0 |
71
- | 0.0807 | 0.2801 | 1125 | 0.0514 | 0.3976 | 0.6064 | 0.0 | 0.9880 | 0.0 | 0.0 |
72
- | 0.0678 | 0.3112 | 1250 | 0.0465 | 0.4169 | 0.6449 | 0.0 | 0.9880 | 0.0 | 0.0 |
73
- | 0.0565 | 0.3424 | 1375 | 0.0447 | 0.4193 | 0.6337 | 0.0 | 1.0 | 0.0 | 0.0 |
74
- | 0.0699 | 0.3735 | 1500 | 0.0322 | 0.4337 | 0.5685 | 0.0 | 0.9960 | 0.0 | 0.0 |
75
- | 0.0604 | 0.4046 | 1625 | 0.0292 | 0.5205 | 0.6545 | 0.0 | 1.0 | 0.0 | 0.0 |
76
- | 0.067 | 0.4357 | 1750 | 0.0410 | 0.5133 | 0.5864 | 0.0 | 0.9920 | 0.0 | 0.0 |
77
- | 0.0501 | 0.4669 | 1875 | 0.0281 | 0.5831 | 0.6838 | 0.0 | 0.9920 | 0.0 | 0.0 |
78
- | 0.053 | 0.4980 | 2000 | 0.0258 | 0.3422 | 0.5311 | 0.0 | 1.0 | 0.0 | 0.0 |
79
- | 0.0492 | 0.5291 | 2125 | 0.0318 | 0.5181 | 0.6727 | 0.0 | 0.9880 | 0.0 | 0.0 |
80
- | 0.0581 | 0.5602 | 2250 | 0.0222 | 0.4747 | 0.6006 | 0.0 | 0.9960 | 0.0 | 0.0 |
81
- | 0.0492 | 0.5913 | 2375 | 0.0206 | 0.5566 | 0.6513 | 0.0 | 0.9920 | 0.0 | 0.0 |
82
- | 0.045 | 0.6225 | 2500 | 0.0203 | 0.6699 | 0.8413 | 0.0 | 0.9920 | 0.0 | 0.0 |
83
- | 0.0449 | 0.6536 | 2625 | 0.0185 | 0.5542 | 0.7837 | 0.0 | 0.9960 | 0.0 | 0.0 |
84
- | 0.0397 | 0.6847 | 2750 | 0.0161 | 0.4747 | 0.6545 | 0.0 | 0.9960 | 0.0 | 0.0 |
85
- | 0.044 | 0.7158 | 2875 | 0.0172 | 0.5614 | 0.6948 | 0.0 | 0.9920 | 0.0 | 0.0 |
86
- | 0.0352 | 0.7470 | 3000 | 0.0175 | 0.4193 | 0.5807 | 0.0 | 0.9960 | 0.0 | 0.0 |
87
- | 0.0441 | 0.7781 | 3125 | 0.0140 | 0.4096 | 0.6386 | 0.0 | 0.9960 | 0.0 | 0.0 |
88
- | 0.0339 | 0.8092 | 3250 | 0.0141 | 0.3928 | 0.5818 | 0.0 | 1.0 | 0.0 | 0.0 |
89
- | 0.0429 | 0.8403 | 3375 | 0.0176 | 0.4410 | 0.6079 | 0.0 | 1.0 | 0.0 | 0.0 |
90
- | 0.0385 | 0.8715 | 3500 | 0.0169 | 0.4048 | 0.5870 | 0.0 | 0.9960 | 0.0 | 0.0 |
91
- | 0.0417 | 0.9026 | 3625 | 0.0172 | 0.4241 | 0.6111 | 0.0 | 0.9960 | 0.0 | 0.0 |
92
- | 0.0502 | 0.9337 | 3750 | 0.0162 | 0.4145 | 0.6160 | 0.0 | 0.9960 | 0.0 | 0.0 |
93
- | 0.0316 | 0.9648 | 3875 | 0.0157 | 0.4289 | 0.6215 | 0.0 | 0.9960 | 0.0 | 0.0 |
94
- | 0.0468 | 0.9960 | 4000 | 0.0155 | 0.4048 | 0.6082 | 0.0 | 0.9960 | 0.0 | 0.0 |
95
 
96
 
97
  ### Framework versions
 
20
 
21
  This model is a fine-tuned version of [HuggingFaceTB/SmolVLM-Base](https://huggingface.co/HuggingFaceTB/SmolVLM-Base) on an unknown dataset.
22
  It achieves the following results on the evaluation set:
23
+ - Loss: 0.0147
24
+ - Wer: 0.2907
25
+ - Cer: 0.5314
26
  - Exact Match: 0.0
27
+ - Special Char Acc: 1.0
28
  - Seq Acc 5: 0.0
29
  - Seq Acc 10: 0.0
30
 
 
60
 
61
  | Training Loss | Epoch | Step | Validation Loss | Wer | Cer | Exact Match | Special Char Acc | Seq Acc 5 | Seq Acc 10 |
62
  |:-------------:|:------:|:----:|:---------------:|:------:|:------:|:-----------:|:----------------:|:---------:|:----------:|
63
+ | 0.3666 | 0.0325 | 125 | 0.2243 | 0.8704 | 0.8629 | 0.0 | 0.9622 | 0.0 | 0.0 |
64
+ | 0.168 | 0.0649 | 250 | 0.1485 | 0.7556 | 0.9306 | 0.0 | 0.9680 | 0.0 | 0.0 |
65
+ | 0.1282 | 0.0974 | 375 | 0.1187 | 0.4481 | 0.6394 | 0.0 | 0.9797 | 0.0 | 0.0 |
66
+ | 0.0984 | 0.1299 | 500 | 0.0965 | 0.5056 | 0.7014 | 0.0 | 0.9826 | 0.0 | 0.0 |
67
+ | 0.0891 | 0.1624 | 625 | 0.0755 | 0.4611 | 0.6485 | 0.0 | 0.9913 | 0.0 | 0.0 |
68
+ | 0.0744 | 0.1948 | 750 | 0.0638 | 0.4963 | 0.7116 | 0.0 | 0.9913 | 0.0 | 0.0 |
69
+ | 0.0708 | 0.2273 | 875 | 0.0518 | 0.3944 | 0.5805 | 0.0 | 0.9942 | 0.0 | 0.0 |
70
+ | 0.0647 | 0.2598 | 1000 | 0.0611 | 0.5389 | 0.8122 | 0.0 | 0.9855 | 0.0 | 0.0 |
71
+ | 0.0572 | 0.2922 | 1125 | 0.0454 | 0.4796 | 0.7158 | 0.0 | 0.9913 | 0.0 | 0.0 |
72
+ | 0.0555 | 0.3247 | 1250 | 0.0320 | 0.5685 | 0.7432 | 0.0 | 0.9884 | 0.0 | 0.0 |
73
+ | 0.0445 | 0.3572 | 1375 | 0.0386 | 0.4611 | 0.6404 | 0.0 | 0.9971 | 0.0 | 0.0 |
74
+ | 0.0455 | 0.3897 | 1500 | 0.0392 | 0.4259 | 0.6783 | 0.0 | 0.9913 | 0.0 | 0.0 |
75
+ | 0.0469 | 0.4221 | 1625 | 0.0319 | 0.2944 | 0.6415 | 0.0 | 0.9971 | 0.0 | 0.0 |
76
+ | 0.0386 | 0.4546 | 1750 | 0.0305 | 0.3574 | 0.5656 | 0.0 | 0.9971 | 0.0 | 0.0 |
77
+ | 0.0393 | 0.4871 | 1875 | 0.0327 | 0.2889 | 0.5405 | 0.0 | 0.9971 | 0.0 | 0.0 |
78
+ | 0.0364 | 0.5195 | 2000 | 0.0254 | 0.2685 | 0.4360 | 0.0 | 0.9971 | 0.0 | 0.0 |
79
+ | 0.0338 | 0.5520 | 2125 | 0.0254 | 0.2556 | 0.4616 | 0.0 | 1.0 | 0.0 | 0.0 |
80
+ | 0.0332 | 0.5845 | 2250 | 0.0217 | 0.3111 | 0.5105 | 0.0 | 1.0 | 0.0 | 0.0 |
81
+ | 0.0285 | 0.6170 | 2375 | 0.0257 | 0.3167 | 0.4898 | 0.0 | 1.0 | 0.0 | 0.0 |
82
+ | 0.0291 | 0.6494 | 2500 | 0.0230 | 0.4481 | 0.6054 | 0.0 | 1.0 | 0.0 | 0.0 |
83
+ | 0.028 | 0.6819 | 2625 | 0.0204 | 0.3741 | 0.5687 | 0.0 | 1.0 | 0.0 | 0.0 |
84
+ | 0.024 | 0.7144 | 2750 | 0.0204 | 0.3352 | 0.5242 | 0.0 | 0.9971 | 0.0 | 0.0 |
85
+ | 0.0262 | 0.7469 | 2875 | 0.0170 | 0.3796 | 0.6020 | 0.0 | 1.0 | 0.0 | 0.0 |
86
+ | 0.0237 | 0.7793 | 3000 | 0.0155 | 0.4222 | 0.6574 | 0.0 | 1.0 | 0.0 | 0.0 |
87
+ | 0.0246 | 0.8118 | 3125 | 0.0164 | 0.2796 | 0.5151 | 0.0 | 1.0 | 0.0 | 0.0 |
88
+ | 0.023 | 0.8443 | 3250 | 0.0152 | 0.2815 | 0.5054 | 0.0 | 1.0 | 0.0 | 0.0 |
89
+ | 0.0225 | 0.8767 | 3375 | 0.0150 | 0.2722 | 0.5151 | 0.0 | 1.0 | 0.0 | 0.0 |
90
+ | 0.0216 | 0.9092 | 3500 | 0.0153 | 0.2815 | 0.5268 | 0.0 | 1.0 | 0.0 | 0.0 |
91
+ | 0.0213 | 0.9417 | 3625 | 0.0149 | 0.2852 | 0.5300 | 0.0 | 1.0 | 0.0 | 0.0 |
92
+ | 0.0204 | 0.9742 | 3750 | 0.0147 | 0.2907 | 0.5314 | 0.0 | 1.0 | 0.0 | 0.0 |
 
 
93
 
94
 
95
  ### Framework versions
adapter_config.json CHANGED
@@ -32,13 +32,13 @@
32
  "rank_pattern": {},
33
  "revision": null,
34
  "target_modules": [
35
- "o_proj",
36
  "gate_proj",
37
- "q_proj",
38
- "v_proj",
39
  "k_proj",
 
 
40
  "up_proj",
41
- "down_proj"
 
42
  ],
43
  "target_parameters": null,
44
  "task_type": null,
 
32
  "rank_pattern": {},
33
  "revision": null,
34
  "target_modules": [
 
35
  "gate_proj",
 
 
36
  "k_proj",
37
+ "q_proj",
38
+ "down_proj",
39
  "up_proj",
40
+ "o_proj",
41
+ "v_proj"
42
  ],
43
  "target_parameters": null,
44
  "task_type": null,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c54d944b2f8437b53612475c94941be19613e26719d1e31fe38debfc68fab139
3
  size 171632952
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecab74e6150490ab327892d71ed95b6600f94266acab895b9a913d5210e34274
3
  size 171632952
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e248332cffe5198a42939ead4ae1098f87a6d73e0c66a7d20cd5060a98ed55a4
3
  size 5905
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72bc9907735bfabf18439e4361fc77643bf78409793ddc5135be6825c9c479b5
3
  size 5905