Hartunka committed on
Commit
57d013a
·
verified ·
1 Parent(s): a82a02c

End of training

Browse files
README.md CHANGED
@@ -1,14 +1,32 @@
1
  ---
2
  library_name: transformers
 
 
3
  base_model: Hartunka/bert_base_km_20_v2
4
  tags:
5
  - generated_from_trainer
 
 
6
  metrics:
7
  - accuracy
8
  - f1
9
  model-index:
10
  - name: bert_base_km_20_v2_mrpc
11
- results: []
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  ---
13
 
14
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -16,12 +34,12 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # bert_base_km_20_v2_mrpc
18
 
19
- This model is a fine-tuned version of [Hartunka/bert_base_km_20_v2](https://huggingface.co/Hartunka/bert_base_km_20_v2) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 1.2587
22
- - Accuracy: 0.6863
23
- - F1: 0.7793
24
- - Combined Score: 0.7328
25
 
26
  ## Model description
27
 
 
1
  ---
2
  library_name: transformers
3
+ language:
4
+ - en
5
  base_model: Hartunka/bert_base_km_20_v2
6
  tags:
7
  - generated_from_trainer
8
+ datasets:
9
+ - glue
10
  metrics:
11
  - accuracy
12
  - f1
13
  model-index:
14
  - name: bert_base_km_20_v2_mrpc
15
+ results:
16
+ - task:
17
+ name: Text Classification
18
+ type: text-classification
19
+ dataset:
20
+ name: GLUE MRPC
21
+ type: glue
22
+ args: mrpc
23
+ metrics:
24
+ - name: Accuracy
25
+ type: accuracy
26
+ value: 0.7034313725490197
27
+ - name: F1
28
+ type: f1
29
+ value: 0.815267175572519
30
  ---
31
 
32
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
34
 
35
  # bert_base_km_20_v2_mrpc
36
 
37
+ This model is a fine-tuned version of [Hartunka/bert_base_km_20_v2](https://huggingface.co/Hartunka/bert_base_km_20_v2) on the GLUE MRPC dataset.
38
  It achieves the following results on the evaluation set:
39
+ - Loss: 0.6078
40
+ - Accuracy: 0.7034
41
+ - F1: 0.8153
42
+ - Combined Score: 0.7593
43
 
44
  ## Model description
45
 
all_results.json CHANGED
@@ -4,14 +4,14 @@
4
  "eval_combined_score": 0.7593492740607694,
5
  "eval_f1": 0.815267175572519,
6
  "eval_loss": 0.6078192591667175,
7
- "eval_runtime": 0.2942,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 1386.713,
10
- "eval_steps_per_second": 6.798,
11
  "total_flos": 3377819728711680.0,
12
  "train_loss": 0.36015133233297436,
13
- "train_runtime": 57.7393,
14
  "train_samples": 3668,
15
- "train_samples_per_second": 3176.344,
16
- "train_steps_per_second": 12.989
17
  }
 
4
  "eval_combined_score": 0.7593492740607694,
5
  "eval_f1": 0.815267175572519,
6
  "eval_loss": 0.6078192591667175,
7
+ "eval_runtime": 0.2924,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 1395.509,
10
+ "eval_steps_per_second": 6.841,
11
  "total_flos": 3377819728711680.0,
12
  "train_loss": 0.36015133233297436,
13
+ "train_runtime": 59.2376,
14
  "train_samples": 3668,
15
+ "train_samples_per_second": 3096.005,
16
+ "train_steps_per_second": 12.661
17
  }
eval_results.json CHANGED
@@ -4,8 +4,8 @@
4
  "eval_combined_score": 0.7593492740607694,
5
  "eval_f1": 0.815267175572519,
6
  "eval_loss": 0.6078192591667175,
7
- "eval_runtime": 0.2942,
8
  "eval_samples": 408,
9
- "eval_samples_per_second": 1386.713,
10
- "eval_steps_per_second": 6.798
11
  }
 
4
  "eval_combined_score": 0.7593492740607694,
5
  "eval_f1": 0.815267175572519,
6
  "eval_loss": 0.6078192591667175,
7
+ "eval_runtime": 0.2924,
8
  "eval_samples": 408,
9
+ "eval_samples_per_second": 1395.509,
10
+ "eval_steps_per_second": 6.841
11
  }
logs/events.out.tfevents.1745398577.s_005_m.2876923.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:391e2bee57ddcbf934a1e30b4f280958f37c077f9a2695c4d5c67d70a26d7452
3
+ size 459
train_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 7.0,
3
  "total_flos": 3377819728711680.0,
4
  "train_loss": 0.36015133233297436,
5
- "train_runtime": 57.7393,
6
  "train_samples": 3668,
7
- "train_samples_per_second": 3176.344,
8
- "train_steps_per_second": 12.989
9
  }
 
2
  "epoch": 7.0,
3
  "total_flos": 3377819728711680.0,
4
  "train_loss": 0.36015133233297436,
5
+ "train_runtime": 59.2376,
6
  "train_samples": 3668,
7
+ "train_samples_per_second": 3096.005,
8
+ "train_steps_per_second": 12.661
9
  }
trainer_state.json CHANGED
@@ -22,9 +22,9 @@
22
  "eval_combined_score": 0.740016030108726,
23
  "eval_f1": 0.7962085308056872,
24
  "eval_loss": 0.616814136505127,
25
- "eval_runtime": 0.2757,
26
- "eval_samples_per_second": 1480.037,
27
- "eval_steps_per_second": 7.255,
28
  "step": 15
29
  },
30
  {
@@ -40,9 +40,9 @@
40
  "eval_combined_score": 0.7593492740607694,
41
  "eval_f1": 0.815267175572519,
42
  "eval_loss": 0.6078192591667175,
43
- "eval_runtime": 0.2689,
44
- "eval_samples_per_second": 1517.136,
45
- "eval_steps_per_second": 7.437,
46
  "step": 30
47
  },
48
  {
@@ -58,9 +58,9 @@
58
  "eval_combined_score": 0.7530461066215624,
59
  "eval_f1": 0.805111821086262,
60
  "eval_loss": 0.6499011516571045,
61
- "eval_runtime": 0.2843,
62
- "eval_samples_per_second": 1435.076,
63
- "eval_steps_per_second": 7.035,
64
  "step": 45
65
  },
66
  {
@@ -76,9 +76,9 @@
76
  "eval_combined_score": 0.7396096088521171,
77
  "eval_f1": 0.7855917667238422,
78
  "eval_loss": 0.6939632892608643,
79
- "eval_runtime": 0.2783,
80
- "eval_samples_per_second": 1466.162,
81
- "eval_steps_per_second": 7.187,
82
  "step": 60
83
  },
84
  {
@@ -94,9 +94,9 @@
94
  "eval_combined_score": 0.6798529411764705,
95
  "eval_f1": 0.72,
96
  "eval_loss": 0.876370906829834,
97
- "eval_runtime": 0.2728,
98
- "eval_samples_per_second": 1495.769,
99
- "eval_steps_per_second": 7.332,
100
  "step": 75
101
  },
102
  {
@@ -112,9 +112,9 @@
112
  "eval_combined_score": 0.7140350877192982,
113
  "eval_f1": 0.7614035087719299,
114
  "eval_loss": 1.1046664714813232,
115
- "eval_runtime": 0.2749,
116
- "eval_samples_per_second": 1483.97,
117
- "eval_steps_per_second": 7.274,
118
  "step": 90
119
  },
120
  {
@@ -130,9 +130,9 @@
130
  "eval_combined_score": 0.7327924273157539,
131
  "eval_f1": 0.7793103448275862,
132
  "eval_loss": 1.2587286233901978,
133
- "eval_runtime": 0.2835,
134
- "eval_samples_per_second": 1439.35,
135
- "eval_steps_per_second": 7.056,
136
  "step": 105
137
  },
138
  {
@@ -140,9 +140,9 @@
140
  "step": 105,
141
  "total_flos": 3377819728711680.0,
142
  "train_loss": 0.36015133233297436,
143
- "train_runtime": 57.7393,
144
- "train_samples_per_second": 3176.344,
145
- "train_steps_per_second": 12.989
146
  }
147
  ],
148
  "logging_steps": 1,
 
22
  "eval_combined_score": 0.740016030108726,
23
  "eval_f1": 0.7962085308056872,
24
  "eval_loss": 0.616814136505127,
25
+ "eval_runtime": 0.2744,
26
+ "eval_samples_per_second": 1486.649,
27
+ "eval_steps_per_second": 7.287,
28
  "step": 15
29
  },
30
  {
 
40
  "eval_combined_score": 0.7593492740607694,
41
  "eval_f1": 0.815267175572519,
42
  "eval_loss": 0.6078192591667175,
43
+ "eval_runtime": 0.2706,
44
+ "eval_samples_per_second": 1507.857,
45
+ "eval_steps_per_second": 7.391,
46
  "step": 30
47
  },
48
  {
 
58
  "eval_combined_score": 0.7530461066215624,
59
  "eval_f1": 0.805111821086262,
60
  "eval_loss": 0.6499011516571045,
61
+ "eval_runtime": 0.2726,
62
+ "eval_samples_per_second": 1496.591,
63
+ "eval_steps_per_second": 7.336,
64
  "step": 45
65
  },
66
  {
 
76
  "eval_combined_score": 0.7396096088521171,
77
  "eval_f1": 0.7855917667238422,
78
  "eval_loss": 0.6939632892608643,
79
+ "eval_runtime": 0.2946,
80
+ "eval_samples_per_second": 1384.696,
81
+ "eval_steps_per_second": 6.788,
82
  "step": 60
83
  },
84
  {
 
94
  "eval_combined_score": 0.6798529411764705,
95
  "eval_f1": 0.72,
96
  "eval_loss": 0.876370906829834,
97
+ "eval_runtime": 0.2767,
98
+ "eval_samples_per_second": 1474.695,
99
+ "eval_steps_per_second": 7.229,
100
  "step": 75
101
  },
102
  {
 
112
  "eval_combined_score": 0.7140350877192982,
113
  "eval_f1": 0.7614035087719299,
114
  "eval_loss": 1.1046664714813232,
115
+ "eval_runtime": 0.2943,
116
+ "eval_samples_per_second": 1386.409,
117
+ "eval_steps_per_second": 6.796,
118
  "step": 90
119
  },
120
  {
 
130
  "eval_combined_score": 0.7327924273157539,
131
  "eval_f1": 0.7793103448275862,
132
  "eval_loss": 1.2587286233901978,
133
+ "eval_runtime": 0.2836,
134
+ "eval_samples_per_second": 1438.785,
135
+ "eval_steps_per_second": 7.053,
136
  "step": 105
137
  },
138
  {
 
140
  "step": 105,
141
  "total_flos": 3377819728711680.0,
142
  "train_loss": 0.36015133233297436,
143
+ "train_runtime": 59.2376,
144
+ "train_samples_per_second": 3096.005,
145
+ "train_steps_per_second": 12.661
146
  }
147
  ],
148
  "logging_steps": 1,