Hartunka committed on
Commit
75a890f
·
verified ·
1 Parent(s): ce4bb0c

End of training

Browse files
README.md CHANGED
@@ -1,14 +1,32 @@
1
  ---
2
  library_name: transformers
 
 
3
  base_model: Hartunka/tiny_bert_km_5_v2
4
  tags:
5
  - generated_from_trainer
 
 
6
  metrics:
7
  - matthews_correlation
8
  - accuracy
9
  model-index:
10
  - name: tiny_bert_km_5_v2_cola
11
- results: []
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
  ---
13
 
14
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
@@ -16,11 +34,11 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # tiny_bert_km_5_v2_cola
18
 
19
- This model is a fine-tuned version of [Hartunka/tiny_bert_km_5_v2](https://huggingface.co/Hartunka/tiny_bert_km_5_v2) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 0.7225
22
- - Matthews Correlation: 0.0664
23
- - Accuracy: 0.6433
24
 
25
  ## Model description
26
 
 
1
  ---
2
  library_name: transformers
3
+ language:
4
+ - en
5
  base_model: Hartunka/tiny_bert_km_5_v2
6
  tags:
7
  - generated_from_trainer
8
+ datasets:
9
+ - glue
10
  metrics:
11
  - matthews_correlation
12
  - accuracy
13
  model-index:
14
  - name: tiny_bert_km_5_v2_cola
15
+ results:
16
+ - task:
17
+ name: Text Classification
18
+ type: text-classification
19
+ dataset:
20
+ name: GLUE COLA
21
+ type: glue
22
+ args: cola
23
+ metrics:
24
+ - name: Matthews Correlation
25
+ type: matthews_correlation
26
+ value: 0.0
27
+ - name: Accuracy
28
+ type: accuracy
29
+ value: 0.6912751793861389
30
  ---
31
 
32
  <!-- This model card has been generated automatically according to the information the Trainer had access to. You
 
34
 
35
  # tiny_bert_km_5_v2_cola
36
 
37
+ This model is a fine-tuned version of [Hartunka/tiny_bert_km_5_v2](https://huggingface.co/Hartunka/tiny_bert_km_5_v2) on the GLUE COLA dataset.
38
  It achieves the following results on the evaluation set:
39
+ - Loss: 0.6132
40
+ - Matthews Correlation: 0.0
41
+ - Accuracy: 0.6913
42
 
43
  ## Model description
44
 
all_results.json CHANGED
@@ -3,14 +3,14 @@
3
  "eval_accuracy": 0.6912751793861389,
4
  "eval_loss": 0.6132072806358337,
5
  "eval_matthews_correlation": 0.0,
6
- "eval_runtime": 0.3395,
7
  "eval_samples": 1043,
8
- "eval_samples_per_second": 3072.424,
9
- "eval_steps_per_second": 14.729,
10
  "total_flos": 1793902531485696.0,
11
  "train_loss": 0.5503367466085097,
12
- "train_runtime": 45.4021,
13
  "train_samples": 8551,
14
- "train_samples_per_second": 9416.971,
15
- "train_steps_per_second": 37.443
16
  }
 
3
  "eval_accuracy": 0.6912751793861389,
4
  "eval_loss": 0.6132072806358337,
5
  "eval_matthews_correlation": 0.0,
6
+ "eval_runtime": 0.35,
7
  "eval_samples": 1043,
8
+ "eval_samples_per_second": 2979.605,
9
+ "eval_steps_per_second": 14.284,
10
  "total_flos": 1793902531485696.0,
11
  "train_loss": 0.5503367466085097,
12
+ "train_runtime": 46.3757,
13
  "train_samples": 8551,
14
+ "train_samples_per_second": 9219.277,
15
+ "train_steps_per_second": 36.657
16
  }
eval_results.json CHANGED
@@ -3,8 +3,8 @@
3
  "eval_accuracy": 0.6912751793861389,
4
  "eval_loss": 0.6132072806358337,
5
  "eval_matthews_correlation": 0.0,
6
- "eval_runtime": 0.3395,
7
  "eval_samples": 1043,
8
- "eval_samples_per_second": 3072.424,
9
- "eval_steps_per_second": 14.729
10
  }
 
3
  "eval_accuracy": 0.6912751793861389,
4
  "eval_loss": 0.6132072806358337,
5
  "eval_matthews_correlation": 0.0,
6
+ "eval_runtime": 0.35,
7
  "eval_samples": 1043,
8
+ "eval_samples_per_second": 2979.605,
9
+ "eval_steps_per_second": 14.284
10
  }
logs/events.out.tfevents.1745268024.s_005_m.2836625.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:806f8964113ce247bcb412364e918fc6c0a8118353cfb0194c4f502ea8078f25
3
+ size 427
train_results.json CHANGED
@@ -2,8 +2,8 @@
2
  "epoch": 8.0,
3
  "total_flos": 1793902531485696.0,
4
  "train_loss": 0.5503367466085097,
5
- "train_runtime": 45.4021,
6
  "train_samples": 8551,
7
- "train_samples_per_second": 9416.971,
8
- "train_steps_per_second": 37.443
9
  }
 
2
  "epoch": 8.0,
3
  "total_flos": 1793902531485696.0,
4
  "train_loss": 0.5503367466085097,
5
+ "train_runtime": 46.3757,
6
  "train_samples": 8551,
7
+ "train_samples_per_second": 9219.277,
8
+ "train_steps_per_second": 36.657
9
  }
trainer_state.json CHANGED
@@ -21,9 +21,9 @@
21
  "eval_accuracy": 0.6912751793861389,
22
  "eval_loss": 0.6185938119888306,
23
  "eval_matthews_correlation": 0.0,
24
- "eval_runtime": 0.325,
25
- "eval_samples_per_second": 3208.865,
26
- "eval_steps_per_second": 15.383,
27
  "step": 34
28
  },
29
  {
@@ -38,9 +38,9 @@
38
  "eval_accuracy": 0.6912751793861389,
39
  "eval_loss": 0.6137447357177734,
40
  "eval_matthews_correlation": 0.0,
41
- "eval_runtime": 0.3406,
42
- "eval_samples_per_second": 3062.365,
43
- "eval_steps_per_second": 14.681,
44
  "step": 68
45
  },
46
  {
@@ -55,9 +55,9 @@
55
  "eval_accuracy": 0.6912751793861389,
56
  "eval_loss": 0.6132072806358337,
57
  "eval_matthews_correlation": 0.0,
58
- "eval_runtime": 0.3117,
59
- "eval_samples_per_second": 3346.424,
60
- "eval_steps_per_second": 16.042,
61
  "step": 102
62
  },
63
  {
@@ -72,9 +72,9 @@
72
  "eval_accuracy": 0.6922339200973511,
73
  "eval_loss": 0.6316416263580322,
74
  "eval_matthews_correlation": 0.0463559874942472,
75
- "eval_runtime": 0.3269,
76
- "eval_samples_per_second": 3190.096,
77
- "eval_steps_per_second": 15.293,
78
  "step": 136
79
  },
80
  {
@@ -89,9 +89,9 @@
89
  "eval_accuracy": 0.7027804255485535,
90
  "eval_loss": 0.6342248916625977,
91
  "eval_matthews_correlation": 0.17712606131822545,
92
- "eval_runtime": 0.3079,
93
- "eval_samples_per_second": 3387.574,
94
- "eval_steps_per_second": 16.24,
95
  "step": 170
96
  },
97
  {
@@ -106,9 +106,9 @@
106
  "eval_accuracy": 0.6318312287330627,
107
  "eval_loss": 0.6609932780265808,
108
  "eval_matthews_correlation": 0.08825845093702572,
109
- "eval_runtime": 0.3339,
110
- "eval_samples_per_second": 3123.819,
111
- "eval_steps_per_second": 14.975,
112
  "step": 204
113
  },
114
  {
@@ -123,9 +123,9 @@
123
  "eval_accuracy": 0.6778523325920105,
124
  "eval_loss": 0.7212586998939514,
125
  "eval_matthews_correlation": 0.07130170780284954,
126
- "eval_runtime": 0.3491,
127
- "eval_samples_per_second": 2987.563,
128
- "eval_steps_per_second": 14.322,
129
  "step": 238
130
  },
131
  {
@@ -140,9 +140,9 @@
140
  "eval_accuracy": 0.6433365345001221,
141
  "eval_loss": 0.7225203514099121,
142
  "eval_matthews_correlation": 0.06635583278930876,
143
- "eval_runtime": 0.3177,
144
- "eval_samples_per_second": 3283.145,
145
- "eval_steps_per_second": 15.739,
146
  "step": 272
147
  },
148
  {
@@ -150,9 +150,9 @@
150
  "step": 272,
151
  "total_flos": 1793902531485696.0,
152
  "train_loss": 0.5503367466085097,
153
- "train_runtime": 45.4021,
154
- "train_samples_per_second": 9416.971,
155
- "train_steps_per_second": 37.443
156
  }
157
  ],
158
  "logging_steps": 1,
 
21
  "eval_accuracy": 0.6912751793861389,
22
  "eval_loss": 0.6185938119888306,
23
  "eval_matthews_correlation": 0.0,
24
+ "eval_runtime": 0.3261,
25
+ "eval_samples_per_second": 3198.315,
26
+ "eval_steps_per_second": 15.332,
27
  "step": 34
28
  },
29
  {
 
38
  "eval_accuracy": 0.6912751793861389,
39
  "eval_loss": 0.6137447357177734,
40
  "eval_matthews_correlation": 0.0,
41
+ "eval_runtime": 0.3136,
42
+ "eval_samples_per_second": 3326.092,
43
+ "eval_steps_per_second": 15.945,
44
  "step": 68
45
  },
46
  {
 
55
  "eval_accuracy": 0.6912751793861389,
56
  "eval_loss": 0.6132072806358337,
57
  "eval_matthews_correlation": 0.0,
58
+ "eval_runtime": 0.3328,
59
+ "eval_samples_per_second": 3134.163,
60
+ "eval_steps_per_second": 15.025,
61
  "step": 102
62
  },
63
  {
 
72
  "eval_accuracy": 0.6922339200973511,
73
  "eval_loss": 0.6316416263580322,
74
  "eval_matthews_correlation": 0.0463559874942472,
75
+ "eval_runtime": 0.3268,
76
+ "eval_samples_per_second": 3191.404,
77
+ "eval_steps_per_second": 15.299,
78
  "step": 136
79
  },
80
  {
 
89
  "eval_accuracy": 0.7027804255485535,
90
  "eval_loss": 0.6342248916625977,
91
  "eval_matthews_correlation": 0.17712606131822545,
92
+ "eval_runtime": 0.3211,
93
+ "eval_samples_per_second": 3248.185,
94
+ "eval_steps_per_second": 15.571,
95
  "step": 170
96
  },
97
  {
 
106
  "eval_accuracy": 0.6318312287330627,
107
  "eval_loss": 0.6609932780265808,
108
  "eval_matthews_correlation": 0.08825845093702572,
109
+ "eval_runtime": 0.3814,
110
+ "eval_samples_per_second": 2734.581,
111
+ "eval_steps_per_second": 13.109,
112
  "step": 204
113
  },
114
  {
 
123
  "eval_accuracy": 0.6778523325920105,
124
  "eval_loss": 0.7212586998939514,
125
  "eval_matthews_correlation": 0.07130170780284954,
126
+ "eval_runtime": 0.3419,
127
+ "eval_samples_per_second": 3050.928,
128
+ "eval_steps_per_second": 14.626,
129
  "step": 238
130
  },
131
  {
 
140
  "eval_accuracy": 0.6433365345001221,
141
  "eval_loss": 0.7225203514099121,
142
  "eval_matthews_correlation": 0.06635583278930876,
143
+ "eval_runtime": 0.339,
144
+ "eval_samples_per_second": 3076.588,
145
+ "eval_steps_per_second": 14.749,
146
  "step": 272
147
  },
148
  {
 
150
  "step": 272,
151
  "total_flos": 1793902531485696.0,
152
  "train_loss": 0.5503367466085097,
153
+ "train_runtime": 46.3757,
154
+ "train_samples_per_second": 9219.277,
155
+ "train_steps_per_second": 36.657
156
  }
157
  ],
158
  "logging_steps": 1,