Merikatori committed on
Commit
c0acdbf
·
verified ·
1 Parent(s): 536f80b

Upload folder using huggingface_hub

Browse files
checkpoint-465/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "best_global_step": 465,
3
- "best_metric": 0.7698383516941082,
4
  "best_model_checkpoint": "/kaggle/working/transformer_output/checkpoint-465",
5
  "epoch": 3.0,
6
  "eval_steps": 500,
@@ -32,18 +32,18 @@
32
  },
33
  {
34
  "epoch": 1.0,
35
- "eval_accuracy": 0.8886423239862821,
36
- "eval_f1": 0.8959192934594974,
37
- "eval_hate_f1": 0.47107438016528924,
38
- "eval_hate_prec": 0.3886363636363636,
39
- "eval_hate_rec": 0.5979020979020979,
40
- "eval_loss": 0.26823195815086365,
41
- "eval_macro_f1": 0.7588550972474853,
42
- "eval_precision": 0.9065499982342927,
43
- "eval_recall": 0.8886423239862821,
44
- "eval_runtime": 8.5862,
45
- "eval_samples_per_second": 577.325,
46
- "eval_steps_per_second": 9.084,
47
  "step": 155
48
  },
49
  {
@@ -69,18 +69,18 @@
69
  },
70
  {
71
  "epoch": 2.0,
72
- "eval_accuracy": 0.8912648779503732,
73
- "eval_f1": 0.8998036744615823,
74
- "eval_hate_f1": 0.4732620320855615,
75
- "eval_hate_prec": 0.38311688311688313,
76
- "eval_hate_rec": 0.6188811188811189,
77
- "eval_loss": 0.2427479773759842,
78
- "eval_macro_f1": 0.7651698753431324,
79
- "eval_precision": 0.913809087207257,
80
- "eval_recall": 0.8912648779503732,
81
- "eval_runtime": 8.6774,
82
- "eval_samples_per_second": 571.253,
83
- "eval_steps_per_second": 8.989,
84
  "step": 310
85
  },
86
  {
@@ -106,18 +106,18 @@
106
  },
107
  {
108
  "epoch": 3.0,
109
- "eval_accuracy": 0.8912648779503732,
110
- "eval_f1": 0.8998510802952099,
111
- "eval_hate_f1": 0.48548812664907653,
112
- "eval_hate_prec": 0.3898305084745763,
113
- "eval_hate_rec": 0.6433566433566433,
114
- "eval_loss": 0.24792158603668213,
115
- "eval_macro_f1": 0.7698383516941082,
116
- "eval_precision": 0.9136908950590453,
117
- "eval_recall": 0.8912648779503732,
118
- "eval_runtime": 8.7831,
119
- "eval_samples_per_second": 564.382,
120
- "eval_steps_per_second": 8.881,
121
  "step": 465
122
  }
123
  ],
 
1
  {
2
  "best_global_step": 465,
3
+ "best_metric": 0.7806512878301866,
4
  "best_model_checkpoint": "/kaggle/working/transformer_output/checkpoint-465",
5
  "epoch": 3.0,
6
  "eval_steps": 500,
 
32
  },
33
  {
34
  "epoch": 1.0,
35
+ "eval_accuracy": 0.8930589184826473,
36
+ "eval_f1": 0.900084594871237,
37
+ "eval_hate_f1": 0.5027322404371585,
38
+ "eval_hate_prec": 0.4125560538116592,
39
+ "eval_hate_rec": 0.6433566433566433,
40
+ "eval_loss": 0.2638593912124634,
41
+ "eval_macro_f1": 0.7711109967956045,
42
+ "eval_precision": 0.9107537030140248,
43
+ "eval_recall": 0.8930589184826473,
44
+ "eval_runtime": 4.8064,
45
+ "eval_samples_per_second": 515.563,
46
+ "eval_steps_per_second": 8.114,
47
  "step": 155
48
  },
49
  {
 
69
  },
70
  {
71
  "epoch": 2.0,
72
+ "eval_accuracy": 0.8930589184826473,
73
+ "eval_f1": 0.9015939212097996,
74
+ "eval_hate_f1": 0.49604221635883905,
75
+ "eval_hate_prec": 0.3983050847457627,
76
+ "eval_hate_rec": 0.6573426573426573,
77
+ "eval_loss": 0.24266110360622406,
78
+ "eval_macro_f1": 0.7724936604193823,
79
+ "eval_precision": 0.9157473422011047,
80
+ "eval_recall": 0.8930589184826473,
81
+ "eval_runtime": 4.9035,
82
+ "eval_samples_per_second": 505.358,
83
+ "eval_steps_per_second": 7.954,
84
  "step": 310
85
  },
86
  {
 
106
  },
107
  {
108
  "epoch": 3.0,
109
+ "eval_accuracy": 0.8970944309927361,
110
+ "eval_f1": 0.9050220867632944,
111
+ "eval_hate_f1": 0.5053191489361702,
112
+ "eval_hate_prec": 0.40772532188841204,
113
+ "eval_hate_rec": 0.6643356643356644,
114
+ "eval_loss": 0.23981328308582306,
115
+ "eval_macro_f1": 0.7806512878301866,
116
+ "eval_precision": 0.9177721181109427,
117
+ "eval_recall": 0.8970944309927361,
118
+ "eval_runtime": 4.8801,
119
+ "eval_samples_per_second": 507.772,
120
+ "eval_steps_per_second": 7.992,
121
  "step": 465
122
  }
123
  ],
checkpoint-775/trainer_state.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "best_global_step": 465,
3
- "best_metric": 0.7698383516941082,
4
  "best_model_checkpoint": "/kaggle/working/transformer_output/checkpoint-465",
5
  "epoch": 5.0,
6
  "eval_steps": 500,
@@ -32,18 +32,18 @@
32
  },
33
  {
34
  "epoch": 1.0,
35
- "eval_accuracy": 0.8886423239862821,
36
- "eval_f1": 0.8959192934594974,
37
- "eval_hate_f1": 0.47107438016528924,
38
- "eval_hate_prec": 0.3886363636363636,
39
- "eval_hate_rec": 0.5979020979020979,
40
- "eval_loss": 0.26823195815086365,
41
- "eval_macro_f1": 0.7588550972474853,
42
- "eval_precision": 0.9065499982342927,
43
- "eval_recall": 0.8886423239862821,
44
- "eval_runtime": 8.5862,
45
- "eval_samples_per_second": 577.325,
46
- "eval_steps_per_second": 9.084,
47
  "step": 155
48
  },
49
  {
@@ -69,18 +69,18 @@
69
  },
70
  {
71
  "epoch": 2.0,
72
- "eval_accuracy": 0.8912648779503732,
73
- "eval_f1": 0.8998036744615823,
74
- "eval_hate_f1": 0.4732620320855615,
75
- "eval_hate_prec": 0.38311688311688313,
76
- "eval_hate_rec": 0.6188811188811189,
77
- "eval_loss": 0.2427479773759842,
78
- "eval_macro_f1": 0.7651698753431324,
79
- "eval_precision": 0.913809087207257,
80
- "eval_recall": 0.8912648779503732,
81
- "eval_runtime": 8.6774,
82
- "eval_samples_per_second": 571.253,
83
- "eval_steps_per_second": 8.989,
84
  "step": 310
85
  },
86
  {
@@ -106,18 +106,18 @@
106
  },
107
  {
108
  "epoch": 3.0,
109
- "eval_accuracy": 0.8912648779503732,
110
- "eval_f1": 0.8998510802952099,
111
- "eval_hate_f1": 0.48548812664907653,
112
- "eval_hate_prec": 0.3898305084745763,
113
- "eval_hate_rec": 0.6433566433566433,
114
- "eval_loss": 0.24792158603668213,
115
- "eval_macro_f1": 0.7698383516941082,
116
- "eval_precision": 0.9136908950590453,
117
- "eval_recall": 0.8912648779503732,
118
- "eval_runtime": 8.7831,
119
- "eval_samples_per_second": 564.382,
120
- "eval_steps_per_second": 8.881,
121
  "step": 465
122
  },
123
  {
@@ -143,18 +143,18 @@
143
  },
144
  {
145
  "epoch": 4.0,
146
- "eval_accuracy": 0.8809763970143232,
147
- "eval_f1": 0.8935393778095193,
148
- "eval_hate_f1": 0.464839094159714,
149
- "eval_hate_prec": 0.352622061482821,
150
- "eval_hate_rec": 0.6818181818181818,
151
- "eval_loss": 0.2574857175350189,
152
- "eval_macro_f1": 0.760244573017305,
153
- "eval_precision": 0.9147072848857565,
154
- "eval_recall": 0.8809763970143232,
155
- "eval_runtime": 8.7972,
156
- "eval_samples_per_second": 563.474,
157
- "eval_steps_per_second": 8.866,
158
  "step": 620
159
  },
160
  {
@@ -180,18 +180,18 @@
180
  },
181
  {
182
  "epoch": 5.0,
183
- "eval_accuracy": 0.878353843050232,
184
- "eval_f1": 0.8912320589311761,
185
- "eval_hate_f1": 0.4591715976331361,
186
- "eval_hate_prec": 0.3470483005366726,
187
- "eval_hate_rec": 0.6783216783216783,
188
- "eval_loss": 0.2623799443244934,
189
- "eval_macro_f1": 0.7572637429327783,
190
- "eval_precision": 0.9126253015348699,
191
- "eval_recall": 0.878353843050232,
192
- "eval_runtime": 8.7768,
193
- "eval_samples_per_second": 564.787,
194
- "eval_steps_per_second": 8.887,
195
  "step": 775
196
  }
197
  ],
 
1
  {
2
  "best_global_step": 465,
3
+ "best_metric": 0.7806512878301866,
4
  "best_model_checkpoint": "/kaggle/working/transformer_output/checkpoint-465",
5
  "epoch": 5.0,
6
  "eval_steps": 500,
 
32
  },
33
  {
34
  "epoch": 1.0,
35
+ "eval_accuracy": 0.8930589184826473,
36
+ "eval_f1": 0.900084594871237,
37
+ "eval_hate_f1": 0.5027322404371585,
38
+ "eval_hate_prec": 0.4125560538116592,
39
+ "eval_hate_rec": 0.6433566433566433,
40
+ "eval_loss": 0.2638593912124634,
41
+ "eval_macro_f1": 0.7711109967956045,
42
+ "eval_precision": 0.9107537030140248,
43
+ "eval_recall": 0.8930589184826473,
44
+ "eval_runtime": 4.8064,
45
+ "eval_samples_per_second": 515.563,
46
+ "eval_steps_per_second": 8.114,
47
  "step": 155
48
  },
49
  {
 
69
  },
70
  {
71
  "epoch": 2.0,
72
+ "eval_accuracy": 0.8930589184826473,
73
+ "eval_f1": 0.9015939212097996,
74
+ "eval_hate_f1": 0.49604221635883905,
75
+ "eval_hate_prec": 0.3983050847457627,
76
+ "eval_hate_rec": 0.6573426573426573,
77
+ "eval_loss": 0.24266110360622406,
78
+ "eval_macro_f1": 0.7724936604193823,
79
+ "eval_precision": 0.9157473422011047,
80
+ "eval_recall": 0.8930589184826473,
81
+ "eval_runtime": 4.9035,
82
+ "eval_samples_per_second": 505.358,
83
+ "eval_steps_per_second": 7.954,
84
  "step": 310
85
  },
86
  {
 
106
  },
107
  {
108
  "epoch": 3.0,
109
+ "eval_accuracy": 0.8970944309927361,
110
+ "eval_f1": 0.9050220867632944,
111
+ "eval_hate_f1": 0.5053191489361702,
112
+ "eval_hate_prec": 0.40772532188841204,
113
+ "eval_hate_rec": 0.6643356643356644,
114
+ "eval_loss": 0.23981328308582306,
115
+ "eval_macro_f1": 0.7806512878301866,
116
+ "eval_precision": 0.9177721181109427,
117
+ "eval_recall": 0.8970944309927361,
118
+ "eval_runtime": 4.8801,
119
+ "eval_samples_per_second": 507.772,
120
+ "eval_steps_per_second": 7.992,
121
  "step": 465
122
  },
123
  {
 
143
  },
144
  {
145
  "epoch": 4.0,
146
+ "eval_accuracy": 0.887409200968523,
147
+ "eval_f1": 0.8985370069312554,
148
+ "eval_hate_f1": 0.47665847665847666,
149
+ "eval_hate_prec": 0.36742424242424243,
150
+ "eval_hate_rec": 0.6783216783216783,
151
+ "eval_loss": 0.24611614644527435,
152
+ "eval_macro_f1": 0.7688956887260704,
153
+ "eval_precision": 0.9169174752269499,
154
+ "eval_recall": 0.887409200968523,
155
+ "eval_runtime": 4.927,
156
+ "eval_samples_per_second": 502.941,
157
+ "eval_steps_per_second": 7.916,
158
  "step": 620
159
  },
160
  {
 
180
  },
181
  {
182
  "epoch": 5.0,
183
+ "eval_accuracy": 0.8857949959644875,
184
+ "eval_f1": 0.8976954173118289,
185
+ "eval_hate_f1": 0.472289156626506,
186
+ "eval_hate_prec": 0.3602941176470588,
187
+ "eval_hate_rec": 0.6853146853146853,
188
+ "eval_loss": 0.2520979344844818,
189
+ "eval_macro_f1": 0.7679642000169223,
190
+ "eval_precision": 0.9173899334739389,
191
+ "eval_recall": 0.8857949959644875,
192
+ "eval_runtime": 4.8991,
193
+ "eval_samples_per_second": 505.803,
194
+ "eval_steps_per_second": 7.961,
195
  "step": 775
196
  }
197
  ],