Upload folder using huggingface_hub
Browse files- checkpoint-465/trainer_state.json +37 -37
- checkpoint-775/trainer_state.json +61 -61
checkpoint-465/trainer_state.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"best_global_step": 465,
|
| 3 |
-
"best_metric": 0.
|
| 4 |
"best_model_checkpoint": "/kaggle/working/transformer_output/checkpoint-465",
|
| 5 |
"epoch": 3.0,
|
| 6 |
"eval_steps": 500,
|
|
@@ -32,18 +32,18 @@
|
|
| 32 |
},
|
| 33 |
{
|
| 34 |
"epoch": 1.0,
|
| 35 |
-
"eval_accuracy": 0.
|
| 36 |
-
"eval_f1": 0.
|
| 37 |
-
"eval_hate_f1": 0.
|
| 38 |
-
"eval_hate_prec": 0.
|
| 39 |
-
"eval_hate_rec": 0.
|
| 40 |
-
"eval_loss": 0.
|
| 41 |
-
"eval_macro_f1": 0.
|
| 42 |
-
"eval_precision": 0.
|
| 43 |
-
"eval_recall": 0.
|
| 44 |
-
"eval_runtime":
|
| 45 |
-
"eval_samples_per_second":
|
| 46 |
-
"eval_steps_per_second":
|
| 47 |
"step": 155
|
| 48 |
},
|
| 49 |
{
|
|
@@ -69,18 +69,18 @@
|
|
| 69 |
},
|
| 70 |
{
|
| 71 |
"epoch": 2.0,
|
| 72 |
-
"eval_accuracy": 0.
|
| 73 |
-
"eval_f1": 0.
|
| 74 |
-
"eval_hate_f1": 0.
|
| 75 |
-
"eval_hate_prec": 0.
|
| 76 |
-
"eval_hate_rec": 0.
|
| 77 |
-
"eval_loss": 0.
|
| 78 |
-
"eval_macro_f1": 0.
|
| 79 |
-
"eval_precision": 0.
|
| 80 |
-
"eval_recall": 0.
|
| 81 |
-
"eval_runtime":
|
| 82 |
-
"eval_samples_per_second":
|
| 83 |
-
"eval_steps_per_second":
|
| 84 |
"step": 310
|
| 85 |
},
|
| 86 |
{
|
|
@@ -106,18 +106,18 @@
|
|
| 106 |
},
|
| 107 |
{
|
| 108 |
"epoch": 3.0,
|
| 109 |
-
"eval_accuracy": 0.
|
| 110 |
-
"eval_f1": 0.
|
| 111 |
-
"eval_hate_f1": 0.
|
| 112 |
-
"eval_hate_prec": 0.
|
| 113 |
-
"eval_hate_rec": 0.
|
| 114 |
-
"eval_loss": 0.
|
| 115 |
-
"eval_macro_f1": 0.
|
| 116 |
-
"eval_precision": 0.
|
| 117 |
-
"eval_recall": 0.
|
| 118 |
-
"eval_runtime":
|
| 119 |
-
"eval_samples_per_second":
|
| 120 |
-
"eval_steps_per_second":
|
| 121 |
"step": 465
|
| 122 |
}
|
| 123 |
],
|
|
|
|
| 1 |
{
|
| 2 |
"best_global_step": 465,
|
| 3 |
+
"best_metric": 0.7806512878301866,
|
| 4 |
"best_model_checkpoint": "/kaggle/working/transformer_output/checkpoint-465",
|
| 5 |
"epoch": 3.0,
|
| 6 |
"eval_steps": 500,
|
|
|
|
| 32 |
},
|
| 33 |
{
|
| 34 |
"epoch": 1.0,
|
| 35 |
+
"eval_accuracy": 0.8930589184826473,
|
| 36 |
+
"eval_f1": 0.900084594871237,
|
| 37 |
+
"eval_hate_f1": 0.5027322404371585,
|
| 38 |
+
"eval_hate_prec": 0.4125560538116592,
|
| 39 |
+
"eval_hate_rec": 0.6433566433566433,
|
| 40 |
+
"eval_loss": 0.2638593912124634,
|
| 41 |
+
"eval_macro_f1": 0.7711109967956045,
|
| 42 |
+
"eval_precision": 0.9107537030140248,
|
| 43 |
+
"eval_recall": 0.8930589184826473,
|
| 44 |
+
"eval_runtime": 4.8064,
|
| 45 |
+
"eval_samples_per_second": 515.563,
|
| 46 |
+
"eval_steps_per_second": 8.114,
|
| 47 |
"step": 155
|
| 48 |
},
|
| 49 |
{
|
|
|
|
| 69 |
},
|
| 70 |
{
|
| 71 |
"epoch": 2.0,
|
| 72 |
+
"eval_accuracy": 0.8930589184826473,
|
| 73 |
+
"eval_f1": 0.9015939212097996,
|
| 74 |
+
"eval_hate_f1": 0.49604221635883905,
|
| 75 |
+
"eval_hate_prec": 0.3983050847457627,
|
| 76 |
+
"eval_hate_rec": 0.6573426573426573,
|
| 77 |
+
"eval_loss": 0.24266110360622406,
|
| 78 |
+
"eval_macro_f1": 0.7724936604193823,
|
| 79 |
+
"eval_precision": 0.9157473422011047,
|
| 80 |
+
"eval_recall": 0.8930589184826473,
|
| 81 |
+
"eval_runtime": 4.9035,
|
| 82 |
+
"eval_samples_per_second": 505.358,
|
| 83 |
+
"eval_steps_per_second": 7.954,
|
| 84 |
"step": 310
|
| 85 |
},
|
| 86 |
{
|
|
|
|
| 106 |
},
|
| 107 |
{
|
| 108 |
"epoch": 3.0,
|
| 109 |
+
"eval_accuracy": 0.8970944309927361,
|
| 110 |
+
"eval_f1": 0.9050220867632944,
|
| 111 |
+
"eval_hate_f1": 0.5053191489361702,
|
| 112 |
+
"eval_hate_prec": 0.40772532188841204,
|
| 113 |
+
"eval_hate_rec": 0.6643356643356644,
|
| 114 |
+
"eval_loss": 0.23981328308582306,
|
| 115 |
+
"eval_macro_f1": 0.7806512878301866,
|
| 116 |
+
"eval_precision": 0.9177721181109427,
|
| 117 |
+
"eval_recall": 0.8970944309927361,
|
| 118 |
+
"eval_runtime": 4.8801,
|
| 119 |
+
"eval_samples_per_second": 507.772,
|
| 120 |
+
"eval_steps_per_second": 7.992,
|
| 121 |
"step": 465
|
| 122 |
}
|
| 123 |
],
|
checkpoint-775/trainer_state.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"best_global_step": 465,
|
| 3 |
-
"best_metric": 0.
|
| 4 |
"best_model_checkpoint": "/kaggle/working/transformer_output/checkpoint-465",
|
| 5 |
"epoch": 5.0,
|
| 6 |
"eval_steps": 500,
|
|
@@ -32,18 +32,18 @@
|
|
| 32 |
},
|
| 33 |
{
|
| 34 |
"epoch": 1.0,
|
| 35 |
-
"eval_accuracy": 0.
|
| 36 |
-
"eval_f1": 0.
|
| 37 |
-
"eval_hate_f1": 0.
|
| 38 |
-
"eval_hate_prec": 0.
|
| 39 |
-
"eval_hate_rec": 0.
|
| 40 |
-
"eval_loss": 0.
|
| 41 |
-
"eval_macro_f1": 0.
|
| 42 |
-
"eval_precision": 0.
|
| 43 |
-
"eval_recall": 0.
|
| 44 |
-
"eval_runtime":
|
| 45 |
-
"eval_samples_per_second":
|
| 46 |
-
"eval_steps_per_second":
|
| 47 |
"step": 155
|
| 48 |
},
|
| 49 |
{
|
|
@@ -69,18 +69,18 @@
|
|
| 69 |
},
|
| 70 |
{
|
| 71 |
"epoch": 2.0,
|
| 72 |
-
"eval_accuracy": 0.
|
| 73 |
-
"eval_f1": 0.
|
| 74 |
-
"eval_hate_f1": 0.
|
| 75 |
-
"eval_hate_prec": 0.
|
| 76 |
-
"eval_hate_rec": 0.
|
| 77 |
-
"eval_loss": 0.
|
| 78 |
-
"eval_macro_f1": 0.
|
| 79 |
-
"eval_precision": 0.
|
| 80 |
-
"eval_recall": 0.
|
| 81 |
-
"eval_runtime":
|
| 82 |
-
"eval_samples_per_second":
|
| 83 |
-
"eval_steps_per_second":
|
| 84 |
"step": 310
|
| 85 |
},
|
| 86 |
{
|
|
@@ -106,18 +106,18 @@
|
|
| 106 |
},
|
| 107 |
{
|
| 108 |
"epoch": 3.0,
|
| 109 |
-
"eval_accuracy": 0.
|
| 110 |
-
"eval_f1": 0.
|
| 111 |
-
"eval_hate_f1": 0.
|
| 112 |
-
"eval_hate_prec": 0.
|
| 113 |
-
"eval_hate_rec": 0.
|
| 114 |
-
"eval_loss": 0.
|
| 115 |
-
"eval_macro_f1": 0.
|
| 116 |
-
"eval_precision": 0.
|
| 117 |
-
"eval_recall": 0.
|
| 118 |
-
"eval_runtime":
|
| 119 |
-
"eval_samples_per_second":
|
| 120 |
-
"eval_steps_per_second":
|
| 121 |
"step": 465
|
| 122 |
},
|
| 123 |
{
|
|
@@ -143,18 +143,18 @@
|
|
| 143 |
},
|
| 144 |
{
|
| 145 |
"epoch": 4.0,
|
| 146 |
-
"eval_accuracy": 0.
|
| 147 |
-
"eval_f1": 0.
|
| 148 |
-
"eval_hate_f1": 0.
|
| 149 |
-
"eval_hate_prec": 0.
|
| 150 |
-
"eval_hate_rec": 0.
|
| 151 |
-
"eval_loss": 0.
|
| 152 |
-
"eval_macro_f1": 0.
|
| 153 |
-
"eval_precision": 0.
|
| 154 |
-
"eval_recall": 0.
|
| 155 |
-
"eval_runtime":
|
| 156 |
-
"eval_samples_per_second":
|
| 157 |
-
"eval_steps_per_second":
|
| 158 |
"step": 620
|
| 159 |
},
|
| 160 |
{
|
|
@@ -180,18 +180,18 @@
|
|
| 180 |
},
|
| 181 |
{
|
| 182 |
"epoch": 5.0,
|
| 183 |
-
"eval_accuracy": 0.
|
| 184 |
-
"eval_f1": 0.
|
| 185 |
-
"eval_hate_f1": 0.
|
| 186 |
-
"eval_hate_prec": 0.
|
| 187 |
-
"eval_hate_rec": 0.
|
| 188 |
-
"eval_loss": 0.
|
| 189 |
-
"eval_macro_f1": 0.
|
| 190 |
-
"eval_precision": 0.
|
| 191 |
-
"eval_recall": 0.
|
| 192 |
-
"eval_runtime":
|
| 193 |
-
"eval_samples_per_second":
|
| 194 |
-
"eval_steps_per_second":
|
| 195 |
"step": 775
|
| 196 |
}
|
| 197 |
],
|
|
|
|
| 1 |
{
|
| 2 |
"best_global_step": 465,
|
| 3 |
+
"best_metric": 0.7806512878301866,
|
| 4 |
"best_model_checkpoint": "/kaggle/working/transformer_output/checkpoint-465",
|
| 5 |
"epoch": 5.0,
|
| 6 |
"eval_steps": 500,
|
|
|
|
| 32 |
},
|
| 33 |
{
|
| 34 |
"epoch": 1.0,
|
| 35 |
+
"eval_accuracy": 0.8930589184826473,
|
| 36 |
+
"eval_f1": 0.900084594871237,
|
| 37 |
+
"eval_hate_f1": 0.5027322404371585,
|
| 38 |
+
"eval_hate_prec": 0.4125560538116592,
|
| 39 |
+
"eval_hate_rec": 0.6433566433566433,
|
| 40 |
+
"eval_loss": 0.2638593912124634,
|
| 41 |
+
"eval_macro_f1": 0.7711109967956045,
|
| 42 |
+
"eval_precision": 0.9107537030140248,
|
| 43 |
+
"eval_recall": 0.8930589184826473,
|
| 44 |
+
"eval_runtime": 4.8064,
|
| 45 |
+
"eval_samples_per_second": 515.563,
|
| 46 |
+
"eval_steps_per_second": 8.114,
|
| 47 |
"step": 155
|
| 48 |
},
|
| 49 |
{
|
|
|
|
| 69 |
},
|
| 70 |
{
|
| 71 |
"epoch": 2.0,
|
| 72 |
+
"eval_accuracy": 0.8930589184826473,
|
| 73 |
+
"eval_f1": 0.9015939212097996,
|
| 74 |
+
"eval_hate_f1": 0.49604221635883905,
|
| 75 |
+
"eval_hate_prec": 0.3983050847457627,
|
| 76 |
+
"eval_hate_rec": 0.6573426573426573,
|
| 77 |
+
"eval_loss": 0.24266110360622406,
|
| 78 |
+
"eval_macro_f1": 0.7724936604193823,
|
| 79 |
+
"eval_precision": 0.9157473422011047,
|
| 80 |
+
"eval_recall": 0.8930589184826473,
|
| 81 |
+
"eval_runtime": 4.9035,
|
| 82 |
+
"eval_samples_per_second": 505.358,
|
| 83 |
+
"eval_steps_per_second": 7.954,
|
| 84 |
"step": 310
|
| 85 |
},
|
| 86 |
{
|
|
|
|
| 106 |
},
|
| 107 |
{
|
| 108 |
"epoch": 3.0,
|
| 109 |
+
"eval_accuracy": 0.8970944309927361,
|
| 110 |
+
"eval_f1": 0.9050220867632944,
|
| 111 |
+
"eval_hate_f1": 0.5053191489361702,
|
| 112 |
+
"eval_hate_prec": 0.40772532188841204,
|
| 113 |
+
"eval_hate_rec": 0.6643356643356644,
|
| 114 |
+
"eval_loss": 0.23981328308582306,
|
| 115 |
+
"eval_macro_f1": 0.7806512878301866,
|
| 116 |
+
"eval_precision": 0.9177721181109427,
|
| 117 |
+
"eval_recall": 0.8970944309927361,
|
| 118 |
+
"eval_runtime": 4.8801,
|
| 119 |
+
"eval_samples_per_second": 507.772,
|
| 120 |
+
"eval_steps_per_second": 7.992,
|
| 121 |
"step": 465
|
| 122 |
},
|
| 123 |
{
|
|
|
|
| 143 |
},
|
| 144 |
{
|
| 145 |
"epoch": 4.0,
|
| 146 |
+
"eval_accuracy": 0.887409200968523,
|
| 147 |
+
"eval_f1": 0.8985370069312554,
|
| 148 |
+
"eval_hate_f1": 0.47665847665847666,
|
| 149 |
+
"eval_hate_prec": 0.36742424242424243,
|
| 150 |
+
"eval_hate_rec": 0.6783216783216783,
|
| 151 |
+
"eval_loss": 0.24611614644527435,
|
| 152 |
+
"eval_macro_f1": 0.7688956887260704,
|
| 153 |
+
"eval_precision": 0.9169174752269499,
|
| 154 |
+
"eval_recall": 0.887409200968523,
|
| 155 |
+
"eval_runtime": 4.927,
|
| 156 |
+
"eval_samples_per_second": 502.941,
|
| 157 |
+
"eval_steps_per_second": 7.916,
|
| 158 |
"step": 620
|
| 159 |
},
|
| 160 |
{
|
|
|
|
| 180 |
},
|
| 181 |
{
|
| 182 |
"epoch": 5.0,
|
| 183 |
+
"eval_accuracy": 0.8857949959644875,
|
| 184 |
+
"eval_f1": 0.8976954173118289,
|
| 185 |
+
"eval_hate_f1": 0.472289156626506,
|
| 186 |
+
"eval_hate_prec": 0.3602941176470588,
|
| 187 |
+
"eval_hate_rec": 0.6853146853146853,
|
| 188 |
+
"eval_loss": 0.2520979344844818,
|
| 189 |
+
"eval_macro_f1": 0.7679642000169223,
|
| 190 |
+
"eval_precision": 0.9173899334739389,
|
| 191 |
+
"eval_recall": 0.8857949959644875,
|
| 192 |
+
"eval_runtime": 4.8991,
|
| 193 |
+
"eval_samples_per_second": 505.803,
|
| 194 |
+
"eval_steps_per_second": 7.961,
|
| 195 |
"step": 775
|
| 196 |
}
|
| 197 |
],
|