Upload pharo KD Optuna tinyBERT checkpoint
Browse files
checkpoints/pharo/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 57416816
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:39c3ec0d25f882af507bd9a3bd3f7cc4bcccf7ad72d4eecf7055aa5dee426d63
|
| 3 |
size 57416816
|
checkpoints/pharo/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5969
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7e4a77e46e9a135af00e8d7bca9030f79a10543a89d5fec47b6da79a48fd9e3
|
| 3 |
size 5969
|
checkpoints/pharo/trial_config.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
-
"lr":
|
| 3 |
-
"batch_size":
|
| 4 |
-
"epochs":
|
| 5 |
-
"temperature":
|
| 6 |
-
"lambda_hard": 0.
|
| 7 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"lr": 3.0496367190909535e-05,
|
| 3 |
+
"batch_size": 32,
|
| 4 |
+
"epochs": 20,
|
| 5 |
+
"temperature": 5.189451597700736,
|
| 6 |
+
"lambda_hard": 0.22898937800658187
|
| 7 |
}
|
checkpoints/pharo/trial_metrics.json
CHANGED
|
@@ -1,25 +1,25 @@
|
|
| 1 |
{
|
| 2 |
-
"eval_loss":
|
| 3 |
-
"eval_macro_f1": 0.
|
| 4 |
-
"eval_micro_f1": 0.
|
| 5 |
-
"eval_macro_precision": 0.
|
| 6 |
-
"eval_macro_recall": 0.
|
| 7 |
"eval_thresholds": {
|
| 8 |
-
"Keyimplementationpoints": 0.
|
| 9 |
-
"Example": 0.
|
| 10 |
-
"Responsibilities": 0.
|
| 11 |
-
"Intent": 0.
|
| 12 |
-
"Keymessages": 0.
|
| 13 |
"Collaborators": 0.54
|
| 14 |
},
|
| 15 |
-
"eval_f1_Keyimplementationpoints": 0.
|
| 16 |
-
"eval_f1_Example": 0.
|
| 17 |
-
"eval_f1_Responsibilities": 0.
|
| 18 |
-
"eval_f1_Intent": 0.
|
| 19 |
-
"eval_f1_Keymessages": 0.
|
| 20 |
-
"eval_f1_Collaborators": 0.
|
| 21 |
-
"eval_runtime": 0.
|
| 22 |
-
"eval_samples_per_second":
|
| 23 |
-
"eval_steps_per_second":
|
| 24 |
-
"epoch":
|
| 25 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"eval_loss": 14.538175582885742,
|
| 3 |
+
"eval_macro_f1": 0.6880698513817102,
|
| 4 |
+
"eval_micro_f1": 0.7300884955752213,
|
| 5 |
+
"eval_macro_precision": 0.669729216505182,
|
| 6 |
+
"eval_macro_recall": 0.7177189227751025,
|
| 7 |
"eval_thresholds": {
|
| 8 |
+
"Keyimplementationpoints": 0.44000000000000006,
|
| 9 |
+
"Example": 0.56,
|
| 10 |
+
"Responsibilities": 0.5000000000000001,
|
| 11 |
+
"Intent": 0.56,
|
| 12 |
+
"Keymessages": 0.5000000000000001,
|
| 13 |
"Collaborators": 0.54
|
| 14 |
},
|
| 15 |
+
"eval_f1_Keyimplementationpoints": 0.5070422535211268,
|
| 16 |
+
"eval_f1_Example": 0.8837209302325582,
|
| 17 |
+
"eval_f1_Responsibilities": 0.6511627906976745,
|
| 18 |
+
"eval_f1_Intent": 0.926829268292683,
|
| 19 |
+
"eval_f1_Keymessages": 0.5882352941176471,
|
| 20 |
+
"eval_f1_Collaborators": 0.5714285714285714,
|
| 21 |
+
"eval_runtime": 0.2497,
|
| 22 |
+
"eval_samples_per_second": 833.13,
|
| 23 |
+
"eval_steps_per_second": 28.038,
|
| 24 |
+
"epoch": 20.0
|
| 25 |
}
|