End of training
Browse files
- README.md +3 -1
- all_results.json +9 -9
- eval_results.json +3 -3
- predict_tr_results.json +3 -3
- train_results.json +3 -3
- trainer_state.json +3 -3
README.md
CHANGED
|
@@ -4,6 +4,8 @@ license: apache-2.0
|
|
| 4 |
base_model: albert/albert-base-v2
|
| 5 |
tags:
|
| 6 |
- generated_from_trainer
|
|
|
|
|
|
|
| 7 |
model-index:
|
| 8 |
- name: squad_albert_finetuned2
|
| 9 |
results: []
|
|
@@ -14,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
|
|
| 14 |
|
| 15 |
# squad_albert_finetuned2
|
| 16 |
|
| 17 |
-
This model is a fine-tuned version of [albert/albert-base-v2](https://huggingface.co/albert/albert-base-v2) on an unknown dataset.
|
| 18 |
|
| 19 |
## Model description
|
| 20 |
|
|
|
|
| 4 |
base_model: albert/albert-base-v2
|
| 5 |
tags:
|
| 6 |
- generated_from_trainer
|
| 7 |
+
datasets:
|
| 8 |
+
- squad
|
| 9 |
model-index:
|
| 10 |
- name: squad_albert_finetuned2
|
| 11 |
results: []
|
|
|
|
| 16 |
|
| 17 |
# squad_albert_finetuned2
|
| 18 |
|
| 19 |
+
This model is a fine-tuned version of [albert/albert-base-v2](https://huggingface.co/albert/albert-base-v2) on the squad dataset.
|
| 20 |
|
| 21 |
## Model description
|
| 22 |
|
all_results.json
CHANGED
|
@@ -602,20 +602,20 @@
|
|
| 602 |
"epoch": 1.0,
|
| 603 |
"eval_exact_match": 13.0,
|
| 604 |
"eval_f1": 22.02673682526624,
|
| 605 |
-
"eval_runtime": 3.
|
| 606 |
"eval_samples": 100,
|
| 607 |
-
"eval_samples_per_second": 29.
|
| 608 |
-
"eval_steps_per_second": 3.
|
| 609 |
"predict_samples_tr": 100,
|
| 610 |
"test_exact_match": 33.0,
|
| 611 |
"test_f1": 43.51652920179235,
|
| 612 |
-
"test_runtime": 3.
|
| 613 |
-
"test_samples_per_second": 31.
|
| 614 |
-
"test_steps_per_second": 4.
|
| 615 |
"total_flos": 1656285235200.0,
|
| 616 |
"train_loss": 0.0,
|
| 617 |
-
"train_runtime": 1.
|
| 618 |
"train_samples": 100,
|
| 619 |
-
"train_samples_per_second":
|
| 620 |
-
"train_steps_per_second":
|
| 621 |
}
|
|
|
|
| 602 |
"epoch": 1.0,
|
| 603 |
"eval_exact_match": 13.0,
|
| 604 |
"eval_f1": 22.02673682526624,
|
| 605 |
+
"eval_runtime": 3.4116,
|
| 606 |
"eval_samples": 100,
|
| 607 |
+
"eval_samples_per_second": 29.312,
|
| 608 |
+
"eval_steps_per_second": 3.811,
|
| 609 |
"predict_samples_tr": 100,
|
| 610 |
"test_exact_match": 33.0,
|
| 611 |
"test_f1": 43.51652920179235,
|
| 612 |
+
"test_runtime": 3.1834,
|
| 613 |
+
"test_samples_per_second": 31.413,
|
| 614 |
+
"test_steps_per_second": 4.084,
|
| 615 |
"total_flos": 1656285235200.0,
|
| 616 |
"train_loss": 0.0,
|
| 617 |
+
"train_runtime": 1.5301,
|
| 618 |
"train_samples": 100,
|
| 619 |
+
"train_samples_per_second": 65.355,
|
| 620 |
+
"train_steps_per_second": 32.677
|
| 621 |
}
|
eval_results.json
CHANGED
|
@@ -2,8 +2,8 @@
|
|
| 2 |
"epoch": 1.0,
|
| 3 |
"eval_exact_match": 13.0,
|
| 4 |
"eval_f1": 22.02673682526624,
|
| 5 |
-
"eval_runtime": 3.
|
| 6 |
"eval_samples": 100,
|
| 7 |
-
"eval_samples_per_second": 29.
|
| 8 |
-
"eval_steps_per_second": 3.
|
| 9 |
}
|
|
|
|
| 2 |
"epoch": 1.0,
|
| 3 |
"eval_exact_match": 13.0,
|
| 4 |
"eval_f1": 22.02673682526624,
|
| 5 |
+
"eval_runtime": 3.4116,
|
| 6 |
"eval_samples": 100,
|
| 7 |
+
"eval_samples_per_second": 29.312,
|
| 8 |
+
"eval_steps_per_second": 3.811
|
| 9 |
}
|
predict_tr_results.json
CHANGED
|
@@ -2,7 +2,7 @@
|
|
| 2 |
"predict_samples_tr": 100,
|
| 3 |
"test_exact_match": 33.0,
|
| 4 |
"test_f1": 43.51652920179235,
|
| 5 |
-
"test_runtime": 3.
|
| 6 |
-
"test_samples_per_second": 31.
|
| 7 |
-
"test_steps_per_second": 4.
|
| 8 |
}
|
|
|
|
| 2 |
"predict_samples_tr": 100,
|
| 3 |
"test_exact_match": 33.0,
|
| 4 |
"test_f1": 43.51652920179235,
|
| 5 |
+
"test_runtime": 3.1834,
|
| 6 |
+
"test_samples_per_second": 31.413,
|
| 7 |
+
"test_steps_per_second": 4.084
|
| 8 |
}
|
train_results.json
CHANGED
|
@@ -2,8 +2,8 @@
|
|
| 2 |
"epoch": 1.0,
|
| 3 |
"total_flos": 1656285235200.0,
|
| 4 |
"train_loss": 0.0,
|
| 5 |
-
"train_runtime": 1.
|
| 6 |
"train_samples": 100,
|
| 7 |
-
"train_samples_per_second":
|
| 8 |
-
"train_steps_per_second":
|
| 9 |
}
|
|
|
|
| 2 |
"epoch": 1.0,
|
| 3 |
"total_flos": 1656285235200.0,
|
| 4 |
"train_loss": 0.0,
|
| 5 |
+
"train_runtime": 1.5301,
|
| 6 |
"train_samples": 100,
|
| 7 |
+
"train_samples_per_second": 65.355,
|
| 8 |
+
"train_steps_per_second": 32.677
|
| 9 |
}
|
trainer_state.json
CHANGED
|
@@ -13,9 +13,9 @@
|
|
| 13 |
"step": 50,
|
| 14 |
"total_flos": 1656285235200.0,
|
| 15 |
"train_loss": 0.0,
|
| 16 |
-
"train_runtime": 1.
|
| 17 |
-
"train_samples_per_second":
|
| 18 |
-
"train_steps_per_second":
|
| 19 |
}
|
| 20 |
],
|
| 21 |
"logging_steps": 500,
|
|
|
|
| 13 |
"step": 50,
|
| 14 |
"total_flos": 1656285235200.0,
|
| 15 |
"train_loss": 0.0,
|
| 16 |
+
"train_runtime": 1.5301,
|
| 17 |
+
"train_samples_per_second": 65.355,
|
| 18 |
+
"train_steps_per_second": 32.677
|
| 19 |
}
|
| 20 |
],
|
| 21 |
"logging_steps": 500,
|