Training in progress, epoch 0, checkpoint
Browse files
checkpoint-584/config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "
|
| 3 |
"activation_dropout": 0.1,
|
| 4 |
"activation_function": "gelu",
|
| 5 |
"add_bias_logits": false,
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "nour4286/ArabartModel",
|
| 3 |
"activation_dropout": 0.1,
|
| 4 |
"activation_function": "gelu",
|
| 5 |
"add_bias_logits": false,
|
checkpoint-584/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 557116312
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:76e84445a191839edf84f1d889f276068e769f9a8bf0b989becc3c63c9de697c
|
| 3 |
size 557116312
|
checkpoint-584/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1113991930
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3f520b58c6b87f0f6763b360b74cc218710b87ec4cbc35eaa497a7804486ef2f
|
| 3 |
size 1113991930
|
checkpoint-584/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d9e95035cb1be4618fab3d17f62392c1067c951be1666c8daa0117fb090bb41
|
| 3 |
size 14244
|
checkpoint-584/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2ab9cec4ef0efd312094946ebfdfc4c402610c2b3c556c08dc380f086b68177c
|
| 3 |
size 1064
|
checkpoint-584/trainer_state.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"best_metric":
|
| 3 |
"best_model_checkpoint": "/content/drive/MyDrive/Arabart/checkpoint-584",
|
| 4 |
"epoch": 0.9986106658116918,
|
| 5 |
"eval_steps": 500,
|
|
@@ -10,27 +10,27 @@
|
|
| 10 |
"log_history": [
|
| 11 |
{
|
| 12 |
"epoch": 0.8549748851127498,
|
| 13 |
-
"grad_norm":
|
| 14 |
-
"learning_rate": 4.
|
| 15 |
-
"loss": 2.
|
| 16 |
"step": 500
|
| 17 |
},
|
| 18 |
{
|
| 19 |
"epoch": 0.9986106658116918,
|
| 20 |
-
"eval_loss": 2.
|
| 21 |
-
"eval_rouge1":
|
| 22 |
-
"eval_rouge2": 11.
|
| 23 |
-
"eval_rougeL": 23.
|
| 24 |
-
"eval_runtime":
|
| 25 |
-
"eval_samples_per_second": 5.
|
| 26 |
-
"eval_steps_per_second": 1.
|
| 27 |
"step": 584
|
| 28 |
}
|
| 29 |
],
|
| 30 |
"logging_steps": 500,
|
| 31 |
-
"max_steps":
|
| 32 |
"num_input_tokens_seen": 0,
|
| 33 |
-
"num_train_epochs":
|
| 34 |
"save_steps": 500,
|
| 35 |
"stateful_callbacks": {
|
| 36 |
"TrainerControl": {
|
|
@@ -44,7 +44,7 @@
|
|
| 44 |
"attributes": {}
|
| 45 |
}
|
| 46 |
},
|
| 47 |
-
"total_flos":
|
| 48 |
"train_batch_size": 4,
|
| 49 |
"trial_name": null,
|
| 50 |
"trial_params": null
|
|
|
|
| 1 |
{
|
| 2 |
+
"best_metric": 27.3096,
|
| 3 |
"best_model_checkpoint": "/content/drive/MyDrive/Arabart/checkpoint-584",
|
| 4 |
"epoch": 0.9986106658116918,
|
| 5 |
"eval_steps": 500,
|
|
|
|
| 10 |
"log_history": [
|
| 11 |
{
|
| 12 |
"epoch": 0.8549748851127498,
|
| 13 |
+
"grad_norm": 1.4868409633636475,
|
| 14 |
+
"learning_rate": 4.9128919860627184e-05,
|
| 15 |
+
"loss": 2.0944,
|
| 16 |
"step": 500
|
| 17 |
},
|
| 18 |
{
|
| 19 |
"epoch": 0.9986106658116918,
|
| 20 |
+
"eval_loss": 2.504359483718872,
|
| 21 |
+
"eval_rouge1": 27.3096,
|
| 22 |
+
"eval_rouge2": 11.4756,
|
| 23 |
+
"eval_rougeL": 23.8611,
|
| 24 |
+
"eval_runtime": 914.3973,
|
| 25 |
+
"eval_samples_per_second": 5.128,
|
| 26 |
+
"eval_steps_per_second": 1.283,
|
| 27 |
"step": 584
|
| 28 |
}
|
| 29 |
],
|
| 30 |
"logging_steps": 500,
|
| 31 |
+
"max_steps": 14600,
|
| 32 |
"num_input_tokens_seen": 0,
|
| 33 |
+
"num_train_epochs": 25,
|
| 34 |
"save_steps": 500,
|
| 35 |
"stateful_callbacks": {
|
| 36 |
"TrainerControl": {
|
|
|
|
| 44 |
"attributes": {}
|
| 45 |
}
|
| 46 |
},
|
| 47 |
+
"total_flos": 1.893105654301901e+16,
|
| 48 |
"train_batch_size": 4,
|
| 49 |
"trial_name": null,
|
| 50 |
"trial_params": null
|
checkpoint-584/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 7032
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:576ede367e64eecc72993edf5019ca711a039a382e750df6eee9b32df90b34f4
|
| 3 |
size 7032
|