Training in progress, step 120
Browse files- adapter_model.safetensors +1 -1
- metrics.json +1 -0
- state.json +3 -3
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 35668592
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:991de16316201409d6ee8026268d6e6f98363867bb77e38a127dc24aad73c65c
|
| 3 |
size 35668592
|
metrics.json
CHANGED
|
@@ -3,3 +3,4 @@
|
|
| 3 |
{"Step":60,"eval_loss":1.6613901854,"eval_runtime":295.5311,"eval_samples_per_second":3.384,"eval_steps_per_second":0.423,"epoch":0.48}
|
| 4 |
{"Step":80,"eval_loss":1.6176079512,"eval_runtime":295.123,"eval_samples_per_second":3.388,"eval_steps_per_second":0.424,"epoch":0.64}
|
| 5 |
{"Step":100,"eval_loss":1.5983840227,"eval_runtime":296.3017,"eval_samples_per_second":3.375,"eval_steps_per_second":0.422,"epoch":0.8}
|
|
|
|
|
|
| 3 |
{"Step":60,"eval_loss":1.6613901854,"eval_runtime":295.5311,"eval_samples_per_second":3.384,"eval_steps_per_second":0.423,"epoch":0.48}
|
| 4 |
{"Step":80,"eval_loss":1.6176079512,"eval_runtime":295.123,"eval_samples_per_second":3.388,"eval_steps_per_second":0.424,"epoch":0.64}
|
| 5 |
{"Step":100,"eval_loss":1.5983840227,"eval_runtime":296.3017,"eval_samples_per_second":3.375,"eval_steps_per_second":0.422,"epoch":0.8}
|
| 6 |
+
{"Step":120,"eval_loss":1.5859812498,"eval_runtime":295.6456,"eval_samples_per_second":3.382,"eval_steps_per_second":0.423,"epoch":0.96}
|
state.json
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
-
"epoch": 0.
|
| 5 |
"eval_steps": 20,
|
| 6 |
-
"global_step":
|
| 7 |
"is_hyper_param_search": false,
|
| 8 |
"is_local_process_zero": true,
|
| 9 |
"is_world_process_zero": true,
|
|
@@ -101,7 +101,7 @@
|
|
| 101 |
"attributes": {}
|
| 102 |
}
|
| 103 |
},
|
| 104 |
-
"total_flos":
|
| 105 |
"train_batch_size": 8,
|
| 106 |
"trial_name": null,
|
| 107 |
"trial_params": null
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
+
"epoch": 0.96,
|
| 5 |
"eval_steps": 20,
|
| 6 |
+
"global_step": 120,
|
| 7 |
"is_hyper_param_search": false,
|
| 8 |
"is_local_process_zero": true,
|
| 9 |
"is_world_process_zero": true,
|
|
|
|
| 101 |
"attributes": {}
|
| 102 |
}
|
| 103 |
},
|
| 104 |
+
"total_flos": 8703928606310400.0,
|
| 105 |
"train_batch_size": 8,
|
| 106 |
"trial_name": null,
|
| 107 |
"trial_params": null
|