Training in progress, step 60
Browse files- adapter_model.safetensors +1 -1
- metrics.json +1 -1
- state.json +3 -3
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 35668592
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:124ef4fdc953020354a6a08a184b25002db40ec1092366cacb4e27ba354d142f
|
| 3 |
size 35668592
|
metrics.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
-
{"Step":60,"eval_loss":1.6613901854,"eval_runtime":295.5311,"eval_samples_per_second":3.384,"eval_steps_per_second":0.423,"epoch":0.48}
|
| 2 |
{"Step":80,"eval_loss":1.6176079512,"eval_runtime":295.123,"eval_samples_per_second":3.388,"eval_steps_per_second":0.424,"epoch":0.64}
|
| 3 |
{"Step":100,"eval_loss":1.5983840227,"eval_runtime":296.3017,"eval_samples_per_second":3.375,"eval_steps_per_second":0.422,"epoch":0.8}
|
| 4 |
{"Step":120,"eval_loss":1.5859812498,"eval_runtime":295.6456,"eval_samples_per_second":3.382,"eval_steps_per_second":0.423,"epoch":0.96}
|
| 5 |
{"Step":20,"eval_loss":1.8241591454,"eval_runtime":297.4682,"eval_samples_per_second":3.362,"eval_steps_per_second":0.42,"epoch":0.16}
|
| 6 |
{"Step":40,"eval_loss":1.5385681391,"eval_runtime":304.6057,"eval_samples_per_second":3.283,"eval_steps_per_second":0.41,"epoch":0.32}
|
|
|
|
|
|
|
|
|
| 1 |
{"Step":80,"eval_loss":1.6176079512,"eval_runtime":295.123,"eval_samples_per_second":3.388,"eval_steps_per_second":0.424,"epoch":0.64}
|
| 2 |
{"Step":100,"eval_loss":1.5983840227,"eval_runtime":296.3017,"eval_samples_per_second":3.375,"eval_steps_per_second":0.422,"epoch":0.8}
|
| 3 |
{"Step":120,"eval_loss":1.5859812498,"eval_runtime":295.6456,"eval_samples_per_second":3.382,"eval_steps_per_second":0.423,"epoch":0.96}
|
| 4 |
{"Step":20,"eval_loss":1.8241591454,"eval_runtime":297.4682,"eval_samples_per_second":3.362,"eval_steps_per_second":0.42,"epoch":0.16}
|
| 5 |
{"Step":40,"eval_loss":1.5385681391,"eval_runtime":304.6057,"eval_samples_per_second":3.283,"eval_steps_per_second":0.41,"epoch":0.32}
|
| 6 |
+
{"Step":60,"eval_loss":1.503634572,"eval_runtime":304.4462,"eval_samples_per_second":3.285,"eval_steps_per_second":0.411,"epoch":0.48}
|
state.json
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
-
"epoch": 0.
|
| 5 |
"eval_steps": 20,
|
| 6 |
-
"global_step":
|
| 7 |
"is_hyper_param_search": false,
|
| 8 |
"is_local_process_zero": true,
|
| 9 |
"is_world_process_zero": true,
|
|
@@ -56,7 +56,7 @@
|
|
| 56 |
"attributes": {}
|
| 57 |
}
|
| 58 |
},
|
| 59 |
-
"total_flos":
|
| 60 |
"train_batch_size": 8,
|
| 61 |
"trial_name": null,
|
| 62 |
"trial_params": null
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": null,
|
| 3 |
"best_model_checkpoint": null,
|
| 4 |
+
"epoch": 0.48,
|
| 5 |
"eval_steps": 20,
|
| 6 |
+
"global_step": 60,
|
| 7 |
"is_hyper_param_search": false,
|
| 8 |
"is_local_process_zero": true,
|
| 9 |
"is_world_process_zero": true,
|
|
|
|
| 56 |
"attributes": {}
|
| 57 |
}
|
| 58 |
},
|
| 59 |
+
"total_flos": 3880094771036160.0,
|
| 60 |
"train_batch_size": 8,
|
| 61 |
"trial_name": null,
|
| 62 |
"trial_params": null
|