Training in progress, step 120
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +11 -0
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 80013120
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a8b443a7dc2992ee50b59246c313423fb72c73121010b72d7622b64f0ba1b215
|
| 3 |
size 80013120
|
trainer_log.jsonl
CHANGED
|
@@ -119,3 +119,14 @@
|
|
| 119 |
{"current_steps": 109, "total_steps": 125, "loss": 0.1084, "lr": 4.951556604879048e-06, "epoch": 4.306172839506173, "percentage": 87.2, "elapsed_time": "0:57:53", "remaining_time": "0:08:29"}
|
| 120 |
{"current_steps": 110, "total_steps": 125, "loss": 0.0893, "lr": 4.360836746934055e-06, "epoch": 4.345679012345679, "percentage": 88.0, "elapsed_time": "0:58:22", "remaining_time": "0:07:57"}
|
| 121 |
{"current_steps": 110, "total_steps": 125, "eval_loss": 0.15510736405849457, "epoch": 4.345679012345679, "percentage": 88.0, "elapsed_time": "0:58:47", "remaining_time": "0:08:01"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 119 |
{"current_steps": 109, "total_steps": 125, "loss": 0.1084, "lr": 4.951556604879048e-06, "epoch": 4.306172839506173, "percentage": 87.2, "elapsed_time": "0:57:53", "remaining_time": "0:08:29"}
|
| 120 |
{"current_steps": 110, "total_steps": 125, "loss": 0.0893, "lr": 4.360836746934055e-06, "epoch": 4.345679012345679, "percentage": 88.0, "elapsed_time": "0:58:22", "remaining_time": "0:07:57"}
|
| 121 |
{"current_steps": 110, "total_steps": 125, "eval_loss": 0.15510736405849457, "epoch": 4.345679012345679, "percentage": 88.0, "elapsed_time": "0:58:47", "remaining_time": "0:08:01"}
|
| 122 |
+
{"current_steps": 111, "total_steps": 125, "loss": 0.0718, "lr": 3.8060233744356633e-06, "epoch": 4.385185185185185, "percentage": 88.8, "elapsed_time": "0:59:19", "remaining_time": "0:07:29"}
|
| 123 |
+
{"current_steps": 112, "total_steps": 125, "loss": 0.1311, "lr": 3.2875529852700147e-06, "epoch": 4.424691358024692, "percentage": 89.6, "elapsed_time": "0:59:51", "remaining_time": "0:06:56"}
|
| 124 |
+
{"current_steps": 113, "total_steps": 125, "loss": 0.0756, "lr": 2.8058334845816213e-06, "epoch": 4.4641975308641975, "percentage": 90.4, "elapsed_time": "1:00:19", "remaining_time": "0:06:24"}
|
| 125 |
+
{"current_steps": 114, "total_steps": 125, "loss": 0.087, "lr": 2.361243863855184e-06, "epoch": 4.503703703703704, "percentage": 91.2, "elapsed_time": "1:00:48", "remaining_time": "0:05:52"}
|
| 126 |
+
{"current_steps": 115, "total_steps": 125, "loss": 0.0901, "lr": 1.9541339027450256e-06, "epoch": 4.54320987654321, "percentage": 92.0, "elapsed_time": "1:01:16", "remaining_time": "0:05:19"}
|
| 127 |
+
{"current_steps": 116, "total_steps": 125, "loss": 0.0835, "lr": 1.584823893886933e-06, "epoch": 4.582716049382716, "percentage": 92.8, "elapsed_time": "1:01:41", "remaining_time": "0:04:47"}
|
| 128 |
+
{"current_steps": 117, "total_steps": 125, "loss": 0.0946, "lr": 1.2536043909088191e-06, "epoch": 4.622222222222222, "percentage": 93.6, "elapsed_time": "1:02:10", "remaining_time": "0:04:15"}
|
| 129 |
+
{"current_steps": 118, "total_steps": 125, "loss": 0.1277, "lr": 9.607359798384785e-07, "epoch": 4.661728395061728, "percentage": 94.4, "elapsed_time": "1:02:37", "remaining_time": "0:03:42"}
|
| 130 |
+
{"current_steps": 119, "total_steps": 125, "loss": 0.1015, "lr": 7.064490740882057e-07, "epoch": 4.701234567901235, "percentage": 95.2, "elapsed_time": "1:03:05", "remaining_time": "0:03:10"}
|
| 131 |
+
{"current_steps": 120, "total_steps": 125, "loss": 0.1005, "lr": 4.909437331777179e-07, "epoch": 4.7407407407407405, "percentage": 96.0, "elapsed_time": "1:03:36", "remaining_time": "0:02:39"}
|
| 132 |
+
{"current_steps": 120, "total_steps": 125, "eval_loss": 0.15540145337581635, "epoch": 4.7407407407407405, "percentage": 96.0, "elapsed_time": "1:04:01", "remaining_time": "0:02:40"}
|