Training in progress, step 1350
Browse files- adapter_model.safetensors +1 -1
- trainer_log.jsonl +6 -0
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 25200088
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:42e5c6f577a5db1527d5fde86c1e8af7d9c8b94e21324e7861916ef3352adc90
|
| 3 |
size 25200088
|
trainer_log.jsonl
CHANGED
|
@@ -154,3 +154,9 @@
|
|
| 154 |
{"current_steps": 1290, "total_steps": 1500, "loss": 0.1807, "accuracy": 0.925000011920929, "learning_rate": 2.3793236883495164e-07, "epoch": 1.1082939406961754, "percentage": 86.0, "elapsed_time": "2:49:50", "remaining_time": "0:27:38", "throughput": "0.00", "total_tokens": 0}
|
| 155 |
{"current_steps": 1300, "total_steps": 1500, "loss": 0.2061, "accuracy": 0.949999988079071, "learning_rate": 2.1613635589349756e-07, "epoch": 1.1168886978942845, "percentage": 86.67, "elapsed_time": "2:51:00", "remaining_time": "0:26:18", "throughput": "0.00", "total_tokens": 0}
|
| 156 |
{"current_steps": 1300, "total_steps": 1500, "eval_loss": 0.21187786757946014, "epoch": 1.1168886978942845, "percentage": 86.67, "elapsed_time": "2:51:26", "remaining_time": "0:26:22", "throughput": "0.00", "total_tokens": 0}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 154 |
{"current_steps": 1290, "total_steps": 1500, "loss": 0.1807, "accuracy": 0.925000011920929, "learning_rate": 2.3793236883495164e-07, "epoch": 1.1082939406961754, "percentage": 86.0, "elapsed_time": "2:49:50", "remaining_time": "0:27:38", "throughput": "0.00", "total_tokens": 0}
|
| 155 |
{"current_steps": 1300, "total_steps": 1500, "loss": 0.2061, "accuracy": 0.949999988079071, "learning_rate": 2.1613635589349756e-07, "epoch": 1.1168886978942845, "percentage": 86.67, "elapsed_time": "2:51:00", "remaining_time": "0:26:18", "throughput": "0.00", "total_tokens": 0}
|
| 156 |
{"current_steps": 1300, "total_steps": 1500, "eval_loss": 0.21187786757946014, "epoch": 1.1168886978942845, "percentage": 86.67, "elapsed_time": "2:51:26", "remaining_time": "0:26:22", "throughput": "0.00", "total_tokens": 0}
|
| 157 |
+
{"current_steps": 1310, "total_steps": 1500, "loss": 0.1841, "accuracy": 0.949999988079071, "learning_rate": 1.95342121028749e-07, "epoch": 1.1254834550923936, "percentage": 87.33, "elapsed_time": "2:52:51", "remaining_time": "0:25:04", "throughput": "0.00", "total_tokens": 0}
|
| 158 |
+
{"current_steps": 1320, "total_steps": 1500, "loss": 0.191, "accuracy": 0.9750000238418579, "learning_rate": 1.7555878527937164e-07, "epoch": 1.1340782122905029, "percentage": 88.0, "elapsed_time": "2:54:09", "remaining_time": "0:23:44", "throughput": "0.00", "total_tokens": 0}
|
| 159 |
+
{"current_steps": 1330, "total_steps": 1500, "loss": 0.1726, "accuracy": 0.9624999761581421, "learning_rate": 1.567950262702714e-07, "epoch": 1.142672969488612, "percentage": 88.67, "elapsed_time": "2:55:22", "remaining_time": "0:22:25", "throughput": "0.00", "total_tokens": 0}
|
| 160 |
+
{"current_steps": 1340, "total_steps": 1500, "loss": 0.1844, "accuracy": 0.949999988079071, "learning_rate": 1.3905907440629752e-07, "epoch": 1.151267726686721, "percentage": 89.33, "elapsed_time": "2:56:34", "remaining_time": "0:21:04", "throughput": "0.00", "total_tokens": 0}
|
| 161 |
+
{"current_steps": 1350, "total_steps": 1500, "loss": 0.1844, "accuracy": 0.949999988079071, "learning_rate": 1.223587092621162e-07, "epoch": 1.1598624838848304, "percentage": 90.0, "elapsed_time": "2:57:46", "remaining_time": "0:19:45", "throughput": "0.00", "total_tokens": 0}
|
| 162 |
+
{"current_steps": 1350, "total_steps": 1500, "eval_loss": 0.21017144620418549, "epoch": 1.1598624838848304, "percentage": 90.0, "elapsed_time": "2:58:12", "remaining_time": "0:19:48", "throughput": "0.00", "total_tokens": 0}
|