Training in progress, epoch 1

Files changed (5) hide show

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:70a84472690ee94ab4fc659ce9e59640181ccab26852ca8f51cb4760acbd3e15
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:e51c2b68688c65e39784574e2ad95ce905566522879d31f116353b01de077bed
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0b3aac3ab3987ddf2f2467de7884bdd6fb0ca1ea94a3647bace1ed0a4671ef62
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:212595710eb925e97b45a355a9bcf17f2538ff211915ba56385a1bb83c42ac26
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3e8dcea7a77027536c9481f78daa46e228058f3440d46feac4ae483c529615a1
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:e0162f29fbce7b0f4ab1459375afe66c24a32fdcb304d2c57a78fe3ad90d9a5a
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6d56c2833c3de7d70bb5a80d665e5e5888d1d9e006c29af2f9b6f31b2c85f31c
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:2848e2acc1061595ba5ff316a24e3fb017e7bc278f4a96f0a206cdc9271d3707
 size 1168138808

trainer_log.jsonl CHANGED Viewed

@@ -2,3 +2,8 @@
 {"current_steps": 20, "total_steps": 99, "loss": 0.7619, "lr": 5e-06, "epoch": 0.5904059040590406, "percentage": 20.2, "elapsed_time": "0:10:42", "remaining_time": "0:42:19"}
 {"current_steps": 30, "total_steps": 99, "loss": 0.7397, "lr": 5e-06, "epoch": 0.8856088560885609, "percentage": 30.3, "elapsed_time": "0:16:02", "remaining_time": "0:36:53"}
 {"current_steps": 33, "total_steps": 99, "eval_loss": 0.7080272436141968, "epoch": 0.974169741697417, "percentage": 33.33, "elapsed_time": "0:18:19", "remaining_time": "0:36:38"}

 {"current_steps": 20, "total_steps": 99, "loss": 0.7619, "lr": 5e-06, "epoch": 0.5904059040590406, "percentage": 20.2, "elapsed_time": "0:10:42", "remaining_time": "0:42:19"}
 {"current_steps": 30, "total_steps": 99, "loss": 0.7397, "lr": 5e-06, "epoch": 0.8856088560885609, "percentage": 30.3, "elapsed_time": "0:16:02", "remaining_time": "0:36:53"}
 {"current_steps": 33, "total_steps": 99, "eval_loss": 0.7080272436141968, "epoch": 0.974169741697417, "percentage": 33.33, "elapsed_time": "0:18:19", "remaining_time": "0:36:38"}
+{"current_steps": 40, "total_steps": 99, "loss": 0.7258, "lr": 5e-06, "epoch": 1.1918819188191883, "percentage": 40.4, "elapsed_time": "0:23:00", "remaining_time": "0:33:55"}
+{"current_steps": 50, "total_steps": 99, "loss": 0.6617, "lr": 5e-06, "epoch": 1.4870848708487086, "percentage": 50.51, "elapsed_time": "0:28:20", "remaining_time": "0:27:46"}
+{"current_steps": 60, "total_steps": 99, "loss": 0.6487, "lr": 5e-06, "epoch": 1.7822878228782288, "percentage": 60.61, "elapsed_time": "0:33:40", "remaining_time": "0:21:53"}
+{"current_steps": 67, "total_steps": 99, "eval_loss": 0.6627019643783569, "epoch": 1.988929889298893, "percentage": 67.68, "elapsed_time": "0:37:45", "remaining_time": "0:18:01"}
+{"current_steps": 70, "total_steps": 99, "loss": 0.6553, "lr": 5e-06, "epoch": 2.088560885608856, "percentage": 70.71, "elapsed_time": "0:40:37", "remaining_time": "0:16:49"}