Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3fdc5e60ef036f23cdad5a1c98071df178493d5ead503805abcfcfd0437a624b
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af132704c6eab1afbdfb69a557a51726e853c5942f9fed895f156252e1ee7544
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c8c096ec018b1c335114f6f848a760002c066d6e9ab9afdd85666f1a5abf9e2
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0545853ccc9aaab23bba744cf260d87993666ab532e80c6778c912e559a56b04
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -65,3 +65,15 @@
|
|
| 65 |
{"current_steps": 65, "total_steps": 78, "loss": 0.6397, "lr": 8.271337313934869e-07, "epoch": 2.4683544303797467, "percentage": 83.33, "elapsed_time": "0:14:53", "remaining_time": "0:02:58"}
|
| 66 |
{"current_steps": 66, "total_steps": 78, "loss": 0.7229, "lr": 7.077560319906696e-07, "epoch": 2.5063291139240507, "percentage": 84.62, "elapsed_time": "0:15:07", "remaining_time": "0:02:44"}
|
| 67 |
{"current_steps": 67, "total_steps": 78, "loss": 0.7062, "lr": 5.9702234071631e-07, "epoch": 2.5443037974683547, "percentage": 85.9, "elapsed_time": "0:15:22", "remaining_time": "0:02:31"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 65 |
{"current_steps": 65, "total_steps": 78, "loss": 0.6397, "lr": 8.271337313934869e-07, "epoch": 2.4683544303797467, "percentage": 83.33, "elapsed_time": "0:14:53", "remaining_time": "0:02:58"}
|
| 66 |
{"current_steps": 66, "total_steps": 78, "loss": 0.7229, "lr": 7.077560319906696e-07, "epoch": 2.5063291139240507, "percentage": 84.62, "elapsed_time": "0:15:07", "remaining_time": "0:02:44"}
|
| 67 |
{"current_steps": 67, "total_steps": 78, "loss": 0.7062, "lr": 5.9702234071631e-07, "epoch": 2.5443037974683547, "percentage": 85.9, "elapsed_time": "0:15:22", "remaining_time": "0:02:31"}
|
| 68 |
+
{"current_steps": 68, "total_steps": 78, "loss": 0.747, "lr": 4.951556604879049e-07, "epoch": 2.5822784810126582, "percentage": 87.18, "elapsed_time": "0:15:33", "remaining_time": "0:02:17"}
|
| 69 |
+
{"current_steps": 69, "total_steps": 78, "loss": 0.6617, "lr": 4.0236113724274716e-07, "epoch": 2.620253164556962, "percentage": 88.46, "elapsed_time": "0:15:47", "remaining_time": "0:02:03"}
|
| 70 |
+
{"current_steps": 70, "total_steps": 78, "loss": 0.7664, "lr": 3.18825646801314e-07, "epoch": 2.6582278481012658, "percentage": 89.74, "elapsed_time": "0:16:00", "remaining_time": "0:01:49"}
|
| 71 |
+
{"current_steps": 71, "total_steps": 78, "loss": 0.7053, "lr": 2.447174185242324e-07, "epoch": 2.6962025316455698, "percentage": 91.03, "elapsed_time": "0:16:11", "remaining_time": "0:01:35"}
|
| 72 |
+
{"current_steps": 72, "total_steps": 78, "loss": 0.7124, "lr": 1.801856965207338e-07, "epoch": 2.7341772151898733, "percentage": 92.31, "elapsed_time": "0:16:22", "remaining_time": "0:01:21"}
|
| 73 |
+
{"current_steps": 73, "total_steps": 78, "loss": 0.7179, "lr": 1.253604390908819e-07, "epoch": 2.7721518987341773, "percentage": 93.59, "elapsed_time": "0:16:35", "remaining_time": "0:01:08"}
|
| 74 |
+
{"current_steps": 74, "total_steps": 78, "loss": 0.7522, "lr": 8.035205700685167e-08, "epoch": 2.810126582278481, "percentage": 94.87, "elapsed_time": "0:16:47", "remaining_time": "0:00:54"}
|
| 75 |
+
{"current_steps": 75, "total_steps": 78, "loss": 0.6989, "lr": 4.52511911603265e-08, "epoch": 2.848101265822785, "percentage": 96.15, "elapsed_time": "0:16:59", "remaining_time": "0:00:40"}
|
| 76 |
+
{"current_steps": 76, "total_steps": 78, "loss": 0.729, "lr": 2.012853002380466e-08, "epoch": 2.8860759493670884, "percentage": 97.44, "elapsed_time": "0:17:11", "remaining_time": "0:00:27"}
|
| 77 |
+
{"current_steps": 77, "total_steps": 78, "loss": 0.7252, "lr": 5.034667293427053e-09, "epoch": 2.9240506329113924, "percentage": 98.72, "elapsed_time": "0:17:22", "remaining_time": "0:00:13"}
|
| 78 |
+
{"current_steps": 78, "total_steps": 78, "loss": 0.7423, "lr": 0.0, "epoch": 2.962025316455696, "percentage": 100.0, "elapsed_time": "0:17:37", "remaining_time": "0:00:00"}
|
| 79 |
+
{"current_steps": 78, "total_steps": 78, "epoch": 2.962025316455696, "percentage": 100.0, "elapsed_time": "0:19:50", "remaining_time": "0:00:00"}
|