Training in progress, step 522
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4c5fac17614be21f328ad8de803fc4d54903c618cc086c62358f24d5aad18bfd
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9cd19cf74015656cfe27b6cef41b0754b8cb5ad2fc3fbf865ab9f4832be44f80
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:214da3d83436f605ed006feb29ba5d5e58edb17a79b9297a909e60e978676263
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ea45e5e235201bb8cb7065a6f5354f608a57f87123dd1b65a9f0be5b9152a82
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -502,3 +502,22 @@
|
|
| 502 |
{"current_steps": 502, "total_steps": 522, "loss": 0.4724, "lr": 4.4802722571561374e-08, "epoch": 2.8836764001914794, "percentage": 96.17, "elapsed_time": "7:06:11", "remaining_time": "0:16:58"}
|
| 503 |
{"current_steps": 503, "total_steps": 522, "loss": 0.4222, "lr": 4.044035565804793e-08, "epoch": 2.8894207754906653, "percentage": 96.36, "elapsed_time": "7:07:04", "remaining_time": "0:16:07"}
|
| 504 |
{"current_steps": 504, "total_steps": 522, "loss": 0.3833, "lr": 3.6300522323969855e-08, "epoch": 2.8951651507898517, "percentage": 96.55, "elapsed_time": "7:07:41", "remaining_time": "0:15:16"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 502 |
{"current_steps": 502, "total_steps": 522, "loss": 0.4724, "lr": 4.4802722571561374e-08, "epoch": 2.8836764001914794, "percentage": 96.17, "elapsed_time": "7:06:11", "remaining_time": "0:16:58"}
|
| 503 |
{"current_steps": 503, "total_steps": 522, "loss": 0.4222, "lr": 4.044035565804793e-08, "epoch": 2.8894207754906653, "percentage": 96.36, "elapsed_time": "7:07:04", "remaining_time": "0:16:07"}
|
| 504 |
{"current_steps": 504, "total_steps": 522, "loss": 0.3833, "lr": 3.6300522323969855e-08, "epoch": 2.8951651507898517, "percentage": 96.55, "elapsed_time": "7:07:41", "remaining_time": "0:15:16"}
|
| 505 |
+
{"current_steps": 505, "total_steps": 522, "loss": 0.4841, "lr": 3.2383408322095856e-08, "epoch": 2.9009095260890376, "percentage": 96.74, "elapsed_time": "7:08:42", "remaining_time": "0:14:25"}
|
| 506 |
+
{"current_steps": 506, "total_steps": 522, "loss": 0.4119, "lr": 2.8689189411859607e-08, "epoch": 2.906653901388224, "percentage": 96.93, "elapsed_time": "7:09:35", "remaining_time": "0:13:35"}
|
| 507 |
+
{"current_steps": 507, "total_steps": 522, "loss": 0.5207, "lr": 2.5218031351478268e-08, "epoch": 2.9123982766874104, "percentage": 97.13, "elapsed_time": "7:10:31", "remaining_time": "0:12:44"}
|
| 508 |
+
{"current_steps": 508, "total_steps": 522, "loss": 0.4163, "lr": 2.1970089890509527e-08, "epoch": 2.9181426519865967, "percentage": 97.32, "elapsed_time": "7:11:29", "remaining_time": "0:11:53"}
|
| 509 |
+
{"current_steps": 509, "total_steps": 522, "loss": 0.4461, "lr": 1.8945510762868325e-08, "epoch": 2.9238870272857826, "percentage": 97.51, "elapsed_time": "7:12:14", "remaining_time": "0:11:02"}
|
| 510 |
+
{"current_steps": 510, "total_steps": 522, "loss": 0.455, "lr": 1.614442968028429e-08, "epoch": 2.929631402584969, "percentage": 97.7, "elapsed_time": "7:13:05", "remaining_time": "0:10:11"}
|
| 511 |
+
{"current_steps": 511, "total_steps": 522, "loss": 0.4412, "lr": 1.3566972326214956e-08, "epoch": 2.935375777884155, "percentage": 97.89, "elapsed_time": "7:14:03", "remaining_time": "0:09:20"}
|
| 512 |
+
{"current_steps": 512, "total_steps": 522, "loss": 0.4247, "lr": 1.1213254350202486e-08, "epoch": 2.9411201531833413, "percentage": 98.08, "elapsed_time": "7:14:49", "remaining_time": "0:08:29"}
|
| 513 |
+
{"current_steps": 513, "total_steps": 522, "loss": 0.4326, "lr": 9.083381362690603e-09, "epoch": 2.9468645284825277, "percentage": 98.28, "elapsed_time": "7:15:45", "remaining_time": "0:07:38"}
|
| 514 |
+
{"current_steps": 514, "total_steps": 522, "loss": 0.4514, "lr": 7.177448930279496e-09, "epoch": 2.9526089037817136, "percentage": 98.47, "elapsed_time": "7:16:30", "remaining_time": "0:06:47"}
|
| 515 |
+
{"current_steps": 515, "total_steps": 522, "loss": 0.4163, "lr": 5.495542571443135e-09, "epoch": 2.9583532790809, "percentage": 98.66, "elapsed_time": "7:17:21", "remaining_time": "0:05:56"}
|
| 516 |
+
{"current_steps": 516, "total_steps": 522, "loss": 0.441, "lr": 4.037737752686788e-09, "epoch": 2.9640976543800863, "percentage": 98.85, "elapsed_time": "7:18:01", "remaining_time": "0:05:05"}
|
| 517 |
+
{"current_steps": 517, "total_steps": 522, "loss": 0.4451, "lr": 2.8040998851674996e-09, "epoch": 2.9698420296792722, "percentage": 99.04, "elapsed_time": "7:18:53", "remaining_time": "0:04:14"}
|
| 518 |
+
{"current_steps": 518, "total_steps": 522, "loss": 0.4208, "lr": 1.7946843217514498e-09, "epoch": 2.9755864049784586, "percentage": 99.23, "elapsed_time": "7:19:44", "remaining_time": "0:03:23"}
|
| 519 |
+
{"current_steps": 519, "total_steps": 522, "loss": 0.393, "lr": 1.009536354537044e-09, "epoch": 2.981330780277645, "percentage": 99.43, "elapsed_time": "7:20:30", "remaining_time": "0:02:32"}
|
| 520 |
+
{"current_steps": 520, "total_steps": 522, "loss": 0.5064, "lr": 4.486912128182086e-10, "epoch": 2.987075155576831, "percentage": 99.62, "elapsed_time": "7:21:24", "remaining_time": "0:01:41"}
|
| 521 |
+
{"current_steps": 521, "total_steps": 522, "loss": 0.4423, "lr": 1.1217406150676457e-10, "epoch": 2.9928195308760173, "percentage": 99.81, "elapsed_time": "7:22:12", "remaining_time": "0:00:50"}
|
| 522 |
+
{"current_steps": 522, "total_steps": 522, "loss": 0.4217, "lr": 0.0, "epoch": 2.998563906175203, "percentage": 100.0, "elapsed_time": "7:22:58", "remaining_time": "0:00:00"}
|
| 523 |
+
{"current_steps": 522, "total_steps": 522, "epoch": 2.998563906175203, "percentage": 100.0, "elapsed_time": "7:24:05", "remaining_time": "0:00:00"}
|