Training in progress, step 400
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4902257696
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1df44194b32f263dfba9be329058741d708b94cbc88cb1cc7374fe58909d7781
|
| 3 |
size 4902257696
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915960368
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4635e0d935a82a93b0fe29e2245045b9f217cf10c0525770fe9288ef6277b587
|
| 3 |
size 4915960368
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4983068496
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2a471a7dd491963f9a6995dfed0a64b573e7c83e307c354435a8b2bf02896362
|
| 3 |
size 4983068496
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1580230264
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc2746917e9269045dbae911a97213dca3a1fa65366972b4eac2c390bdfc2e31
|
| 3 |
size 1580230264
|
trainer_log.jsonl
CHANGED
|
@@ -51,3 +51,30 @@
|
|
| 51 |
{"current_steps": 255, "total_steps": 9128, "loss": 0.2757, "lr": 1.1128148959474261e-05, "epoch": 0.1956271576524741, "percentage": 2.79, "elapsed_time": "2:26:03", "remaining_time": "3 days, 12:42:25"}
|
| 52 |
{"current_steps": 260, "total_steps": 9128, "loss": 0.2808, "lr": 1.1347207009857613e-05, "epoch": 0.19946298427311085, "percentage": 2.85, "elapsed_time": "2:28:56", "remaining_time": "3 days, 12:40:07"}
|
| 53 |
{"current_steps": 265, "total_steps": 9128, "loss": 0.2751, "lr": 1.1566265060240964e-05, "epoch": 0.2032988108937476, "percentage": 2.9, "elapsed_time": "2:31:37", "remaining_time": "3 days, 12:31:18"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 51 |
{"current_steps": 255, "total_steps": 9128, "loss": 0.2757, "lr": 1.1128148959474261e-05, "epoch": 0.1956271576524741, "percentage": 2.79, "elapsed_time": "2:26:03", "remaining_time": "3 days, 12:42:25"}
|
| 52 |
{"current_steps": 260, "total_steps": 9128, "loss": 0.2808, "lr": 1.1347207009857613e-05, "epoch": 0.19946298427311085, "percentage": 2.85, "elapsed_time": "2:28:56", "remaining_time": "3 days, 12:40:07"}
|
| 53 |
{"current_steps": 265, "total_steps": 9128, "loss": 0.2751, "lr": 1.1566265060240964e-05, "epoch": 0.2032988108937476, "percentage": 2.9, "elapsed_time": "2:31:37", "remaining_time": "3 days, 12:31:18"}
|
| 54 |
+
{"current_steps": 270, "total_steps": 9128, "loss": 0.2608, "lr": 1.1785323110624316e-05, "epoch": 0.20713463751438435, "percentage": 2.96, "elapsed_time": "2:34:31", "remaining_time": "3 days, 12:29:30"}
|
| 55 |
+
{"current_steps": 275, "total_steps": 9128, "loss": 0.2757, "lr": 1.2004381161007668e-05, "epoch": 0.2109704641350211, "percentage": 3.01, "elapsed_time": "2:37:27", "remaining_time": "3 days, 12:28:58"}
|
| 56 |
+
{"current_steps": 280, "total_steps": 9128, "loss": 0.3343, "lr": 1.222343921139102e-05, "epoch": 0.21480629075565785, "percentage": 3.07, "elapsed_time": "2:39:41", "remaining_time": "3 days, 12:06:05"}
|
| 57 |
+
{"current_steps": 285, "total_steps": 9128, "loss": 0.4158, "lr": 1.2442497261774372e-05, "epoch": 0.2186421173762946, "percentage": 3.12, "elapsed_time": "2:40:56", "remaining_time": "3 days, 11:13:35"}
|
| 58 |
+
{"current_steps": 290, "total_steps": 9128, "loss": 0.3653, "lr": 1.2661555312157722e-05, "epoch": 0.22247794399693133, "percentage": 3.18, "elapsed_time": "2:42:11", "remaining_time": "3 days, 10:23:07"}
|
| 59 |
+
{"current_steps": 295, "total_steps": 9128, "loss": 0.3475, "lr": 1.2880613362541074e-05, "epoch": 0.22631377061756808, "percentage": 3.23, "elapsed_time": "2:43:26", "remaining_time": "3 days, 9:33:55"}
|
| 60 |
+
{"current_steps": 300, "total_steps": 9128, "loss": 0.337, "lr": 1.3099671412924427e-05, "epoch": 0.23014959723820483, "percentage": 3.29, "elapsed_time": "2:44:45", "remaining_time": "3 days, 8:48:14"}
|
| 61 |
+
{"current_steps": 305, "total_steps": 9128, "loss": 0.3226, "lr": 1.3318729463307779e-05, "epoch": 0.23398542385884158, "percentage": 3.34, "elapsed_time": "2:46:01", "remaining_time": "3 days, 8:02:34"}
|
| 62 |
+
{"current_steps": 310, "total_steps": 9128, "loss": 0.3273, "lr": 1.3537787513691129e-05, "epoch": 0.23782125047947833, "percentage": 3.4, "elapsed_time": "2:47:17", "remaining_time": "3 days, 7:18:27"}
|
| 63 |
+
{"current_steps": 315, "total_steps": 9128, "loss": 0.2963, "lr": 1.3756845564074481e-05, "epoch": 0.24165707710011508, "percentage": 3.45, "elapsed_time": "2:48:32", "remaining_time": "3 days, 6:35:16"}
|
| 64 |
+
{"current_steps": 320, "total_steps": 9128, "loss": 0.3139, "lr": 1.3975903614457833e-05, "epoch": 0.24549290372075183, "percentage": 3.51, "elapsed_time": "2:49:46", "remaining_time": "3 days, 5:53:03"}
|
| 65 |
+
{"current_steps": 325, "total_steps": 9128, "loss": 0.2929, "lr": 1.4194961664841185e-05, "epoch": 0.24932873034138858, "percentage": 3.56, "elapsed_time": "2:51:00", "remaining_time": "3 days, 5:12:02"}
|
| 66 |
+
{"current_steps": 330, "total_steps": 9128, "loss": 0.2917, "lr": 1.4414019715224536e-05, "epoch": 0.25316455696202533, "percentage": 3.62, "elapsed_time": "2:52:17", "remaining_time": "3 days, 4:33:25"}
|
| 67 |
+
{"current_steps": 335, "total_steps": 9128, "loss": 0.3017, "lr": 1.4633077765607888e-05, "epoch": 0.2570003835826621, "percentage": 3.67, "elapsed_time": "2:53:34", "remaining_time": "3 days, 3:55:51"}
|
| 68 |
+
{"current_steps": 340, "total_steps": 9128, "loss": 0.2892, "lr": 1.485213581599124e-05, "epoch": 0.26083621020329883, "percentage": 3.72, "elapsed_time": "2:54:49", "remaining_time": "3 days, 3:18:55"}
|
| 69 |
+
{"current_steps": 345, "total_steps": 9128, "loss": 0.2705, "lr": 1.5071193866374592e-05, "epoch": 0.2646720368239356, "percentage": 3.78, "elapsed_time": "2:56:03", "remaining_time": "3 days, 2:42:09"}
|
| 70 |
+
{"current_steps": 350, "total_steps": 9128, "loss": 0.2785, "lr": 1.5290251916757942e-05, "epoch": 0.2685078634445723, "percentage": 3.83, "elapsed_time": "2:57:17", "remaining_time": "3 days, 2:06:38"}
|
| 71 |
+
{"current_steps": 355, "total_steps": 9128, "loss": 0.2818, "lr": 1.5509309967141293e-05, "epoch": 0.27234369006520903, "percentage": 3.89, "elapsed_time": "2:58:35", "remaining_time": "3 days, 1:33:25"}
|
| 72 |
+
{"current_steps": 360, "total_steps": 9128, "loss": 0.279, "lr": 1.5728368017524643e-05, "epoch": 0.2761795166858458, "percentage": 3.94, "elapsed_time": "2:59:50", "remaining_time": "3 days, 1:00:10"}
|
| 73 |
+
{"current_steps": 365, "total_steps": 9128, "loss": 0.2851, "lr": 1.5947426067907997e-05, "epoch": 0.28001534330648253, "percentage": 4.0, "elapsed_time": "3:01:09", "remaining_time": "3 days, 0:29:19"}
|
| 74 |
+
{"current_steps": 370, "total_steps": 9128, "loss": 0.2818, "lr": 1.6166484118291347e-05, "epoch": 0.2838511699271193, "percentage": 4.05, "elapsed_time": "3:02:23", "remaining_time": "2 days, 23:57:10"}
|
| 75 |
+
{"current_steps": 375, "total_steps": 9128, "loss": 0.2841, "lr": 1.63855421686747e-05, "epoch": 0.28768699654775604, "percentage": 4.11, "elapsed_time": "3:03:40", "remaining_time": "2 days, 23:27:22"}
|
| 76 |
+
{"current_steps": 380, "total_steps": 9128, "loss": 0.2694, "lr": 1.660460021905805e-05, "epoch": 0.2915228231683928, "percentage": 4.16, "elapsed_time": "3:04:58", "remaining_time": "2 days, 22:58:26"}
|
| 77 |
+
{"current_steps": 385, "total_steps": 9128, "loss": 0.2791, "lr": 1.6823658269441402e-05, "epoch": 0.29535864978902954, "percentage": 4.22, "elapsed_time": "3:06:20", "remaining_time": "2 days, 22:31:41"}
|
| 78 |
+
{"current_steps": 390, "total_steps": 9128, "loss": 0.2846, "lr": 1.7042716319824756e-05, "epoch": 0.2991944764096663, "percentage": 4.27, "elapsed_time": "3:07:35", "remaining_time": "2 days, 22:02:57"}
|
| 79 |
+
{"current_steps": 395, "total_steps": 9128, "loss": 0.2566, "lr": 1.7261774370208106e-05, "epoch": 0.30303030303030304, "percentage": 4.33, "elapsed_time": "3:08:49", "remaining_time": "2 days, 21:34:38"}
|
| 80 |
+
{"current_steps": 400, "total_steps": 9128, "loss": 0.2695, "lr": 1.7480832420591457e-05, "epoch": 0.3068661296509398, "percentage": 4.38, "elapsed_time": "3:10:04", "remaining_time": "2 days, 21:07:21"}
|