Training in progress, step 2148
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6918c5d2e8247eca0a4c81d753e689637ef8b29991a598bda9ee7be161dadc2
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d8b77c03381f488bcbd2c327c5336f9d4ba44b8c8050964f1279cc531a4508dd
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:20cd87ede661105d5b08ae2c36f132944c7e581567201c132884859b8bcb843b
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:15b47a1b1906ee1c0353cee6be06237ed466bcf021c879862b8049e52231438a
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -2044,3 +2044,106 @@
|
|
| 2044 |
{"current_steps": 2044, "total_steps": 2148, "loss": 0.2272, "lr": 7.262739110200923e-08, "epoch": 2.8537549407114624, "percentage": 95.16, "elapsed_time": "4:45:21", "remaining_time": "0:14:31"}
|
| 2045 |
{"current_steps": 2045, "total_steps": 2148, "loss": 0.2544, "lr": 7.125387924872552e-08, "epoch": 2.8551499651243897, "percentage": 95.2, "elapsed_time": "4:45:31", "remaining_time": "0:14:22"}
|
| 2046 |
{"current_steps": 2046, "total_steps": 2148, "loss": 0.2132, "lr": 6.98933862384521e-08, "epoch": 2.856544989537317, "percentage": 95.25, "elapsed_time": "4:45:38", "remaining_time": "0:14:14"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2044 |
{"current_steps": 2044, "total_steps": 2148, "loss": 0.2272, "lr": 7.262739110200923e-08, "epoch": 2.8537549407114624, "percentage": 95.16, "elapsed_time": "4:45:21", "remaining_time": "0:14:31"}
|
| 2045 |
{"current_steps": 2045, "total_steps": 2148, "loss": 0.2544, "lr": 7.125387924872552e-08, "epoch": 2.8551499651243897, "percentage": 95.2, "elapsed_time": "4:45:31", "remaining_time": "0:14:22"}
|
| 2046 |
{"current_steps": 2046, "total_steps": 2148, "loss": 0.2132, "lr": 6.98933862384521e-08, "epoch": 2.856544989537317, "percentage": 95.25, "elapsed_time": "4:45:38", "remaining_time": "0:14:14"}
|
| 2047 |
+
{"current_steps": 2047, "total_steps": 2148, "loss": 0.1864, "lr": 6.854591566480884e-08, "epoch": 2.857940013950244, "percentage": 95.3, "elapsed_time": "4:45:47", "remaining_time": "0:14:06"}
|
| 2048 |
+
{"current_steps": 2048, "total_steps": 2148, "loss": 0.2338, "lr": 6.721147108701864e-08, "epoch": 2.8593350383631715, "percentage": 95.34, "elapsed_time": "4:45:54", "remaining_time": "0:13:57"}
|
| 2049 |
+
{"current_steps": 2049, "total_steps": 2148, "loss": 0.2299, "lr": 6.589005602989862e-08, "epoch": 2.8607300627760983, "percentage": 95.39, "elapsed_time": "4:46:02", "remaining_time": "0:13:49"}
|
| 2050 |
+
{"current_steps": 2050, "total_steps": 2148, "loss": 0.2375, "lr": 6.458167398384896e-08, "epoch": 2.8621250871890256, "percentage": 95.44, "elapsed_time": "4:46:09", "remaining_time": "0:13:40"}
|
| 2051 |
+
{"current_steps": 2051, "total_steps": 2148, "loss": 0.1987, "lr": 6.328632840484294e-08, "epoch": 2.863520111601953, "percentage": 95.48, "elapsed_time": "4:46:16", "remaining_time": "0:13:32"}
|
| 2052 |
+
{"current_steps": 2052, "total_steps": 2148, "loss": 0.2252, "lr": 6.200402271442085e-08, "epoch": 2.86491513601488, "percentage": 95.53, "elapsed_time": "4:46:23", "remaining_time": "0:13:23"}
|
| 2053 |
+
{"current_steps": 2053, "total_steps": 2148, "loss": 0.2308, "lr": 6.073476029967884e-08, "epoch": 2.8663101604278074, "percentage": 95.58, "elapsed_time": "4:46:31", "remaining_time": "0:13:15"}
|
| 2054 |
+
{"current_steps": 2054, "total_steps": 2148, "loss": 0.2437, "lr": 5.947854451326007e-08, "epoch": 2.8677051848407347, "percentage": 95.62, "elapsed_time": "4:46:39", "remaining_time": "0:13:07"}
|
| 2055 |
+
{"current_steps": 2055, "total_steps": 2148, "loss": 0.2112, "lr": 5.823537867334694e-08, "epoch": 2.869100209253662, "percentage": 95.67, "elapsed_time": "4:46:47", "remaining_time": "0:12:58"}
|
| 2056 |
+
{"current_steps": 2056, "total_steps": 2148, "loss": 0.2251, "lr": 5.7005266063650534e-08, "epoch": 2.870495233666589, "percentage": 95.72, "elapsed_time": "4:46:53", "remaining_time": "0:12:50"}
|
| 2057 |
+
{"current_steps": 2057, "total_steps": 2148, "loss": 0.2792, "lr": 5.5788209933403944e-08, "epoch": 2.8718902580795165, "percentage": 95.76, "elapsed_time": "4:47:00", "remaining_time": "0:12:41"}
|
| 2058 |
+
{"current_steps": 2058, "total_steps": 2148, "loss": 0.2251, "lr": 5.4584213497351766e-08, "epoch": 2.8732852824924437, "percentage": 95.81, "elapsed_time": "4:47:07", "remaining_time": "0:12:33"}
|
| 2059 |
+
{"current_steps": 2059, "total_steps": 2148, "loss": 0.2103, "lr": 5.339327993574339e-08, "epoch": 2.874680306905371, "percentage": 95.86, "elapsed_time": "4:47:14", "remaining_time": "0:12:24"}
|
| 2060 |
+
{"current_steps": 2060, "total_steps": 2148, "loss": 0.1968, "lr": 5.221541239432415e-08, "epoch": 2.8760753313182983, "percentage": 95.9, "elapsed_time": "4:47:23", "remaining_time": "0:12:16"}
|
| 2061 |
+
{"current_steps": 2061, "total_steps": 2148, "loss": 0.2034, "lr": 5.1050613984324756e-08, "epoch": 2.8774703557312256, "percentage": 95.95, "elapsed_time": "4:47:33", "remaining_time": "0:12:08"}
|
| 2062 |
+
{"current_steps": 2062, "total_steps": 2148, "loss": 0.2559, "lr": 4.989888778245744e-08, "epoch": 2.8788653801441524, "percentage": 96.0, "elapsed_time": "4:47:42", "remaining_time": "0:11:59"}
|
| 2063 |
+
{"current_steps": 2063, "total_steps": 2148, "loss": 0.2391, "lr": 4.8760236830903697e-08, "epoch": 2.8802604045570797, "percentage": 96.04, "elapsed_time": "4:47:52", "remaining_time": "0:11:51"}
|
| 2064 |
+
{"current_steps": 2064, "total_steps": 2148, "loss": 0.2426, "lr": 4.763466413730822e-08, "epoch": 2.881655428970007, "percentage": 96.09, "elapsed_time": "4:47:59", "remaining_time": "0:11:43"}
|
| 2065 |
+
{"current_steps": 2065, "total_steps": 2148, "loss": 0.237, "lr": 4.65221726747711e-08, "epoch": 2.883050453382934, "percentage": 96.14, "elapsed_time": "4:48:09", "remaining_time": "0:11:34"}
|
| 2066 |
+
{"current_steps": 2066, "total_steps": 2148, "loss": 0.2231, "lr": 4.542276538183954e-08, "epoch": 2.8844454777958615, "percentage": 96.18, "elapsed_time": "4:48:24", "remaining_time": "0:11:26"}
|
| 2067 |
+
{"current_steps": 2067, "total_steps": 2148, "loss": 0.2465, "lr": 4.433644516249891e-08, "epoch": 2.8858405022087887, "percentage": 96.23, "elapsed_time": "4:48:31", "remaining_time": "0:11:18"}
|
| 2068 |
+
{"current_steps": 2068, "total_steps": 2148, "loss": 0.251, "lr": 4.326321488616836e-08, "epoch": 2.887235526621716, "percentage": 96.28, "elapsed_time": "4:48:50", "remaining_time": "0:11:10"}
|
| 2069 |
+
{"current_steps": 2069, "total_steps": 2148, "loss": 0.2239, "lr": 4.220307738768859e-08, "epoch": 2.888630551034643, "percentage": 96.32, "elapsed_time": "4:48:56", "remaining_time": "0:11:01"}
|
| 2070 |
+
{"current_steps": 2070, "total_steps": 2148, "loss": 0.2451, "lr": 4.11560354673185e-08, "epoch": 2.89002557544757, "percentage": 96.37, "elapsed_time": "4:49:04", "remaining_time": "0:10:53"}
|
| 2071 |
+
{"current_steps": 2071, "total_steps": 2148, "loss": 0.2296, "lr": 4.0122091890726354e-08, "epoch": 2.8914205998604974, "percentage": 96.42, "elapsed_time": "4:49:11", "remaining_time": "0:10:45"}
|
| 2072 |
+
{"current_steps": 2072, "total_steps": 2148, "loss": 0.2019, "lr": 3.9101249388981965e-08, "epoch": 2.8928156242734246, "percentage": 96.46, "elapsed_time": "4:49:24", "remaining_time": "0:10:36"}
|
| 2073 |
+
{"current_steps": 2073, "total_steps": 2148, "loss": 0.2576, "lr": 3.809351065854894e-08, "epoch": 2.894210648686352, "percentage": 96.51, "elapsed_time": "4:49:34", "remaining_time": "0:10:28"}
|
| 2074 |
+
{"current_steps": 2074, "total_steps": 2148, "loss": 0.2611, "lr": 3.709887836128023e-08, "epoch": 2.895605673099279, "percentage": 96.55, "elapsed_time": "4:49:44", "remaining_time": "0:10:20"}
|
| 2075 |
+
{"current_steps": 2075, "total_steps": 2148, "loss": 0.251, "lr": 3.611735512440706e-08, "epoch": 2.8970006975122065, "percentage": 96.6, "elapsed_time": "4:49:50", "remaining_time": "0:10:11"}
|
| 2076 |
+
{"current_steps": 2076, "total_steps": 2148, "loss": 0.2257, "lr": 3.5148943540536105e-08, "epoch": 2.8983957219251337, "percentage": 96.65, "elapsed_time": "4:49:59", "remaining_time": "0:10:03"}
|
| 2077 |
+
{"current_steps": 2077, "total_steps": 2148, "loss": 0.253, "lr": 3.4193646167640646e-08, "epoch": 2.899790746338061, "percentage": 96.69, "elapsed_time": "4:50:07", "remaining_time": "0:09:55"}
|
| 2078 |
+
{"current_steps": 2078, "total_steps": 2148, "loss": 0.2262, "lr": 3.325146552905223e-08, "epoch": 2.9011857707509883, "percentage": 96.74, "elapsed_time": "4:50:15", "remaining_time": "0:09:46"}
|
| 2079 |
+
{"current_steps": 2079, "total_steps": 2148, "loss": 0.2547, "lr": 3.2322404113457886e-08, "epoch": 2.9025807951639155, "percentage": 96.79, "elapsed_time": "4:50:24", "remaining_time": "0:09:38"}
|
| 2080 |
+
{"current_steps": 2080, "total_steps": 2148, "loss": 0.2294, "lr": 3.1406464374890144e-08, "epoch": 2.903975819576843, "percentage": 96.83, "elapsed_time": "4:50:31", "remaining_time": "0:09:29"}
|
| 2081 |
+
{"current_steps": 2081, "total_steps": 2148, "loss": 0.25, "lr": 3.0503648732722046e-08, "epoch": 2.90537084398977, "percentage": 96.88, "elapsed_time": "4:50:41", "remaining_time": "0:09:21"}
|
| 2082 |
+
{"current_steps": 2082, "total_steps": 2148, "loss": 0.2189, "lr": 2.9613959571660468e-08, "epoch": 2.906765868402697, "percentage": 96.93, "elapsed_time": "4:50:48", "remaining_time": "0:09:13"}
|
| 2083 |
+
{"current_steps": 2083, "total_steps": 2148, "loss": 0.2187, "lr": 2.8737399241740016e-08, "epoch": 2.908160892815624, "percentage": 96.97, "elapsed_time": "4:50:55", "remaining_time": "0:09:04"}
|
| 2084 |
+
{"current_steps": 2084, "total_steps": 2148, "loss": 0.224, "lr": 2.7873970058316934e-08, "epoch": 2.9095559172285514, "percentage": 97.02, "elapsed_time": "4:51:05", "remaining_time": "0:08:56"}
|
| 2085 |
+
{"current_steps": 2085, "total_steps": 2148, "loss": 0.225, "lr": 2.7023674302061875e-08, "epoch": 2.9109509416414787, "percentage": 97.07, "elapsed_time": "4:51:11", "remaining_time": "0:08:47"}
|
| 2086 |
+
{"current_steps": 2086, "total_steps": 2148, "loss": 0.2088, "lr": 2.6186514218954905e-08, "epoch": 2.912345966054406, "percentage": 97.11, "elapsed_time": "4:51:18", "remaining_time": "0:08:39"}
|
| 2087 |
+
{"current_steps": 2087, "total_steps": 2148, "loss": 0.216, "lr": 2.5362492020280517e-08, "epoch": 2.9137409904673333, "percentage": 97.16, "elapsed_time": "4:51:31", "remaining_time": "0:08:31"}
|
| 2088 |
+
{"current_steps": 2088, "total_steps": 2148, "loss": 0.2513, "lr": 2.4551609882619288e-08, "epoch": 2.9151360148802605, "percentage": 97.21, "elapsed_time": "4:51:40", "remaining_time": "0:08:22"}
|
| 2089 |
+
{"current_steps": 2089, "total_steps": 2148, "loss": 0.2172, "lr": 2.3753869947843457e-08, "epoch": 2.9165310392931874, "percentage": 97.25, "elapsed_time": "4:51:47", "remaining_time": "0:08:14"}
|
| 2090 |
+
{"current_steps": 2090, "total_steps": 2148, "loss": 0.2448, "lr": 2.296927432311358e-08, "epoch": 2.9179260637061146, "percentage": 97.3, "elapsed_time": "4:51:54", "remaining_time": "0:08:06"}
|
| 2091 |
+
{"current_steps": 2091, "total_steps": 2148, "loss": 0.2196, "lr": 2.2197825080867432e-08, "epoch": 2.919321088119042, "percentage": 97.35, "elapsed_time": "4:52:05", "remaining_time": "0:07:57"}
|
| 2092 |
+
{"current_steps": 2092, "total_steps": 2148, "loss": 0.2498, "lr": 2.1439524258819456e-08, "epoch": 2.920716112531969, "percentage": 97.39, "elapsed_time": "4:52:15", "remaining_time": "0:07:49"}
|
| 2093 |
+
{"current_steps": 2093, "total_steps": 2148, "loss": 0.22, "lr": 2.0694373859954653e-08, "epoch": 2.9221111369448964, "percentage": 97.44, "elapsed_time": "4:52:22", "remaining_time": "0:07:40"}
|
| 2094 |
+
{"current_steps": 2094, "total_steps": 2148, "loss": 0.237, "lr": 1.99623758525197e-08, "epoch": 2.9235061613578237, "percentage": 97.49, "elapsed_time": "4:52:29", "remaining_time": "0:07:32"}
|
| 2095 |
+
{"current_steps": 2095, "total_steps": 2148, "loss": 0.2211, "lr": 1.9243532170023504e-08, "epoch": 2.924901185770751, "percentage": 97.53, "elapsed_time": "4:52:38", "remaining_time": "0:07:24"}
|
| 2096 |
+
{"current_steps": 2096, "total_steps": 2148, "loss": 0.2026, "lr": 1.8537844711227215e-08, "epoch": 2.9262962101836782, "percentage": 97.58, "elapsed_time": "4:52:46", "remaining_time": "0:07:15"}
|
| 2097 |
+
{"current_steps": 2097, "total_steps": 2148, "loss": 0.2107, "lr": 1.7845315340140334e-08, "epoch": 2.9276912345966055, "percentage": 97.63, "elapsed_time": "4:52:57", "remaining_time": "0:07:07"}
|
| 2098 |
+
{"current_steps": 2098, "total_steps": 2148, "loss": 0.1909, "lr": 1.7165945886018498e-08, "epoch": 2.929086259009533, "percentage": 97.67, "elapsed_time": "4:53:06", "remaining_time": "0:06:59"}
|
| 2099 |
+
{"current_steps": 2099, "total_steps": 2148, "loss": 0.2141, "lr": 1.6499738143354594e-08, "epoch": 2.93048128342246, "percentage": 97.72, "elapsed_time": "4:53:14", "remaining_time": "0:06:50"}
|
| 2100 |
+
{"current_steps": 2100, "total_steps": 2148, "loss": 0.2288, "lr": 1.584669387187765e-08, "epoch": 2.9318763078353873, "percentage": 97.77, "elapsed_time": "4:53:29", "remaining_time": "0:06:42"}
|
| 2101 |
+
{"current_steps": 2101, "total_steps": 2148, "loss": 0.2178, "lr": 1.520681479654562e-08, "epoch": 2.9332713322483146, "percentage": 97.81, "elapsed_time": "4:53:38", "remaining_time": "0:06:34"}
|
| 2102 |
+
{"current_steps": 2102, "total_steps": 2148, "loss": 0.2275, "lr": 1.4580102607541502e-08, "epoch": 2.9346663566612414, "percentage": 97.86, "elapsed_time": "4:53:45", "remaining_time": "0:06:25"}
|
| 2103 |
+
{"current_steps": 2103, "total_steps": 2148, "loss": 0.2084, "lr": 1.3966558960269994e-08, "epoch": 2.9360613810741687, "percentage": 97.91, "elapsed_time": "4:53:52", "remaining_time": "0:06:17"}
|
| 2104 |
+
{"current_steps": 2104, "total_steps": 2148, "loss": 0.2093, "lr": 1.3366185475351957e-08, "epoch": 2.937456405487096, "percentage": 97.95, "elapsed_time": "4:53:59", "remaining_time": "0:06:08"}
|
| 2105 |
+
{"current_steps": 2105, "total_steps": 2148, "loss": 0.2305, "lr": 1.2778983738620521e-08, "epoch": 2.9388514299000232, "percentage": 98.0, "elapsed_time": "4:54:08", "remaining_time": "0:06:00"}
|
| 2106 |
+
{"current_steps": 2106, "total_steps": 2148, "loss": 0.2105, "lr": 1.2204955301116095e-08, "epoch": 2.9402464543129505, "percentage": 98.04, "elapsed_time": "4:54:15", "remaining_time": "0:05:52"}
|
| 2107 |
+
{"current_steps": 2107, "total_steps": 2148, "loss": 0.2199, "lr": 1.164410167908414e-08, "epoch": 2.941641478725878, "percentage": 98.09, "elapsed_time": "4:54:23", "remaining_time": "0:05:43"}
|
| 2108 |
+
{"current_steps": 2108, "total_steps": 2148, "loss": 0.2152, "lr": 1.109642435396907e-08, "epoch": 2.943036503138805, "percentage": 98.14, "elapsed_time": "4:54:33", "remaining_time": "0:05:35"}
|
| 2109 |
+
{"current_steps": 2109, "total_steps": 2148, "loss": 0.2228, "lr": 1.0561924772412024e-08, "epoch": 2.9444315275517323, "percentage": 98.18, "elapsed_time": "4:54:40", "remaining_time": "0:05:26"}
|
| 2110 |
+
{"current_steps": 2110, "total_steps": 2148, "loss": 0.27, "lr": 1.0040604346245319e-08, "epoch": 2.945826551964659, "percentage": 98.23, "elapsed_time": "4:54:47", "remaining_time": "0:05:18"}
|
| 2111 |
+
{"current_steps": 2111, "total_steps": 2148, "loss": 0.2221, "lr": 9.532464452491341e-09, "epoch": 2.9472215763775864, "percentage": 98.28, "elapsed_time": "4:54:54", "remaining_time": "0:05:10"}
|
| 2112 |
+
{"current_steps": 2112, "total_steps": 2148, "loss": 0.228, "lr": 9.037506433355325e-09, "epoch": 2.9486166007905137, "percentage": 98.32, "elapsed_time": "4:55:02", "remaining_time": "0:05:01"}
|
| 2113 |
+
{"current_steps": 2113, "total_steps": 2148, "loss": 0.2096, "lr": 8.555731596224803e-09, "epoch": 2.950011625203441, "percentage": 98.37, "elapsed_time": "4:55:11", "remaining_time": "0:04:53"}
|
| 2114 |
+
{"current_steps": 2114, "total_steps": 2148, "loss": 0.2394, "lr": 8.087141213665717e-09, "epoch": 2.9514066496163682, "percentage": 98.42, "elapsed_time": "4:55:19", "remaining_time": "0:04:44"}
|
| 2115 |
+
{"current_steps": 2115, "total_steps": 2148, "loss": 0.2302, "lr": 7.631736523416867e-09, "epoch": 2.9528016740292955, "percentage": 98.46, "elapsed_time": "4:55:26", "remaining_time": "0:04:36"}
|
| 2116 |
+
{"current_steps": 2116, "total_steps": 2148, "loss": 0.1825, "lr": 7.1895187283899104e-09, "epoch": 2.9541966984422228, "percentage": 98.51, "elapsed_time": "4:55:37", "remaining_time": "0:04:28"}
|
| 2117 |
+
{"current_steps": 2117, "total_steps": 2148, "loss": 0.2352, "lr": 6.760488996662706e-09, "epoch": 2.95559172285515, "percentage": 98.56, "elapsed_time": "4:55:47", "remaining_time": "0:04:19"}
|
| 2118 |
+
{"current_steps": 2118, "total_steps": 2148, "loss": 0.1935, "lr": 6.3446484614798635e-09, "epoch": 2.9569867472680773, "percentage": 98.6, "elapsed_time": "4:55:56", "remaining_time": "0:04:11"}
|
| 2119 |
+
{"current_steps": 2119, "total_steps": 2148, "loss": 0.236, "lr": 5.941998221247192e-09, "epoch": 2.9583817716810046, "percentage": 98.65, "elapsed_time": "4:56:03", "remaining_time": "0:04:03"}
|
| 2120 |
+
{"current_steps": 2120, "total_steps": 2148, "loss": 0.2755, "lr": 5.552539339528373e-09, "epoch": 2.959776796093932, "percentage": 98.7, "elapsed_time": "4:56:12", "remaining_time": "0:03:54"}
|
| 2121 |
+
{"current_steps": 2121, "total_steps": 2148, "loss": 0.2264, "lr": 5.176272845045516e-09, "epoch": 2.961171820506859, "percentage": 98.74, "elapsed_time": "4:56:21", "remaining_time": "0:03:46"}
|
| 2122 |
+
{"current_steps": 2122, "total_steps": 2148, "loss": 0.2042, "lr": 4.813199731671381e-09, "epoch": 2.962566844919786, "percentage": 98.79, "elapsed_time": "4:56:29", "remaining_time": "0:03:37"}
|
| 2123 |
+
{"current_steps": 2123, "total_steps": 2148, "loss": 0.1929, "lr": 4.463320958432716e-09, "epoch": 2.963961869332713, "percentage": 98.84, "elapsed_time": "4:56:35", "remaining_time": "0:03:29"}
|
| 2124 |
+
{"current_steps": 2124, "total_steps": 2148, "loss": 0.2185, "lr": 4.1266374495024795e-09, "epoch": 2.9653568937456405, "percentage": 98.88, "elapsed_time": "4:56:42", "remaining_time": "0:03:21"}
|
| 2125 |
+
{"current_steps": 2125, "total_steps": 2148, "loss": 0.2181, "lr": 3.803150094200403e-09, "epoch": 2.9667519181585678, "percentage": 98.93, "elapsed_time": "4:56:48", "remaining_time": "0:03:12"}
|
| 2126 |
+
{"current_steps": 2126, "total_steps": 2148, "loss": 0.2124, "lr": 3.4928597469885416e-09, "epoch": 2.968146942571495, "percentage": 98.98, "elapsed_time": "4:56:58", "remaining_time": "0:03:04"}
|
| 2127 |
+
{"current_steps": 2127, "total_steps": 2148, "loss": 0.2311, "lr": 3.1957672274723907e-09, "epoch": 2.9695419669844223, "percentage": 99.02, "elapsed_time": "4:57:05", "remaining_time": "0:02:55"}
|
| 2128 |
+
{"current_steps": 2128, "total_steps": 2148, "loss": 0.2369, "lr": 2.9118733203942207e-09, "epoch": 2.9709369913973496, "percentage": 99.07, "elapsed_time": "4:57:13", "remaining_time": "0:02:47"}
|
| 2129 |
+
{"current_steps": 2129, "total_steps": 2148, "loss": 0.237, "lr": 2.6411787756353e-09, "epoch": 2.972332015810277, "percentage": 99.12, "elapsed_time": "4:57:21", "remaining_time": "0:02:39"}
|
| 2130 |
+
{"current_steps": 2130, "total_steps": 2148, "loss": 0.2468, "lr": 2.3836843082108987e-09, "epoch": 2.9737270402232037, "percentage": 99.16, "elapsed_time": "4:57:30", "remaining_time": "0:02:30"}
|
| 2131 |
+
{"current_steps": 2131, "total_steps": 2148, "loss": 0.2164, "lr": 2.1393905982691752e-09, "epoch": 2.975122064636131, "percentage": 99.21, "elapsed_time": "4:57:38", "remaining_time": "0:02:22"}
|
| 2132 |
+
{"current_steps": 2132, "total_steps": 2148, "loss": 0.2264, "lr": 1.9082982910911817e-09, "epoch": 2.976517089049058, "percentage": 99.26, "elapsed_time": "4:57:46", "remaining_time": "0:02:14"}
|
| 2133 |
+
{"current_steps": 2133, "total_steps": 2148, "loss": 0.2187, "lr": 1.6904079970853083e-09, "epoch": 2.9779121134619855, "percentage": 99.3, "elapsed_time": "4:57:59", "remaining_time": "0:02:05"}
|
| 2134 |
+
{"current_steps": 2134, "total_steps": 2148, "loss": 0.2224, "lr": 1.4857202917900604e-09, "epoch": 2.9793071378749127, "percentage": 99.35, "elapsed_time": "4:58:12", "remaining_time": "0:01:57"}
|
| 2135 |
+
{"current_steps": 2135, "total_steps": 2148, "loss": 0.2136, "lr": 1.2942357158701734e-09, "epoch": 2.98070216228784, "percentage": 99.39, "elapsed_time": "4:58:19", "remaining_time": "0:01:48"}
|
| 2136 |
+
{"current_steps": 2136, "total_steps": 2148, "loss": 0.2397, "lr": 1.1159547751143918e-09, "epoch": 2.9820971867007673, "percentage": 99.44, "elapsed_time": "4:58:26", "remaining_time": "0:01:40"}
|
| 2137 |
+
{"current_steps": 2137, "total_steps": 2148, "loss": 0.2472, "lr": 9.508779404360235e-10, "epoch": 2.9834922111136946, "percentage": 99.49, "elapsed_time": "4:58:34", "remaining_time": "0:01:32"}
|
| 2138 |
+
{"current_steps": 2138, "total_steps": 2148, "loss": 0.222, "lr": 7.990056478707209e-10, "epoch": 2.984887235526622, "percentage": 99.53, "elapsed_time": "4:58:40", "remaining_time": "0:01:23"}
|
| 2139 |
+
{"current_steps": 2139, "total_steps": 2148, "loss": 0.225, "lr": 6.603382985759244e-10, "epoch": 2.986282259939549, "percentage": 99.58, "elapsed_time": "4:58:48", "remaining_time": "0:01:15"}
|
| 2140 |
+
{"current_steps": 2140, "total_steps": 2148, "loss": 0.2621, "lr": 5.348762588286427e-10, "epoch": 2.9876772843524764, "percentage": 99.63, "elapsed_time": "4:58:55", "remaining_time": "0:01:07"}
|
| 2141 |
+
{"current_steps": 2141, "total_steps": 2148, "loss": 0.251, "lr": 4.2261986002600783e-10, "epoch": 2.9890723087654036, "percentage": 99.67, "elapsed_time": "4:59:06", "remaining_time": "0:00:58"}
|
| 2142 |
+
{"current_steps": 2142, "total_steps": 2148, "loss": 0.2618, "lr": 3.235693986830546e-10, "epoch": 2.9904673331783305, "percentage": 99.72, "elapsed_time": "4:59:16", "remaining_time": "0:00:50"}
|
| 2143 |
+
{"current_steps": 2143, "total_steps": 2148, "loss": 0.2406, "lr": 2.3772513643327555e-10, "epoch": 2.9918623575912577, "percentage": 99.77, "elapsed_time": "4:59:25", "remaining_time": "0:00:41"}
|
| 2144 |
+
{"current_steps": 2144, "total_steps": 2148, "loss": 0.2249, "lr": 1.650873000258457e-10, "epoch": 2.993257382004185, "percentage": 99.81, "elapsed_time": "4:59:35", "remaining_time": "0:00:33"}
|
| 2145 |
+
{"current_steps": 2145, "total_steps": 2148, "loss": 0.2308, "lr": 1.0565608132728778e-10, "epoch": 2.9946524064171123, "percentage": 99.86, "elapsed_time": "4:59:46", "remaining_time": "0:00:25"}
|
| 2146 |
+
{"current_steps": 2146, "total_steps": 2148, "loss": 0.2503, "lr": 5.943163732036183e-11, "epoch": 2.9960474308300395, "percentage": 99.91, "elapsed_time": "4:59:53", "remaining_time": "0:00:16"}
|
| 2147 |
+
{"current_steps": 2147, "total_steps": 2148, "loss": 0.2435, "lr": 2.6414090102400147e-11, "epoch": 2.997442455242967, "percentage": 99.95, "elapsed_time": "5:00:01", "remaining_time": "0:00:08"}
|
| 2148 |
+
{"current_steps": 2148, "total_steps": 2148, "loss": 0.2391, "lr": 6.6035268864173e-12, "epoch": 2.998837479655894, "percentage": 100.0, "elapsed_time": "5:00:09", "remaining_time": "0:00:00"}
|
| 2149 |
+
{"current_steps": 2148, "total_steps": 2148, "epoch": 2.998837479655894, "percentage": 100.0, "elapsed_time": "5:02:04", "remaining_time": "0:00:00"}
|