Training in progress, step 9400
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4902257696
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:098c66a66fcc14deabc66f12753bff071d233722893c0c17f511a49e6e717fd0
|
| 3 |
size 4902257696
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915960368
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eb67372fcdbbaf294b0722aff8d566efb15a7c96c679f80eb5e6871e84dc7c20
|
| 3 |
size 4915960368
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4983068496
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6bbb6742468e75881577517d19dc58eaac8d938d0ae84351bd8f0ac8ffd2b1fa
|
| 3 |
size 4983068496
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1580230264
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f8676e4fcdc1daafc8b713f5f82f9295a64707eddee55386857a392f4ba8900b
|
| 3 |
size 1580230264
|
trainer_log.jsonl
CHANGED
|
@@ -1852,3 +1852,43 @@
|
|
| 1852 |
{"current_steps": 9190, "total_steps": 9625, "loss": 0.1855, "lr": 2.49534843018866e-07, "epoch": 6.684612586395053, "percentage": 95.48, "elapsed_time": "13:50:16", "remaining_time": "0:39:18"}
|
| 1853 |
{"current_steps": 9195, "total_steps": 9625, "loss": 0.1898, "lr": 2.4385597615269376e-07, "epoch": 6.688250272826482, "percentage": 95.53, "elapsed_time": "13:51:55", "remaining_time": "0:38:54"}
|
| 1854 |
{"current_steps": 9200, "total_steps": 9625, "loss": 0.1902, "lr": 2.382420781784589e-07, "epoch": 6.691887959257912, "percentage": 95.58, "elapsed_time": "13:53:33", "remaining_time": "0:38:30"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1852 |
{"current_steps": 9190, "total_steps": 9625, "loss": 0.1855, "lr": 2.49534843018866e-07, "epoch": 6.684612586395053, "percentage": 95.48, "elapsed_time": "13:50:16", "remaining_time": "0:39:18"}
|
| 1853 |
{"current_steps": 9195, "total_steps": 9625, "loss": 0.1898, "lr": 2.4385597615269376e-07, "epoch": 6.688250272826482, "percentage": 95.53, "elapsed_time": "13:51:55", "remaining_time": "0:38:54"}
|
| 1854 |
{"current_steps": 9200, "total_steps": 9625, "loss": 0.1902, "lr": 2.382420781784589e-07, "epoch": 6.691887959257912, "percentage": 95.58, "elapsed_time": "13:53:33", "remaining_time": "0:38:30"}
|
| 1855 |
+
{"current_steps": 9205, "total_steps": 9625, "loss": 0.1813, "lr": 2.3269316755768933e-07, "epoch": 6.695525645689342, "percentage": 95.64, "elapsed_time": "13:56:37", "remaining_time": "0:38:10"}
|
| 1856 |
+
{"current_steps": 9210, "total_steps": 9625, "loss": 0.1924, "lr": 2.2720926253821273e-07, "epoch": 6.699163332120771, "percentage": 95.69, "elapsed_time": "13:58:10", "remaining_time": "0:37:46"}
|
| 1857 |
+
{"current_steps": 9215, "total_steps": 9625, "loss": 0.1891, "lr": 2.2179038115407003e-07, "epoch": 6.702801018552201, "percentage": 95.74, "elapsed_time": "13:59:46", "remaining_time": "0:37:21"}
|
| 1858 |
+
{"current_steps": 9220, "total_steps": 9625, "loss": 0.1898, "lr": 2.1643654122548207e-07, "epoch": 6.70643870498363, "percentage": 95.79, "elapsed_time": "14:01:25", "remaining_time": "0:36:57"}
|
| 1859 |
+
{"current_steps": 9225, "total_steps": 9625, "loss": 0.1871, "lr": 2.1114776035876748e-07, "epoch": 6.71007639141506, "percentage": 95.84, "elapsed_time": "14:03:08", "remaining_time": "0:36:33"}
|
| 1860 |
+
{"current_steps": 9230, "total_steps": 9625, "loss": 0.1907, "lr": 2.059240559463005e-07, "epoch": 6.71371407784649, "percentage": 95.9, "elapsed_time": "14:04:48", "remaining_time": "0:36:09"}
|
| 1861 |
+
{"current_steps": 9235, "total_steps": 9625, "loss": 0.1891, "lr": 2.0076544516644646e-07, "epoch": 6.717351764277919, "percentage": 95.95, "elapsed_time": "14:06:35", "remaining_time": "0:35:45"}
|
| 1862 |
+
{"current_steps": 9240, "total_steps": 9625, "loss": 0.1928, "lr": 1.9567194498351093e-07, "epoch": 6.720989450709348, "percentage": 96.0, "elapsed_time": "14:08:15", "remaining_time": "0:35:20"}
|
| 1863 |
+
{"current_steps": 9245, "total_steps": 9625, "loss": 0.1861, "lr": 1.906435721476796e-07, "epoch": 6.724627137140779, "percentage": 96.05, "elapsed_time": "14:09:52", "remaining_time": "0:34:55"}
|
| 1864 |
+
{"current_steps": 9250, "total_steps": 9625, "loss": 0.1923, "lr": 1.8568034319495832e-07, "epoch": 6.728264823572208, "percentage": 96.1, "elapsed_time": "14:11:35", "remaining_time": "0:34:31"}
|
| 1865 |
+
{"current_steps": 9255, "total_steps": 9625, "loss": 0.1838, "lr": 1.8078227444713548e-07, "epoch": 6.731902510003637, "percentage": 96.16, "elapsed_time": "14:13:19", "remaining_time": "0:34:06"}
|
| 1866 |
+
{"current_steps": 9260, "total_steps": 9625, "loss": 0.1862, "lr": 1.7594938201170863e-07, "epoch": 6.735540196435068, "percentage": 96.21, "elapsed_time": "14:14:58", "remaining_time": "0:33:42"}
|
| 1867 |
+
{"current_steps": 9265, "total_steps": 9625, "loss": 0.1847, "lr": 1.7118168178184236e-07, "epoch": 6.739177882866497, "percentage": 96.26, "elapsed_time": "14:16:36", "remaining_time": "0:33:17"}
|
| 1868 |
+
{"current_steps": 9270, "total_steps": 9625, "loss": 0.1884, "lr": 1.6647918943631937e-07, "epoch": 6.742815569297926, "percentage": 96.31, "elapsed_time": "14:18:20", "remaining_time": "0:32:52"}
|
| 1869 |
+
{"current_steps": 9275, "total_steps": 9625, "loss": 0.1913, "lr": 1.6184192043947166e-07, "epoch": 6.746453255729357, "percentage": 96.36, "elapsed_time": "14:19:57", "remaining_time": "0:32:27"}
|
| 1870 |
+
{"current_steps": 9280, "total_steps": 9625, "loss": 0.192, "lr": 1.5726989004115622e-07, "epoch": 6.750090942160786, "percentage": 96.42, "elapsed_time": "14:21:37", "remaining_time": "0:32:01"}
|
| 1871 |
+
{"current_steps": 9285, "total_steps": 9625, "loss": 0.1895, "lr": 1.5276311327667936e-07, "epoch": 6.753728628592215, "percentage": 96.47, "elapsed_time": "14:23:19", "remaining_time": "0:31:36"}
|
| 1872 |
+
{"current_steps": 9290, "total_steps": 9625, "loss": 0.1926, "lr": 1.4832160496676128e-07, "epoch": 6.757366315023645, "percentage": 96.52, "elapsed_time": "14:25:03", "remaining_time": "0:31:11"}
|
| 1873 |
+
{"current_steps": 9295, "total_steps": 9625, "loss": 0.1907, "lr": 1.4394537971748946e-07, "epoch": 6.761004001455074, "percentage": 96.57, "elapsed_time": "14:26:36", "remaining_time": "0:30:46"}
|
| 1874 |
+
{"current_steps": 9300, "total_steps": 9625, "loss": 0.1898, "lr": 1.3963445192025417e-07, "epoch": 6.764641687886504, "percentage": 96.62, "elapsed_time": "14:28:19", "remaining_time": "0:30:20"}
|
| 1875 |
+
{"current_steps": 9305, "total_steps": 9625, "loss": 0.1757, "lr": 1.3538883575171967e-07, "epoch": 6.768279374317934, "percentage": 96.68, "elapsed_time": "14:30:01", "remaining_time": "0:29:55"}
|
| 1876 |
+
{"current_steps": 9310, "total_steps": 9625, "loss": 0.1875, "lr": 1.3120854517377324e-07, "epoch": 6.771917060749363, "percentage": 96.73, "elapsed_time": "14:31:36", "remaining_time": "0:29:29"}
|
| 1877 |
+
{"current_steps": 9315, "total_steps": 9625, "loss": 0.1746, "lr": 1.2709359393347165e-07, "epoch": 6.775554747180793, "percentage": 96.78, "elapsed_time": "14:33:18", "remaining_time": "0:29:03"}
|
| 1878 |
+
{"current_steps": 9320, "total_steps": 9625, "loss": 0.2044, "lr": 1.2304399556299917e-07, "epoch": 6.779192433612223, "percentage": 96.83, "elapsed_time": "14:34:57", "remaining_time": "0:28:38"}
|
| 1879 |
+
{"current_steps": 9325, "total_steps": 9625, "loss": 0.1901, "lr": 1.1905976337962533e-07, "epoch": 6.782830120043652, "percentage": 96.88, "elapsed_time": "14:36:47", "remaining_time": "0:28:12"}
|
| 1880 |
+
{"current_steps": 9330, "total_steps": 9625, "loss": 0.193, "lr": 1.1514091048566489e-07, "epoch": 6.786467806475082, "percentage": 96.94, "elapsed_time": "14:38:30", "remaining_time": "0:27:46"}
|
| 1881 |
+
{"current_steps": 9335, "total_steps": 9625, "loss": 0.195, "lr": 1.1128744976842465e-07, "epoch": 6.790105492906512, "percentage": 96.99, "elapsed_time": "14:40:12", "remaining_time": "0:27:20"}
|
| 1882 |
+
{"current_steps": 9340, "total_steps": 9625, "loss": 0.1974, "lr": 1.0749939390017006e-07, "epoch": 6.793743179337941, "percentage": 97.04, "elapsed_time": "14:41:53", "remaining_time": "0:26:54"}
|
| 1883 |
+
{"current_steps": 9345, "total_steps": 9625, "loss": 0.1921, "lr": 1.0377675533807641e-07, "epoch": 6.79738086576937, "percentage": 97.09, "elapsed_time": "14:43:32", "remaining_time": "0:26:28"}
|
| 1884 |
+
{"current_steps": 9350, "total_steps": 9625, "loss": 0.18, "lr": 1.0011954632419551e-07, "epoch": 6.801018552200801, "percentage": 97.14, "elapsed_time": "14:45:11", "remaining_time": "0:26:02"}
|
| 1885 |
+
{"current_steps": 9355, "total_steps": 9625, "loss": 0.1836, "lr": 9.652777888541131e-08, "epoch": 6.80465623863223, "percentage": 97.19, "elapsed_time": "14:46:47", "remaining_time": "0:25:35"}
|
| 1886 |
+
{"current_steps": 9360, "total_steps": 9625, "loss": 0.1788, "lr": 9.300146483339323e-08, "epoch": 6.808293925063659, "percentage": 97.25, "elapsed_time": "14:48:25", "remaining_time": "0:25:09"}
|
| 1887 |
+
{"current_steps": 9365, "total_steps": 9625, "loss": 0.18, "lr": 8.954061576457396e-08, "epoch": 6.811931611495089, "percentage": 97.3, "elapsed_time": "14:50:07", "remaining_time": "0:24:42"}
|
| 1888 |
+
{"current_steps": 9370, "total_steps": 9625, "loss": 0.1742, "lr": 8.614524306009842e-08, "epoch": 6.815569297926519, "percentage": 97.35, "elapsed_time": "14:51:48", "remaining_time": "0:24:16"}
|
| 1889 |
+
{"current_steps": 9375, "total_steps": 9625, "loss": 0.1705, "lr": 8.28153578857882e-08, "epoch": 6.819206984357948, "percentage": 97.4, "elapsed_time": "14:53:25", "remaining_time": "0:23:49"}
|
| 1890 |
+
{"current_steps": 9380, "total_steps": 9625, "loss": 0.1865, "lr": 7.955097119210609e-08, "epoch": 6.822844670789378, "percentage": 97.45, "elapsed_time": "14:55:05", "remaining_time": "0:23:22"}
|
| 1891 |
+
{"current_steps": 9385, "total_steps": 9625, "loss": 0.2029, "lr": 7.635209371412489e-08, "epoch": 6.826482357220808, "percentage": 97.51, "elapsed_time": "14:56:43", "remaining_time": "0:22:55"}
|
| 1892 |
+
{"current_steps": 9390, "total_steps": 9625, "loss": 0.1898, "lr": 7.32187359714831e-08, "epoch": 6.830120043652237, "percentage": 97.56, "elapsed_time": "14:58:21", "remaining_time": "0:22:28"}
|
| 1893 |
+
{"current_steps": 9395, "total_steps": 9625, "loss": 0.1931, "lr": 7.015090826835603e-08, "epoch": 6.833757730083667, "percentage": 97.61, "elapsed_time": "15:00:01", "remaining_time": "0:22:02"}
|
| 1894 |
+
{"current_steps": 9400, "total_steps": 9625, "loss": 0.1869, "lr": 6.714862069342021e-08, "epoch": 6.837395416515096, "percentage": 97.66, "elapsed_time": "15:01:42", "remaining_time": "0:21:35"}
|