penfever commited on
Commit
ab0cdc6
·
verified ·
1 Parent(s): 074f149

Training in progress, step 9400

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b1122f99e3fb1dd69991499b44f455fea57f40e717fcde33a21664d3f92004b7
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:098c66a66fcc14deabc66f12753bff071d233722893c0c17f511a49e6e717fd0
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7a8eaf068c58e3112cf54a3a8cfce6b33bbfd15f517616ad0160ae8d868afd7f
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb67372fcdbbaf294b0722aff8d566efb15a7c96c679f80eb5e6871e84dc7c20
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:eeab04c372de4b5cec4efe5fab6e32a2d71c625b0a7462e33e27568aee2bb755
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bbb6742468e75881577517d19dc58eaac8d938d0ae84351bd8f0ac8ffd2b1fa
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:71f17007a095747f77dce426b7d760ad5cbfa51eca1f13530bbcfd6e00036ef2
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8676e4fcdc1daafc8b713f5f82f9295a64707eddee55386857a392f4ba8900b
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -1852,3 +1852,43 @@
1852
  {"current_steps": 9190, "total_steps": 9625, "loss": 0.1855, "lr": 2.49534843018866e-07, "epoch": 6.684612586395053, "percentage": 95.48, "elapsed_time": "13:50:16", "remaining_time": "0:39:18"}
1853
  {"current_steps": 9195, "total_steps": 9625, "loss": 0.1898, "lr": 2.4385597615269376e-07, "epoch": 6.688250272826482, "percentage": 95.53, "elapsed_time": "13:51:55", "remaining_time": "0:38:54"}
1854
  {"current_steps": 9200, "total_steps": 9625, "loss": 0.1902, "lr": 2.382420781784589e-07, "epoch": 6.691887959257912, "percentage": 95.58, "elapsed_time": "13:53:33", "remaining_time": "0:38:30"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1852
  {"current_steps": 9190, "total_steps": 9625, "loss": 0.1855, "lr": 2.49534843018866e-07, "epoch": 6.684612586395053, "percentage": 95.48, "elapsed_time": "13:50:16", "remaining_time": "0:39:18"}
1853
  {"current_steps": 9195, "total_steps": 9625, "loss": 0.1898, "lr": 2.4385597615269376e-07, "epoch": 6.688250272826482, "percentage": 95.53, "elapsed_time": "13:51:55", "remaining_time": "0:38:54"}
1854
  {"current_steps": 9200, "total_steps": 9625, "loss": 0.1902, "lr": 2.382420781784589e-07, "epoch": 6.691887959257912, "percentage": 95.58, "elapsed_time": "13:53:33", "remaining_time": "0:38:30"}
1855
+ {"current_steps": 9205, "total_steps": 9625, "loss": 0.1813, "lr": 2.3269316755768933e-07, "epoch": 6.695525645689342, "percentage": 95.64, "elapsed_time": "13:56:37", "remaining_time": "0:38:10"}
1856
+ {"current_steps": 9210, "total_steps": 9625, "loss": 0.1924, "lr": 2.2720926253821273e-07, "epoch": 6.699163332120771, "percentage": 95.69, "elapsed_time": "13:58:10", "remaining_time": "0:37:46"}
1857
+ {"current_steps": 9215, "total_steps": 9625, "loss": 0.1891, "lr": 2.2179038115407003e-07, "epoch": 6.702801018552201, "percentage": 95.74, "elapsed_time": "13:59:46", "remaining_time": "0:37:21"}
1858
+ {"current_steps": 9220, "total_steps": 9625, "loss": 0.1898, "lr": 2.1643654122548207e-07, "epoch": 6.70643870498363, "percentage": 95.79, "elapsed_time": "14:01:25", "remaining_time": "0:36:57"}
1859
+ {"current_steps": 9225, "total_steps": 9625, "loss": 0.1871, "lr": 2.1114776035876748e-07, "epoch": 6.71007639141506, "percentage": 95.84, "elapsed_time": "14:03:08", "remaining_time": "0:36:33"}
1860
+ {"current_steps": 9230, "total_steps": 9625, "loss": 0.1907, "lr": 2.059240559463005e-07, "epoch": 6.71371407784649, "percentage": 95.9, "elapsed_time": "14:04:48", "remaining_time": "0:36:09"}
1861
+ {"current_steps": 9235, "total_steps": 9625, "loss": 0.1891, "lr": 2.0076544516644646e-07, "epoch": 6.717351764277919, "percentage": 95.95, "elapsed_time": "14:06:35", "remaining_time": "0:35:45"}
1862
+ {"current_steps": 9240, "total_steps": 9625, "loss": 0.1928, "lr": 1.9567194498351093e-07, "epoch": 6.720989450709348, "percentage": 96.0, "elapsed_time": "14:08:15", "remaining_time": "0:35:20"}
1863
+ {"current_steps": 9245, "total_steps": 9625, "loss": 0.1861, "lr": 1.906435721476796e-07, "epoch": 6.724627137140779, "percentage": 96.05, "elapsed_time": "14:09:52", "remaining_time": "0:34:55"}
1864
+ {"current_steps": 9250, "total_steps": 9625, "loss": 0.1923, "lr": 1.8568034319495832e-07, "epoch": 6.728264823572208, "percentage": 96.1, "elapsed_time": "14:11:35", "remaining_time": "0:34:31"}
1865
+ {"current_steps": 9255, "total_steps": 9625, "loss": 0.1838, "lr": 1.8078227444713548e-07, "epoch": 6.731902510003637, "percentage": 96.16, "elapsed_time": "14:13:19", "remaining_time": "0:34:06"}
1866
+ {"current_steps": 9260, "total_steps": 9625, "loss": 0.1862, "lr": 1.7594938201170863e-07, "epoch": 6.735540196435068, "percentage": 96.21, "elapsed_time": "14:14:58", "remaining_time": "0:33:42"}
1867
+ {"current_steps": 9265, "total_steps": 9625, "loss": 0.1847, "lr": 1.7118168178184236e-07, "epoch": 6.739177882866497, "percentage": 96.26, "elapsed_time": "14:16:36", "remaining_time": "0:33:17"}
1868
+ {"current_steps": 9270, "total_steps": 9625, "loss": 0.1884, "lr": 1.6647918943631937e-07, "epoch": 6.742815569297926, "percentage": 96.31, "elapsed_time": "14:18:20", "remaining_time": "0:32:52"}
1869
+ {"current_steps": 9275, "total_steps": 9625, "loss": 0.1913, "lr": 1.6184192043947166e-07, "epoch": 6.746453255729357, "percentage": 96.36, "elapsed_time": "14:19:57", "remaining_time": "0:32:27"}
1870
+ {"current_steps": 9280, "total_steps": 9625, "loss": 0.192, "lr": 1.5726989004115622e-07, "epoch": 6.750090942160786, "percentage": 96.42, "elapsed_time": "14:21:37", "remaining_time": "0:32:01"}
1871
+ {"current_steps": 9285, "total_steps": 9625, "loss": 0.1895, "lr": 1.5276311327667936e-07, "epoch": 6.753728628592215, "percentage": 96.47, "elapsed_time": "14:23:19", "remaining_time": "0:31:36"}
1872
+ {"current_steps": 9290, "total_steps": 9625, "loss": 0.1926, "lr": 1.4832160496676128e-07, "epoch": 6.757366315023645, "percentage": 96.52, "elapsed_time": "14:25:03", "remaining_time": "0:31:11"}
1873
+ {"current_steps": 9295, "total_steps": 9625, "loss": 0.1907, "lr": 1.4394537971748946e-07, "epoch": 6.761004001455074, "percentage": 96.57, "elapsed_time": "14:26:36", "remaining_time": "0:30:46"}
1874
+ {"current_steps": 9300, "total_steps": 9625, "loss": 0.1898, "lr": 1.3963445192025417e-07, "epoch": 6.764641687886504, "percentage": 96.62, "elapsed_time": "14:28:19", "remaining_time": "0:30:20"}
1875
+ {"current_steps": 9305, "total_steps": 9625, "loss": 0.1757, "lr": 1.3538883575171967e-07, "epoch": 6.768279374317934, "percentage": 96.68, "elapsed_time": "14:30:01", "remaining_time": "0:29:55"}
1876
+ {"current_steps": 9310, "total_steps": 9625, "loss": 0.1875, "lr": 1.3120854517377324e-07, "epoch": 6.771917060749363, "percentage": 96.73, "elapsed_time": "14:31:36", "remaining_time": "0:29:29"}
1877
+ {"current_steps": 9315, "total_steps": 9625, "loss": 0.1746, "lr": 1.2709359393347165e-07, "epoch": 6.775554747180793, "percentage": 96.78, "elapsed_time": "14:33:18", "remaining_time": "0:29:03"}
1878
+ {"current_steps": 9320, "total_steps": 9625, "loss": 0.2044, "lr": 1.2304399556299917e-07, "epoch": 6.779192433612223, "percentage": 96.83, "elapsed_time": "14:34:57", "remaining_time": "0:28:38"}
1879
+ {"current_steps": 9325, "total_steps": 9625, "loss": 0.1901, "lr": 1.1905976337962533e-07, "epoch": 6.782830120043652, "percentage": 96.88, "elapsed_time": "14:36:47", "remaining_time": "0:28:12"}
1880
+ {"current_steps": 9330, "total_steps": 9625, "loss": 0.193, "lr": 1.1514091048566489e-07, "epoch": 6.786467806475082, "percentage": 96.94, "elapsed_time": "14:38:30", "remaining_time": "0:27:46"}
1881
+ {"current_steps": 9335, "total_steps": 9625, "loss": 0.195, "lr": 1.1128744976842465e-07, "epoch": 6.790105492906512, "percentage": 96.99, "elapsed_time": "14:40:12", "remaining_time": "0:27:20"}
1882
+ {"current_steps": 9340, "total_steps": 9625, "loss": 0.1974, "lr": 1.0749939390017006e-07, "epoch": 6.793743179337941, "percentage": 97.04, "elapsed_time": "14:41:53", "remaining_time": "0:26:54"}
1883
+ {"current_steps": 9345, "total_steps": 9625, "loss": 0.1921, "lr": 1.0377675533807641e-07, "epoch": 6.79738086576937, "percentage": 97.09, "elapsed_time": "14:43:32", "remaining_time": "0:26:28"}
1884
+ {"current_steps": 9350, "total_steps": 9625, "loss": 0.18, "lr": 1.0011954632419551e-07, "epoch": 6.801018552200801, "percentage": 97.14, "elapsed_time": "14:45:11", "remaining_time": "0:26:02"}
1885
+ {"current_steps": 9355, "total_steps": 9625, "loss": 0.1836, "lr": 9.652777888541131e-08, "epoch": 6.80465623863223, "percentage": 97.19, "elapsed_time": "14:46:47", "remaining_time": "0:25:35"}
1886
+ {"current_steps": 9360, "total_steps": 9625, "loss": 0.1788, "lr": 9.300146483339323e-08, "epoch": 6.808293925063659, "percentage": 97.25, "elapsed_time": "14:48:25", "remaining_time": "0:25:09"}
1887
+ {"current_steps": 9365, "total_steps": 9625, "loss": 0.18, "lr": 8.954061576457396e-08, "epoch": 6.811931611495089, "percentage": 97.3, "elapsed_time": "14:50:07", "remaining_time": "0:24:42"}
1888
+ {"current_steps": 9370, "total_steps": 9625, "loss": 0.1742, "lr": 8.614524306009842e-08, "epoch": 6.815569297926519, "percentage": 97.35, "elapsed_time": "14:51:48", "remaining_time": "0:24:16"}
1889
+ {"current_steps": 9375, "total_steps": 9625, "loss": 0.1705, "lr": 8.28153578857882e-08, "epoch": 6.819206984357948, "percentage": 97.4, "elapsed_time": "14:53:25", "remaining_time": "0:23:49"}
1890
+ {"current_steps": 9380, "total_steps": 9625, "loss": 0.1865, "lr": 7.955097119210609e-08, "epoch": 6.822844670789378, "percentage": 97.45, "elapsed_time": "14:55:05", "remaining_time": "0:23:22"}
1891
+ {"current_steps": 9385, "total_steps": 9625, "loss": 0.2029, "lr": 7.635209371412489e-08, "epoch": 6.826482357220808, "percentage": 97.51, "elapsed_time": "14:56:43", "remaining_time": "0:22:55"}
1892
+ {"current_steps": 9390, "total_steps": 9625, "loss": 0.1898, "lr": 7.32187359714831e-08, "epoch": 6.830120043652237, "percentage": 97.56, "elapsed_time": "14:58:21", "remaining_time": "0:22:28"}
1893
+ {"current_steps": 9395, "total_steps": 9625, "loss": 0.1931, "lr": 7.015090826835603e-08, "epoch": 6.833757730083667, "percentage": 97.61, "elapsed_time": "15:00:01", "remaining_time": "0:22:02"}
1894
+ {"current_steps": 9400, "total_steps": 9625, "loss": 0.1869, "lr": 6.714862069342021e-08, "epoch": 6.837395416515096, "percentage": 97.66, "elapsed_time": "15:01:42", "remaining_time": "0:21:35"}