penfever commited on
Commit
69609e8
·
verified ·
1 Parent(s): 69d449b

Training in progress, step 8600

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8cca581268f84db32402d3a5d5a696d25449755c38410afe48dcdb207a58efc
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5643e0ae46a74668c1f95870e0e0a94560f189b106b9a0db8ba3ad52a0871d6b
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6e5248e1e7e430d5f32387fcb7a62dc9148c4e79d1f726e7793412325bfa9517
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46357eaa8c2036198a6f24a88dacf7b4137d22e322c42f2cda31c21ea308f4cc
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9fd646f173467a5f94a2a9924aff2ffe467e6f2436365912dcc884dd2d8827c1
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9aba8533cb5780106aac1cc163616692079f819d177e84559a1f42d9da18b750
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:07b7fc6114fb01c41e7aa8e80291ea0992e5034e07e73b6c3ddedd357ac8514a
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f84b9f322129f4fa4a7c37d94d056f299d3fdad2c4e11b58c661ffe46c84844
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -1712,3 +1712,42 @@
1712
  {"current_steps": 8395, "total_steps": 9128, "loss": 0.1195, "lr": 7.827504264331298e-07, "epoch": 6.438818565400844, "percentage": 91.97, "elapsed_time": "5:13:01", "remaining_time": "0:27:19"}
1713
  {"current_steps": 8400, "total_steps": 9128, "loss": 0.1209, "lr": 7.721915009777902e-07, "epoch": 6.44265439202148, "percentage": 92.02, "elapsed_time": "5:14:18", "remaining_time": "0:27:14"}
1714
  {"current_steps": 8405, "total_steps": 9128, "loss": 0.1102, "lr": 7.617028753523725e-07, "epoch": 6.446490218642118, "percentage": 92.08, "elapsed_time": "5:17:03", "remaining_time": "0:27:16"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1712
  {"current_steps": 8395, "total_steps": 9128, "loss": 0.1195, "lr": 7.827504264331298e-07, "epoch": 6.438818565400844, "percentage": 91.97, "elapsed_time": "5:13:01", "remaining_time": "0:27:19"}
1713
  {"current_steps": 8400, "total_steps": 9128, "loss": 0.1209, "lr": 7.721915009777902e-07, "epoch": 6.44265439202148, "percentage": 92.02, "elapsed_time": "5:14:18", "remaining_time": "0:27:14"}
1714
  {"current_steps": 8405, "total_steps": 9128, "loss": 0.1102, "lr": 7.617028753523725e-07, "epoch": 6.446490218642118, "percentage": 92.08, "elapsed_time": "5:17:03", "remaining_time": "0:27:16"}
1715
+ {"current_steps": 8410, "total_steps": 9128, "loss": 0.1194, "lr": 7.512845879048968e-07, "epoch": 6.450326045262754, "percentage": 92.13, "elapsed_time": "5:18:19", "remaining_time": "0:27:10"}
1716
+ {"current_steps": 8415, "total_steps": 9128, "loss": 0.1193, "lr": 7.409366767262316e-07, "epoch": 6.454161871883391, "percentage": 92.19, "elapsed_time": "5:19:36", "remaining_time": "0:27:04"}
1717
+ {"current_steps": 8420, "total_steps": 9128, "loss": 0.1155, "lr": 7.306591796499374e-07, "epoch": 6.457997698504028, "percentage": 92.24, "elapsed_time": "5:20:52", "remaining_time": "0:26:58"}
1718
+ {"current_steps": 8425, "total_steps": 9128, "loss": 0.1188, "lr": 7.204521342521209e-07, "epoch": 6.461833525124664, "percentage": 92.3, "elapsed_time": "5:22:07", "remaining_time": "0:26:52"}
1719
+ {"current_steps": 8430, "total_steps": 9128, "loss": 0.1111, "lr": 7.103155778513149e-07, "epoch": 6.465669351745301, "percentage": 92.35, "elapsed_time": "5:23:24", "remaining_time": "0:26:46"}
1720
+ {"current_steps": 8435, "total_steps": 9128, "loss": 0.1201, "lr": 7.002495475083337e-07, "epoch": 6.469505178365938, "percentage": 92.41, "elapsed_time": "5:24:40", "remaining_time": "0:26:40"}
1721
+ {"current_steps": 8440, "total_steps": 9128, "loss": 0.1112, "lr": 6.902540800261292e-07, "epoch": 6.473341004986574, "percentage": 92.46, "elapsed_time": "5:25:55", "remaining_time": "0:26:34"}
1722
+ {"current_steps": 8445, "total_steps": 9128, "loss": 0.1288, "lr": 6.803292119496774e-07, "epoch": 6.477176831607212, "percentage": 92.52, "elapsed_time": "5:27:12", "remaining_time": "0:26:27"}
1723
+ {"current_steps": 8450, "total_steps": 9128, "loss": 0.1182, "lr": 6.704749795658227e-07, "epoch": 6.481012658227848, "percentage": 92.57, "elapsed_time": "5:28:31", "remaining_time": "0:26:21"}
1724
+ {"current_steps": 8455, "total_steps": 9128, "loss": 0.1196, "lr": 6.606914189031499e-07, "epoch": 6.484848484848484, "percentage": 92.63, "elapsed_time": "5:29:48", "remaining_time": "0:26:15"}
1725
+ {"current_steps": 8460, "total_steps": 9128, "loss": 0.1155, "lr": 6.509785657318723e-07, "epoch": 6.488684311469122, "percentage": 92.68, "elapsed_time": "5:31:02", "remaining_time": "0:26:08"}
1726
+ {"current_steps": 8465, "total_steps": 9128, "loss": 0.1104, "lr": 6.413364555636769e-07, "epoch": 6.492520138089758, "percentage": 92.74, "elapsed_time": "5:32:17", "remaining_time": "0:26:01"}
1727
+ {"current_steps": 8470, "total_steps": 9128, "loss": 0.117, "lr": 6.317651236515954e-07, "epoch": 6.4963559647103954, "percentage": 92.79, "elapsed_time": "5:33:34", "remaining_time": "0:25:54"}
1728
+ {"current_steps": 8475, "total_steps": 9128, "loss": 0.1099, "lr": 6.222646049899039e-07, "epoch": 6.500191791331032, "percentage": 92.85, "elapsed_time": "5:34:49", "remaining_time": "0:25:47"}
1729
+ {"current_steps": 8480, "total_steps": 9128, "loss": 0.1111, "lr": 6.128349343139506e-07, "epoch": 6.504027617951668, "percentage": 92.9, "elapsed_time": "5:36:05", "remaining_time": "0:25:40"}
1730
+ {"current_steps": 8485, "total_steps": 9128, "loss": 0.1105, "lr": 6.034761461000727e-07, "epoch": 6.507863444572306, "percentage": 92.96, "elapsed_time": "5:37:20", "remaining_time": "0:25:33"}
1731
+ {"current_steps": 8490, "total_steps": 9128, "loss": 0.1217, "lr": 5.941882745654393e-07, "epoch": 6.511699271192942, "percentage": 93.01, "elapsed_time": "5:38:37", "remaining_time": "0:25:26"}
1732
+ {"current_steps": 8495, "total_steps": 9128, "loss": 0.1117, "lr": 5.849713536679357e-07, "epoch": 6.515535097813579, "percentage": 93.07, "elapsed_time": "5:39:52", "remaining_time": "0:25:19"}
1733
+ {"current_steps": 8500, "total_steps": 9128, "loss": 0.1103, "lr": 5.758254171060507e-07, "epoch": 6.519370924434216, "percentage": 93.12, "elapsed_time": "5:41:15", "remaining_time": "0:25:12"}
1734
+ {"current_steps": 8505, "total_steps": 9128, "loss": 0.11, "lr": 5.667504983187311e-07, "epoch": 6.523206751054852, "percentage": 93.17, "elapsed_time": "5:42:36", "remaining_time": "0:25:05"}
1735
+ {"current_steps": 8510, "total_steps": 9128, "loss": 0.1024, "lr": 5.57746630485283e-07, "epoch": 6.5270425776754895, "percentage": 93.23, "elapsed_time": "5:43:51", "remaining_time": "0:24:58"}
1736
+ {"current_steps": 8515, "total_steps": 9128, "loss": 0.1144, "lr": 5.488138465252335e-07, "epoch": 6.530878404296126, "percentage": 93.28, "elapsed_time": "5:45:06", "remaining_time": "0:24:50"}
1737
+ {"current_steps": 8520, "total_steps": 9128, "loss": 0.114, "lr": 5.399521790982131e-07, "epoch": 6.534714230916762, "percentage": 93.34, "elapsed_time": "5:46:24", "remaining_time": "0:24:43"}
1738
+ {"current_steps": 8525, "total_steps": 9128, "loss": 0.1147, "lr": 5.311616606038472e-07, "epoch": 6.5385500575374, "percentage": 93.39, "elapsed_time": "5:47:41", "remaining_time": "0:24:35"}
1739
+ {"current_steps": 8530, "total_steps": 9128, "loss": 0.1162, "lr": 5.224423231816223e-07, "epoch": 6.542385884158036, "percentage": 93.45, "elapsed_time": "5:48:57", "remaining_time": "0:24:27"}
1740
+ {"current_steps": 8535, "total_steps": 9128, "loss": 0.1119, "lr": 5.13794198710782e-07, "epoch": 6.546221710778672, "percentage": 93.5, "elapsed_time": "5:50:13", "remaining_time": "0:24:19"}
1741
+ {"current_steps": 8540, "total_steps": 9128, "loss": 0.1122, "lr": 5.052173188102005e-07, "epoch": 6.55005753739931, "percentage": 93.56, "elapsed_time": "5:51:28", "remaining_time": "0:24:12"}
1742
+ {"current_steps": 8545, "total_steps": 9128, "loss": 0.2227, "lr": 4.967117148382716e-07, "epoch": 6.553893364019946, "percentage": 93.61, "elapsed_time": "5:53:35", "remaining_time": "0:24:07"}
1743
+ {"current_steps": 8550, "total_steps": 9128, "loss": 0.2159, "lr": 4.882774178927951e-07, "epoch": 6.557729190640583, "percentage": 93.67, "elapsed_time": "5:55:45", "remaining_time": "0:24:03"}
1744
+ {"current_steps": 8555, "total_steps": 9128, "loss": 0.2124, "lr": 4.799144588108595e-07, "epoch": 6.56156501726122, "percentage": 93.72, "elapsed_time": "5:58:18", "remaining_time": "0:23:59"}
1745
+ {"current_steps": 8560, "total_steps": 9128, "loss": 0.2041, "lr": 4.716228681687285e-07, "epoch": 6.565400843881856, "percentage": 93.78, "elapsed_time": "6:00:36", "remaining_time": "0:23:55"}
1746
+ {"current_steps": 8565, "total_steps": 9128, "loss": 0.2134, "lr": 4.63402676281739e-07, "epoch": 6.569236670502494, "percentage": 93.83, "elapsed_time": "6:02:55", "remaining_time": "0:23:51"}
1747
+ {"current_steps": 8570, "total_steps": 9128, "loss": 0.2118, "lr": 4.5525391320417667e-07, "epoch": 6.57307249712313, "percentage": 93.89, "elapsed_time": "6:05:14", "remaining_time": "0:23:46"}
1748
+ {"current_steps": 8575, "total_steps": 9128, "loss": 0.2048, "lr": 4.4717660872917624e-07, "epoch": 6.576908323743766, "percentage": 93.94, "elapsed_time": "6:07:43", "remaining_time": "0:23:42"}
1749
+ {"current_steps": 8580, "total_steps": 9128, "loss": 0.2052, "lr": 4.391707923886035e-07, "epoch": 6.580744150364404, "percentage": 94.0, "elapsed_time": "6:09:55", "remaining_time": "0:23:37"}
1750
+ {"current_steps": 8585, "total_steps": 9128, "loss": 0.2136, "lr": 4.312364934529623e-07, "epoch": 6.58457997698504, "percentage": 94.05, "elapsed_time": "6:12:23", "remaining_time": "0:23:33"}
1751
+ {"current_steps": 8590, "total_steps": 9128, "loss": 0.2121, "lr": 4.233737409312655e-07, "epoch": 6.5884158036056775, "percentage": 94.11, "elapsed_time": "6:14:36", "remaining_time": "0:23:27"}
1752
+ {"current_steps": 8595, "total_steps": 9128, "loss": 0.2109, "lr": 4.155825635709509e-07, "epoch": 6.592251630226314, "percentage": 94.16, "elapsed_time": "6:16:57", "remaining_time": "0:23:22"}
1753
+ {"current_steps": 8600, "total_steps": 9128, "loss": 0.2018, "lr": 4.078629898577635e-07, "epoch": 6.59608745684695, "percentage": 94.22, "elapsed_time": "6:19:33", "remaining_time": "0:23:18"}