penfever commited on
Commit
79826ea
·
verified ·
1 Parent(s): be0da4b

Training in progress, step 7600

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:79682ff1f86458886b55ed95c5d41c1dc5af2bf263bf71f12a816419928ed63d
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5f334f5afe449a3011d215337373b7326b2460b08dcc4f033940513e27c6f9a
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:57138e8cd57d91dce5e47e0a886d9cf69d701ad1b9495033413bf23230e1d986
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:62ec755d06127e628b922395015710ab55c9ca048e27538356b0e16a409e1db4
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c89ac1c8a505b35e19ff7e3a73784ffe349b344494f8ca6348d6c2968b826a6
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6b54065f4695921ea58283c3f620f2e7ac4cab716f4a5a8a9b0603eff88bfdf
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:96f6f91db3ec86805ec9eacf5f8faa0c3f8b68ea80a356c8c11f847210f9c6ad
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:736de5030acda2b7dbb38923f822e5d5b41450ab6cd1cbaba89bd495fd8ea864
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -1504,3 +1504,31 @@
1504
  {"current_steps": 7450, "total_steps": 9625, "loss": 0.1639, "lr": 5.911823029029531e-06, "epoch": 5.4183339396144055, "percentage": 77.4, "elapsed_time": "1:43:00", "remaining_time": "0:30:04"}
1505
  {"current_steps": 7455, "total_steps": 9625, "loss": 0.157, "lr": 5.8861029031564185e-06, "epoch": 5.421971626045835, "percentage": 77.45, "elapsed_time": "1:45:55", "remaining_time": "0:30:49"}
1506
  {"current_steps": 7460, "total_steps": 9625, "loss": 0.1584, "lr": 5.860429191414232e-06, "epoch": 5.425609312477264, "percentage": 77.51, "elapsed_time": "1:48:33", "remaining_time": "0:31:30"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1504
  {"current_steps": 7450, "total_steps": 9625, "loss": 0.1639, "lr": 5.911823029029531e-06, "epoch": 5.4183339396144055, "percentage": 77.4, "elapsed_time": "1:43:00", "remaining_time": "0:30:04"}
1505
  {"current_steps": 7455, "total_steps": 9625, "loss": 0.157, "lr": 5.8861029031564185e-06, "epoch": 5.421971626045835, "percentage": 77.45, "elapsed_time": "1:45:55", "remaining_time": "0:30:49"}
1506
  {"current_steps": 7460, "total_steps": 9625, "loss": 0.1584, "lr": 5.860429191414232e-06, "epoch": 5.425609312477264, "percentage": 77.51, "elapsed_time": "1:48:33", "remaining_time": "0:31:30"}
1507
+ {"current_steps": 7465, "total_steps": 9625, "loss": 0.1663, "lr": 5.834801978232019e-06, "epoch": 5.429246998908694, "percentage": 77.56, "elapsed_time": "1:51:15", "remaining_time": "0:32:11"}
1508
+ {"current_steps": 7470, "total_steps": 9625, "loss": 0.1589, "lr": 5.809221347885929e-06, "epoch": 5.432884685340124, "percentage": 77.61, "elapsed_time": "1:54:04", "remaining_time": "0:32:54"}
1509
+ {"current_steps": 7475, "total_steps": 9625, "loss": 0.1661, "lr": 5.7836873844989195e-06, "epoch": 5.436522371771553, "percentage": 77.66, "elapsed_time": "1:57:03", "remaining_time": "0:33:40"}
1510
+ {"current_steps": 7480, "total_steps": 9625, "loss": 0.1754, "lr": 5.758200172040484e-06, "epoch": 5.4401600582029825, "percentage": 77.71, "elapsed_time": "1:59:51", "remaining_time": "0:34:22"}
1511
+ {"current_steps": 7485, "total_steps": 9625, "loss": 0.1473, "lr": 5.732759794326355e-06, "epoch": 5.443797744634413, "percentage": 77.77, "elapsed_time": "2:02:13", "remaining_time": "0:34:56"}
1512
+ {"current_steps": 7490, "total_steps": 9625, "loss": 0.1499, "lr": 5.707366335018267e-06, "epoch": 5.447435431065842, "percentage": 77.82, "elapsed_time": "2:05:07", "remaining_time": "0:35:39"}
1513
+ {"current_steps": 7495, "total_steps": 9625, "loss": 0.1587, "lr": 5.682019877623666e-06, "epoch": 5.4510731174972715, "percentage": 77.87, "elapsed_time": "2:08:01", "remaining_time": "0:36:22"}
1514
+ {"current_steps": 7500, "total_steps": 9625, "loss": 0.1574, "lr": 5.656720505495399e-06, "epoch": 5.454710803928702, "percentage": 77.92, "elapsed_time": "2:10:48", "remaining_time": "0:37:03"}
1515
+ {"current_steps": 7505, "total_steps": 9625, "loss": 0.1639, "lr": 5.631468301831509e-06, "epoch": 5.458348490360131, "percentage": 77.97, "elapsed_time": "2:13:42", "remaining_time": "0:37:46"}
1516
+ {"current_steps": 7510, "total_steps": 9625, "loss": 0.1565, "lr": 5.606263349674894e-06, "epoch": 5.4619861767915605, "percentage": 78.03, "elapsed_time": "2:16:46", "remaining_time": "0:38:31"}
1517
+ {"current_steps": 7515, "total_steps": 9625, "loss": 0.1501, "lr": 5.581105731913079e-06, "epoch": 5.46562386322299, "percentage": 78.08, "elapsed_time": "2:19:46", "remaining_time": "0:39:14"}
1518
+ {"current_steps": 7520, "total_steps": 9625, "loss": 0.14, "lr": 5.555995531277931e-06, "epoch": 5.46926154965442, "percentage": 78.13, "elapsed_time": "2:22:48", "remaining_time": "0:39:58"}
1519
+ {"current_steps": 7525, "total_steps": 9625, "loss": 0.1386, "lr": 5.530932830345368e-06, "epoch": 5.4728992360858495, "percentage": 78.18, "elapsed_time": "2:25:39", "remaining_time": "0:40:38"}
1520
+ {"current_steps": 7530, "total_steps": 9625, "loss": 0.1635, "lr": 5.50591771153512e-06, "epoch": 5.476536922517279, "percentage": 78.23, "elapsed_time": "2:28:28", "remaining_time": "0:41:18"}
1521
+ {"current_steps": 7535, "total_steps": 9625, "loss": 0.1483, "lr": 5.480950257110424e-06, "epoch": 5.480174608948708, "percentage": 78.29, "elapsed_time": "2:30:47", "remaining_time": "0:41:49"}
1522
+ {"current_steps": 7540, "total_steps": 9625, "loss": 0.1654, "lr": 5.4560305491777885e-06, "epoch": 5.4838122953801385, "percentage": 78.34, "elapsed_time": "2:33:34", "remaining_time": "0:42:28"}
1523
+ {"current_steps": 7545, "total_steps": 9625, "loss": 0.1709, "lr": 5.431158669686696e-06, "epoch": 5.487449981811568, "percentage": 78.39, "elapsed_time": "2:36:32", "remaining_time": "0:43:09"}
1524
+ {"current_steps": 7550, "total_steps": 9625, "loss": 0.1685, "lr": 5.4063347004293495e-06, "epoch": 5.491087668242997, "percentage": 78.44, "elapsed_time": "2:39:25", "remaining_time": "0:43:48"}
1525
+ {"current_steps": 7555, "total_steps": 9625, "loss": 0.1593, "lr": 5.381558723040388e-06, "epoch": 5.4947253546744275, "percentage": 78.49, "elapsed_time": "2:42:21", "remaining_time": "0:44:29"}
1526
+ {"current_steps": 7560, "total_steps": 9625, "loss": 0.1683, "lr": 5.356830818996621e-06, "epoch": 5.498363041105857, "percentage": 78.55, "elapsed_time": "2:45:20", "remaining_time": "0:45:09"}
1527
+ {"current_steps": 7565, "total_steps": 9625, "loss": 0.1602, "lr": 5.332151069616797e-06, "epoch": 5.502000727537286, "percentage": 78.6, "elapsed_time": "2:48:22", "remaining_time": "0:45:50"}
1528
+ {"current_steps": 7570, "total_steps": 9625, "loss": 0.164, "lr": 5.307519556061276e-06, "epoch": 5.505638413968716, "percentage": 78.65, "elapsed_time": "2:51:20", "remaining_time": "0:46:30"}
1529
+ {"current_steps": 7575, "total_steps": 9625, "loss": 0.1639, "lr": 5.2829363593318075e-06, "epoch": 5.509276100400146, "percentage": 78.7, "elapsed_time": "2:54:22", "remaining_time": "0:47:11"}
1530
+ {"current_steps": 7580, "total_steps": 9625, "loss": 0.1668, "lr": 5.258401560271238e-06, "epoch": 5.512913786831575, "percentage": 78.75, "elapsed_time": "2:57:18", "remaining_time": "0:47:50"}
1531
+ {"current_steps": 7585, "total_steps": 9625, "loss": 0.162, "lr": 5.2339152395632675e-06, "epoch": 5.5165514732630045, "percentage": 78.81, "elapsed_time": "3:00:00", "remaining_time": "0:48:24"}
1532
+ {"current_steps": 7590, "total_steps": 9625, "loss": 0.1609, "lr": 5.209477477732172e-06, "epoch": 5.520189159694434, "percentage": 78.86, "elapsed_time": "3:02:43", "remaining_time": "0:48:59"}
1533
+ {"current_steps": 7595, "total_steps": 9625, "loss": 0.1276, "lr": 5.185088355142529e-06, "epoch": 5.523826846125864, "percentage": 78.91, "elapsed_time": "3:04:41", "remaining_time": "0:49:21"}
1534
+ {"current_steps": 7600, "total_steps": 9625, "loss": 0.1633, "lr": 5.160747951998979e-06, "epoch": 5.5274645325572935, "percentage": 78.96, "elapsed_time": "3:07:38", "remaining_time": "0:49:59"}