penfever commited on
Commit
87a8729
·
verified ·
1 Parent(s): 7febd3d

Training in progress, step 7200

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f7a46a7360648b302ad0496bf93b6d3883c74942d028f41e2f50657143073314
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c39c2d24789d65d10f0dfebdf84f843a010e8c08dac8ff2fea274383c9234d0
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1bb33d70743fcb25214de545b3a46fb9e6288d529b974bd563cb20cbff66a685
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a765b5aa61737baf73c915ef982e1df97d2c8016d8f5d515e85a69597083061c
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8dac38a9b4adcb43291642a70a5ef6eb103ddcbf339b577cce72743807483c0
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1add20774d9340611116747bfdec561ebf6496b1ebe60ea91a66d233e073c4cf
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e63b56d38c9ba30bc8ae30cd09cbfcc7e90f6cc5f31636110e5ace74deae0df8
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c986d44f3fcc5c85c4a17f48766386f8f68b2610a10cf631befee7a3cd6ea69
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -1401,3 +1401,43 @@
1401
  {"current_steps": 7005, "total_steps": 9128, "loss": 0.1314, "lr": 6.242851839053132e-06, "epoch": 5.3720751822017645, "percentage": 76.74, "elapsed_time": "1 day, 19:47:20", "remaining_time": "13:16:15"}
1402
  {"current_steps": 7010, "total_steps": 9128, "loss": 0.1332, "lr": 6.2151190992568745e-06, "epoch": 5.375911008822401, "percentage": 76.8, "elapsed_time": "1 day, 19:48:39", "remaining_time": "13:14:13"}
1403
  {"current_steps": 7015, "total_steps": 9128, "loss": 0.1341, "lr": 6.187436759108749e-06, "epoch": 5.379746835443038, "percentage": 76.85, "elapsed_time": "1 day, 19:49:57", "remaining_time": "13:12:10"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1401
  {"current_steps": 7005, "total_steps": 9128, "loss": 0.1314, "lr": 6.242851839053132e-06, "epoch": 5.3720751822017645, "percentage": 76.74, "elapsed_time": "1 day, 19:47:20", "remaining_time": "13:16:15"}
1402
  {"current_steps": 7010, "total_steps": 9128, "loss": 0.1332, "lr": 6.2151190992568745e-06, "epoch": 5.375911008822401, "percentage": 76.8, "elapsed_time": "1 day, 19:48:39", "remaining_time": "13:14:13"}
1403
  {"current_steps": 7015, "total_steps": 9128, "loss": 0.1341, "lr": 6.187436759108749e-06, "epoch": 5.379746835443038, "percentage": 76.85, "elapsed_time": "1 day, 19:49:57", "remaining_time": "13:12:10"}
1404
+ {"current_steps": 7020, "total_steps": 9128, "loss": 0.1196, "lr": 6.159804919819658e-06, "epoch": 5.383582662063675, "percentage": 76.91, "elapsed_time": "1 day, 19:51:13", "remaining_time": "13:10:07"}
1405
+ {"current_steps": 7025, "total_steps": 9128, "loss": 0.1196, "lr": 6.132223682415861e-06, "epoch": 5.387418488684311, "percentage": 76.96, "elapsed_time": "1 day, 19:52:30", "remaining_time": "13:08:03"}
1406
+ {"current_steps": 7030, "total_steps": 9128, "loss": 0.133, "lr": 6.104693147738612e-06, "epoch": 5.391254315304948, "percentage": 77.02, "elapsed_time": "1 day, 19:53:45", "remaining_time": "13:06:00"}
1407
+ {"current_steps": 7035, "total_steps": 9128, "loss": 0.1217, "lr": 6.0772134164437855e-06, "epoch": 5.395090141925585, "percentage": 77.07, "elapsed_time": "1 day, 19:55:01", "remaining_time": "13:03:57"}
1408
+ {"current_steps": 7040, "total_steps": 9128, "loss": 0.1165, "lr": 6.049784589001515e-06, "epoch": 5.398925968546222, "percentage": 77.13, "elapsed_time": "1 day, 19:56:15", "remaining_time": "13:01:53"}
1409
+ {"current_steps": 7045, "total_steps": 9128, "loss": 0.1237, "lr": 6.022406765695816e-06, "epoch": 5.4027617951668585, "percentage": 77.18, "elapsed_time": "1 day, 19:57:32", "remaining_time": "12:59:50"}
1410
+ {"current_steps": 7050, "total_steps": 9128, "loss": 0.1271, "lr": 5.995080046624229e-06, "epoch": 5.406597621787495, "percentage": 77.23, "elapsed_time": "1 day, 19:58:47", "remaining_time": "12:57:47"}
1411
+ {"current_steps": 7055, "total_steps": 9128, "loss": 0.1262, "lr": 5.96780453169745e-06, "epoch": 5.410433448408132, "percentage": 77.29, "elapsed_time": "1 day, 20:00:02", "remaining_time": "12:55:44"}
1412
+ {"current_steps": 7060, "total_steps": 9128, "loss": 0.1189, "lr": 5.940580320638956e-06, "epoch": 5.414269275028769, "percentage": 77.34, "elapsed_time": "1 day, 20:01:17", "remaining_time": "12:53:40"}
1413
+ {"current_steps": 7065, "total_steps": 9128, "loss": 0.1292, "lr": 5.913407512984674e-06, "epoch": 5.418105101649405, "percentage": 77.4, "elapsed_time": "1 day, 20:02:33", "remaining_time": "12:51:38"}
1414
+ {"current_steps": 7070, "total_steps": 9128, "loss": 0.1194, "lr": 5.886286208082559e-06, "epoch": 5.421940928270042, "percentage": 77.45, "elapsed_time": "1 day, 20:03:50", "remaining_time": "12:49:35"}
1415
+ {"current_steps": 7075, "total_steps": 9128, "loss": 0.1261, "lr": 5.859216505092285e-06, "epoch": 5.425776754890679, "percentage": 77.51, "elapsed_time": "1 day, 20:05:04", "remaining_time": "12:47:32"}
1416
+ {"current_steps": 7080, "total_steps": 9128, "loss": 0.1221, "lr": 5.832198502984852e-06, "epoch": 5.429612581511316, "percentage": 77.56, "elapsed_time": "1 day, 20:06:19", "remaining_time": "12:45:29"}
1417
+ {"current_steps": 7085, "total_steps": 9128, "loss": 0.1193, "lr": 5.805232300542245e-06, "epoch": 5.4334484081319525, "percentage": 77.62, "elapsed_time": "1 day, 20:07:33", "remaining_time": "12:43:26"}
1418
+ {"current_steps": 7090, "total_steps": 9128, "loss": 0.1195, "lr": 5.778317996357048e-06, "epoch": 5.437284234752589, "percentage": 77.67, "elapsed_time": "1 day, 20:08:49", "remaining_time": "12:41:23"}
1419
+ {"current_steps": 7095, "total_steps": 9128, "loss": 0.1292, "lr": 5.751455688832108e-06, "epoch": 5.441120061373226, "percentage": 77.73, "elapsed_time": "1 day, 20:10:05", "remaining_time": "12:39:21"}
1420
+ {"current_steps": 7100, "total_steps": 9128, "loss": 0.1214, "lr": 5.724645476180151e-06, "epoch": 5.444955887993863, "percentage": 77.78, "elapsed_time": "1 day, 20:11:20", "remaining_time": "12:37:18"}
1421
+ {"current_steps": 7105, "total_steps": 9128, "loss": 0.1251, "lr": 5.697887456423461e-06, "epoch": 5.448791714614499, "percentage": 77.84, "elapsed_time": "1 day, 20:12:33", "remaining_time": "12:35:15"}
1422
+ {"current_steps": 7110, "total_steps": 9128, "loss": 0.1279, "lr": 5.671181727393467e-06, "epoch": 5.452627541235136, "percentage": 77.89, "elapsed_time": "1 day, 20:13:47", "remaining_time": "12:33:12"}
1423
+ {"current_steps": 7115, "total_steps": 9128, "loss": 0.1254, "lr": 5.644528386730424e-06, "epoch": 5.456463367855773, "percentage": 77.95, "elapsed_time": "1 day, 20:15:03", "remaining_time": "12:31:10"}
1424
+ {"current_steps": 7120, "total_steps": 9128, "loss": 0.1254, "lr": 5.617927531883072e-06, "epoch": 5.460299194476409, "percentage": 78.0, "elapsed_time": "1 day, 20:16:20", "remaining_time": "12:29:08"}
1425
+ {"current_steps": 7125, "total_steps": 9128, "loss": 0.1227, "lr": 5.591379260108214e-06, "epoch": 5.4641350210970465, "percentage": 78.06, "elapsed_time": "1 day, 20:17:35", "remaining_time": "12:27:06"}
1426
+ {"current_steps": 7130, "total_steps": 9128, "loss": 0.1225, "lr": 5.564883668470422e-06, "epoch": 5.467970847717683, "percentage": 78.11, "elapsed_time": "1 day, 20:18:49", "remaining_time": "12:25:04"}
1427
+ {"current_steps": 7135, "total_steps": 9128, "loss": 0.1201, "lr": 5.538440853841682e-06, "epoch": 5.47180667433832, "percentage": 78.17, "elapsed_time": "1 day, 20:20:02", "remaining_time": "12:23:01"}
1428
+ {"current_steps": 7140, "total_steps": 9128, "loss": 0.1338, "lr": 5.512050912900968e-06, "epoch": 5.475642500958957, "percentage": 78.22, "elapsed_time": "1 day, 20:21:17", "remaining_time": "12:20:59"}
1429
+ {"current_steps": 7145, "total_steps": 9128, "loss": 0.132, "lr": 5.485713942133992e-06, "epoch": 5.479478327579593, "percentage": 78.28, "elapsed_time": "1 day, 20:22:37", "remaining_time": "12:18:58"}
1430
+ {"current_steps": 7150, "total_steps": 9128, "loss": 0.1263, "lr": 5.459430037832776e-06, "epoch": 5.48331415420023, "percentage": 78.33, "elapsed_time": "1 day, 20:23:53", "remaining_time": "12:16:56"}
1431
+ {"current_steps": 7155, "total_steps": 9128, "loss": 0.1232, "lr": 5.433199296095302e-06, "epoch": 5.487149980820867, "percentage": 78.39, "elapsed_time": "1 day, 20:25:08", "remaining_time": "12:14:54"}
1432
+ {"current_steps": 7160, "total_steps": 9128, "loss": 0.1193, "lr": 5.40702181282523e-06, "epoch": 5.490985807441504, "percentage": 78.44, "elapsed_time": "1 day, 20:26:21", "remaining_time": "12:12:52"}
1433
+ {"current_steps": 7165, "total_steps": 9128, "loss": 0.1189, "lr": 5.380897683731452e-06, "epoch": 5.4948216340621405, "percentage": 78.49, "elapsed_time": "1 day, 20:27:37", "remaining_time": "12:10:50"}
1434
+ {"current_steps": 7170, "total_steps": 9128, "loss": 0.1232, "lr": 5.354827004327807e-06, "epoch": 5.498657460682777, "percentage": 78.55, "elapsed_time": "1 day, 20:28:52", "remaining_time": "12:08:49"}
1435
+ {"current_steps": 7175, "total_steps": 9128, "loss": 0.1169, "lr": 5.328809869932736e-06, "epoch": 5.502493287303414, "percentage": 78.6, "elapsed_time": "1 day, 20:30:07", "remaining_time": "12:06:47"}
1436
+ {"current_steps": 7180, "total_steps": 9128, "loss": 0.1195, "lr": 5.302846375668864e-06, "epoch": 5.506329113924051, "percentage": 78.66, "elapsed_time": "1 day, 20:31:22", "remaining_time": "12:04:46"}
1437
+ {"current_steps": 7185, "total_steps": 9128, "loss": 0.1293, "lr": 5.276936616462744e-06, "epoch": 5.510164940544687, "percentage": 78.71, "elapsed_time": "1 day, 20:32:37", "remaining_time": "12:02:44"}
1438
+ {"current_steps": 7190, "total_steps": 9128, "loss": 0.1207, "lr": 5.2510806870444476e-06, "epoch": 5.514000767165324, "percentage": 78.77, "elapsed_time": "1 day, 20:33:52", "remaining_time": "12:00:43"}
1439
+ {"current_steps": 7195, "total_steps": 9128, "loss": 0.1181, "lr": 5.225278681947219e-06, "epoch": 5.517836593785961, "percentage": 78.82, "elapsed_time": "1 day, 20:35:08", "remaining_time": "11:58:41"}
1440
+ {"current_steps": 7200, "total_steps": 9128, "loss": 0.1213, "lr": 5.19953069550718e-06, "epoch": 5.521672420406597, "percentage": 78.88, "elapsed_time": "1 day, 20:36:33", "remaining_time": "11:56:43"}
1441
+ {"current_steps": 7205, "total_steps": 9128, "loss": 0.1088, "lr": 5.173836821862937e-06, "epoch": 5.5255082470272345, "percentage": 78.93, "elapsed_time": "1 day, 20:39:10", "remaining_time": "11:55:04"}
1442
+ {"current_steps": 7210, "total_steps": 9128, "loss": 0.1216, "lr": 5.14819715495523e-06, "epoch": 5.529344073647871, "percentage": 78.99, "elapsed_time": "1 day, 20:40:25", "remaining_time": "11:53:02"}
1443
+ {"current_steps": 7215, "total_steps": 9128, "loss": 0.1176, "lr": 5.12261178852665e-06, "epoch": 5.533179900268507, "percentage": 79.04, "elapsed_time": "1 day, 20:41:41", "remaining_time": "11:51:01"}