penfever commited on
Commit
fe1bfe4
·
verified ·
1 Parent(s): 7ec2d4b

Training in progress, step 2400

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a404183474528b6bcd927c3999a1502fb5122d0318664fea83cbe695f236f3d
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b9f6976626ee793388b3c152c52a7f85152c9b758be988ace11b51341b12740
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af6099e253e716e86128aa33d9f1b9483352e37ad2d31697dc4548d67cafa75f
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba91d5c2836f44d84c61c34be3bfe7a1738d833f6e5b60da4c9ed0b8afcd1e04
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:81e80bcad604e4cfe5795cb677e667e7e5e816890ef31cf5b9ef9632cec2d141
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c93c68bc389a6a48442592e60e4dbeceea73ff32fb976591cbc1c94e02655672
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:29292b100cc2ee2457bc0dc61596ce1ac9e30c27c16af163764002e7d3958179
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8173e150f6a9f91c231ba85abc04eedc0e4b84b0eb31430974c8034e15430d9
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -438,3 +438,43 @@
438
  {"current_steps": 2190, "total_steps": 3850, "loss": 0.2209, "lr": 1.8704377614196963e-05, "epoch": 3.9827115559599635, "percentage": 56.88, "elapsed_time": "14:39:39", "remaining_time": "11:06:46"}
439
  {"current_steps": 2195, "total_steps": 3850, "loss": 0.2489, "lr": 1.8613915227736584e-05, "epoch": 3.991810737033667, "percentage": 57.01, "elapsed_time": "14:41:37", "remaining_time": "11:04:43"}
440
  {"current_steps": 2200, "total_steps": 3850, "loss": 0.2441, "lr": 1.852348132667635e-05, "epoch": 4.0, "percentage": 57.14, "elapsed_time": "14:43:07", "remaining_time": "11:02:20"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
438
  {"current_steps": 2190, "total_steps": 3850, "loss": 0.2209, "lr": 1.8704377614196963e-05, "epoch": 3.9827115559599635, "percentage": 56.88, "elapsed_time": "14:39:39", "remaining_time": "11:06:46"}
439
  {"current_steps": 2195, "total_steps": 3850, "loss": 0.2489, "lr": 1.8613915227736584e-05, "epoch": 3.991810737033667, "percentage": 57.01, "elapsed_time": "14:41:37", "remaining_time": "11:04:43"}
440
  {"current_steps": 2200, "total_steps": 3850, "loss": 0.2441, "lr": 1.852348132667635e-05, "epoch": 4.0, "percentage": 57.14, "elapsed_time": "14:43:07", "remaining_time": "11:02:20"}
441
+ {"current_steps": 2205, "total_steps": 3850, "loss": 0.2054, "lr": 1.843307776952155e-05, "epoch": 4.0090991810737036, "percentage": 57.27, "elapsed_time": "14:46:24", "remaining_time": "11:01:17"}
442
+ {"current_steps": 2210, "total_steps": 3850, "loss": 0.2276, "lr": 1.834270641415386e-05, "epoch": 4.018198362147407, "percentage": 57.4, "elapsed_time": "14:48:16", "remaining_time": "10:59:10"}
443
+ {"current_steps": 2215, "total_steps": 3850, "loss": 0.2078, "lr": 1.8252369117793172e-05, "epoch": 4.02729754322111, "percentage": 57.53, "elapsed_time": "14:50:07", "remaining_time": "10:57:03"}
444
+ {"current_steps": 2220, "total_steps": 3850, "loss": 0.2153, "lr": 1.8162067736959454e-05, "epoch": 4.036396724294813, "percentage": 57.66, "elapsed_time": "14:51:56", "remaining_time": "10:54:53"}
445
+ {"current_steps": 2225, "total_steps": 3850, "loss": 0.2098, "lr": 1.8071804127434545e-05, "epoch": 4.045495905368517, "percentage": 57.79, "elapsed_time": "14:53:49", "remaining_time": "10:52:47"}
446
+ {"current_steps": 2230, "total_steps": 3850, "loss": 0.2029, "lr": 1.7981580144224066e-05, "epoch": 4.05459508644222, "percentage": 57.92, "elapsed_time": "14:55:44", "remaining_time": "10:50:43"}
447
+ {"current_steps": 2235, "total_steps": 3850, "loss": 0.1952, "lr": 1.7891397641519272e-05, "epoch": 4.063694267515924, "percentage": 58.05, "elapsed_time": "14:57:53", "remaining_time": "10:48:48"}
448
+ {"current_steps": 2240, "total_steps": 3850, "loss": 0.2011, "lr": 1.7801258472658964e-05, "epoch": 4.072793448589627, "percentage": 58.18, "elapsed_time": "14:59:51", "remaining_time": "10:46:46"}
449
+ {"current_steps": 2245, "total_steps": 3850, "loss": 0.2032, "lr": 1.7711164490091365e-05, "epoch": 4.08189262966333, "percentage": 58.31, "elapsed_time": "15:01:34", "remaining_time": "10:44:33"}
450
+ {"current_steps": 2250, "total_steps": 3850, "loss": 0.2079, "lr": 1.7621117545336098e-05, "epoch": 4.090991810737034, "percentage": 58.44, "elapsed_time": "15:03:42", "remaining_time": "10:42:38"}
451
+ {"current_steps": 2255, "total_steps": 3850, "loss": 0.2149, "lr": 1.7531119488946107e-05, "epoch": 4.100090991810737, "percentage": 58.57, "elapsed_time": "15:05:47", "remaining_time": "10:40:41"}
452
+ {"current_steps": 2260, "total_steps": 3850, "loss": 0.208, "lr": 1.7441172170469634e-05, "epoch": 4.10919017288444, "percentage": 58.7, "elapsed_time": "15:07:45", "remaining_time": "10:38:38"}
453
+ {"current_steps": 2265, "total_steps": 3850, "loss": 0.2117, "lr": 1.7351277438412197e-05, "epoch": 4.1182893539581436, "percentage": 58.83, "elapsed_time": "15:09:38", "remaining_time": "10:36:32"}
454
+ {"current_steps": 2270, "total_steps": 3850, "loss": 0.2098, "lr": 1.726143714019862e-05, "epoch": 4.127388535031847, "percentage": 58.96, "elapsed_time": "15:11:32", "remaining_time": "10:34:27"}
455
+ {"current_steps": 2275, "total_steps": 3850, "loss": 0.2144, "lr": 1.7171653122135065e-05, "epoch": 4.136487716105551, "percentage": 59.09, "elapsed_time": "15:13:25", "remaining_time": "10:32:22"}
456
+ {"current_steps": 2280, "total_steps": 3850, "loss": 0.2024, "lr": 1.708192722937106e-05, "epoch": 4.145586897179254, "percentage": 59.22, "elapsed_time": "15:15:16", "remaining_time": "10:30:15"}
457
+ {"current_steps": 2285, "total_steps": 3850, "loss": 0.2041, "lr": 1.6992261305861635e-05, "epoch": 4.154686078252957, "percentage": 59.35, "elapsed_time": "15:17:15", "remaining_time": "10:28:13"}
458
+ {"current_steps": 2290, "total_steps": 3850, "loss": 0.2016, "lr": 1.6902657194329357e-05, "epoch": 4.16378525932666, "percentage": 59.48, "elapsed_time": "15:19:15", "remaining_time": "10:26:12"}
459
+ {"current_steps": 2295, "total_steps": 3850, "loss": 0.2046, "lr": 1.681311673622651e-05, "epoch": 4.172884440400364, "percentage": 59.61, "elapsed_time": "15:21:27", "remaining_time": "10:24:20"}
460
+ {"current_steps": 2300, "total_steps": 3850, "loss": 0.2067, "lr": 1.6723641771697246e-05, "epoch": 4.1819836214740675, "percentage": 59.74, "elapsed_time": "15:23:31", "remaining_time": "10:22:22"}
461
+ {"current_steps": 2305, "total_steps": 3850, "loss": 0.2171, "lr": 1.663423413953976e-05, "epoch": 4.191082802547771, "percentage": 59.87, "elapsed_time": "15:25:38", "remaining_time": "10:20:26"}
462
+ {"current_steps": 2310, "total_steps": 3850, "loss": 0.2097, "lr": 1.6544895677168483e-05, "epoch": 4.200181983621474, "percentage": 60.0, "elapsed_time": "15:27:35", "remaining_time": "10:18:23"}
463
+ {"current_steps": 2315, "total_steps": 3850, "loss": 0.2176, "lr": 1.6455628220576357e-05, "epoch": 4.209281164695177, "percentage": 60.13, "elapsed_time": "15:29:22", "remaining_time": "10:16:14"}
464
+ {"current_steps": 2320, "total_steps": 3850, "loss": 0.2042, "lr": 1.6366433604297072e-05, "epoch": 4.218380345768881, "percentage": 60.26, "elapsed_time": "15:31:16", "remaining_time": "10:14:09"}
465
+ {"current_steps": 2325, "total_steps": 3850, "loss": 0.2183, "lr": 1.62773136613674e-05, "epoch": 4.227479526842584, "percentage": 60.39, "elapsed_time": "15:33:15", "remaining_time": "10:12:08"}
466
+ {"current_steps": 2330, "total_steps": 3850, "loss": 0.2024, "lr": 1.6188270223289483e-05, "epoch": 4.236578707916287, "percentage": 60.52, "elapsed_time": "15:35:12", "remaining_time": "10:10:05"}
467
+ {"current_steps": 2335, "total_steps": 3850, "loss": 0.2008, "lr": 1.609930511999321e-05, "epoch": 4.245677888989991, "percentage": 60.65, "elapsed_time": "15:37:32", "remaining_time": "10:08:18"}
468
+ {"current_steps": 2340, "total_steps": 3850, "loss": 0.2221, "lr": 1.6010420179798623e-05, "epoch": 4.254777070063694, "percentage": 60.78, "elapsed_time": "15:39:34", "remaining_time": "10:06:18"}
469
+ {"current_steps": 2345, "total_steps": 3850, "loss": 0.2113, "lr": 1.5921617229378338e-05, "epoch": 4.263876251137398, "percentage": 60.91, "elapsed_time": "15:41:26", "remaining_time": "10:04:12"}
470
+ {"current_steps": 2350, "total_steps": 3850, "loss": 0.2147, "lr": 1.583289809372e-05, "epoch": 4.272975432211101, "percentage": 61.04, "elapsed_time": "15:43:31", "remaining_time": "10:02:14"}
471
+ {"current_steps": 2355, "total_steps": 3850, "loss": 0.2127, "lr": 1.5744264596088763e-05, "epoch": 4.282074613284804, "percentage": 61.17, "elapsed_time": "15:45:13", "remaining_time": "10:00:02"}
472
+ {"current_steps": 2360, "total_steps": 3850, "loss": 0.2081, "lr": 1.5655718557989848e-05, "epoch": 4.2911737943585075, "percentage": 61.3, "elapsed_time": "15:47:15", "remaining_time": "9:58:03"}
473
+ {"current_steps": 2365, "total_steps": 3850, "loss": 0.2041, "lr": 1.5567261799131102e-05, "epoch": 4.300272975432211, "percentage": 61.43, "elapsed_time": "15:49:25", "remaining_time": "9:56:08"}
474
+ {"current_steps": 2370, "total_steps": 3850, "loss": 0.2046, "lr": 1.5478896137385584e-05, "epoch": 4.309372156505915, "percentage": 61.56, "elapsed_time": "15:51:20", "remaining_time": "9:54:05"}
475
+ {"current_steps": 2375, "total_steps": 3850, "loss": 0.2171, "lr": 1.5390623388754232e-05, "epoch": 4.318471337579618, "percentage": 61.69, "elapsed_time": "15:53:13", "remaining_time": "9:52:00"}
476
+ {"current_steps": 2380, "total_steps": 3850, "loss": 0.2065, "lr": 1.5302445367328507e-05, "epoch": 4.327570518653321, "percentage": 61.82, "elapsed_time": "15:55:13", "remaining_time": "9:49:59"}
477
+ {"current_steps": 2385, "total_steps": 3850, "loss": 0.2029, "lr": 1.5214363885253156e-05, "epoch": 4.336669699727024, "percentage": 61.95, "elapsed_time": "15:57:09", "remaining_time": "9:47:56"}
478
+ {"current_steps": 2390, "total_steps": 3850, "loss": 0.2029, "lr": 1.5126380752688934e-05, "epoch": 4.345768880800728, "percentage": 62.08, "elapsed_time": "15:59:07", "remaining_time": "9:45:54"}
479
+ {"current_steps": 2395, "total_steps": 3850, "loss": 0.2009, "lr": 1.503849777777543e-05, "epoch": 4.3548680618744315, "percentage": 62.21, "elapsed_time": "16:01:10", "remaining_time": "9:43:55"}
480
+ {"current_steps": 2400, "total_steps": 3850, "loss": 0.2047, "lr": 1.4950716766593872e-05, "epoch": 4.363967242948135, "percentage": 62.34, "elapsed_time": "16:03:11", "remaining_time": "9:41:55"}