penfever commited on
Commit
2665392
·
verified ·
1 Parent(s): 06fc797

Training in progress, step 400

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a3021cbcfec905eeef92a765e70e4724b2934c20c69a29b976e0c2246bb7686
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8777b38cc627bd3fd53b8213b190f3463fcec4259fdb8b35e114d7c67d0506c6
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:460c4e782b026689d673ac7634b3d5566c4eb0985a13dd5c0a40424983e2e0c9
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af3b23343d497c80b25ca147dc7477d352afe1bcb86e1a49d7a98b877f94c9f7
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:64202a4a43f12ebdb7638b7124e99cd43e7e37a2ee3cde7e3299cc6974152e7c
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3849d98fb3fe971af5e4f68b0823e22124e74c213934b15152a017a48dd30b62
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bea38c35d521e505430722083b476df170ef2f45aa2693ab4f63e35c3b903cc5
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc9dd83bf6287481e8c02210a9975f61b4cff8f39b14e4a4b99c262fcb25234a
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -58,3 +58,25 @@
58
  {"current_steps": 290, "total_steps": 3850, "loss": 0.3524, "lr": 3.002597402597403e-05, "epoch": 0.5277525022747953, "percentage": 7.53, "elapsed_time": "1:57:14", "remaining_time": "23:59:15"}
59
  {"current_steps": 295, "total_steps": 3850, "loss": 0.3704, "lr": 3.054545454545455e-05, "epoch": 0.5368516833484986, "percentage": 7.66, "elapsed_time": "1:58:57", "remaining_time": "23:53:30"}
60
  {"current_steps": 300, "total_steps": 3850, "loss": 0.3664, "lr": 3.106493506493507e-05, "epoch": 0.545950864422202, "percentage": 7.79, "elapsed_time": "2:00:50", "remaining_time": "23:49:59"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
58
  {"current_steps": 290, "total_steps": 3850, "loss": 0.3524, "lr": 3.002597402597403e-05, "epoch": 0.5277525022747953, "percentage": 7.53, "elapsed_time": "1:57:14", "remaining_time": "23:59:15"}
59
  {"current_steps": 295, "total_steps": 3850, "loss": 0.3704, "lr": 3.054545454545455e-05, "epoch": 0.5368516833484986, "percentage": 7.66, "elapsed_time": "1:58:57", "remaining_time": "23:53:30"}
60
  {"current_steps": 300, "total_steps": 3850, "loss": 0.3664, "lr": 3.106493506493507e-05, "epoch": 0.545950864422202, "percentage": 7.79, "elapsed_time": "2:00:50", "remaining_time": "23:49:59"}
61
+ {"current_steps": 305, "total_steps": 3850, "loss": 0.3375, "lr": 3.158441558441559e-05, "epoch": 0.5550500454959054, "percentage": 7.92, "elapsed_time": "2:02:49", "remaining_time": "23:47:38"}
62
+ {"current_steps": 310, "total_steps": 3850, "loss": 0.3457, "lr": 3.210389610389611e-05, "epoch": 0.5641492265696088, "percentage": 8.05, "elapsed_time": "2:04:46", "remaining_time": "23:44:51"}
63
+ {"current_steps": 315, "total_steps": 3850, "loss": 0.3473, "lr": 3.2623376623376626e-05, "epoch": 0.5732484076433121, "percentage": 8.18, "elapsed_time": "2:06:40", "remaining_time": "23:41:32"}
64
+ {"current_steps": 320, "total_steps": 3850, "loss": 0.3601, "lr": 3.314285714285715e-05, "epoch": 0.5823475887170154, "percentage": 8.31, "elapsed_time": "2:08:44", "remaining_time": "23:40:07"}
65
+ {"current_steps": 325, "total_steps": 3850, "loss": 0.3288, "lr": 3.366233766233766e-05, "epoch": 0.5914467697907189, "percentage": 8.44, "elapsed_time": "2:10:46", "remaining_time": "23:38:24"}
66
+ {"current_steps": 330, "total_steps": 3850, "loss": 0.3588, "lr": 3.4181818181818185e-05, "epoch": 0.6005459508644222, "percentage": 8.57, "elapsed_time": "2:12:35", "remaining_time": "23:34:14"}
67
+ {"current_steps": 335, "total_steps": 3850, "loss": 0.3542, "lr": 3.47012987012987e-05, "epoch": 0.6096451319381255, "percentage": 8.7, "elapsed_time": "2:14:36", "remaining_time": "23:32:20"}
68
+ {"current_steps": 340, "total_steps": 3850, "loss": 0.3574, "lr": 3.522077922077922e-05, "epoch": 0.618744313011829, "percentage": 8.83, "elapsed_time": "2:16:38", "remaining_time": "23:30:40"}
69
+ {"current_steps": 345, "total_steps": 3850, "loss": 0.3515, "lr": 3.5740259740259743e-05, "epoch": 0.6278434940855323, "percentage": 8.96, "elapsed_time": "2:18:46", "remaining_time": "23:29:53"}
70
+ {"current_steps": 350, "total_steps": 3850, "loss": 0.3246, "lr": 3.625974025974026e-05, "epoch": 0.6369426751592356, "percentage": 9.09, "elapsed_time": "2:20:50", "remaining_time": "23:28:28"}
71
+ {"current_steps": 355, "total_steps": 3850, "loss": 0.3434, "lr": 3.677922077922078e-05, "epoch": 0.6460418562329391, "percentage": 9.22, "elapsed_time": "2:22:58", "remaining_time": "23:27:33"}
72
+ {"current_steps": 360, "total_steps": 3850, "loss": 0.3339, "lr": 3.72987012987013e-05, "epoch": 0.6551410373066424, "percentage": 9.35, "elapsed_time": "2:24:47", "remaining_time": "23:23:40"}
73
+ {"current_steps": 365, "total_steps": 3850, "loss": 0.3445, "lr": 3.7818181818181824e-05, "epoch": 0.6642402183803457, "percentage": 9.48, "elapsed_time": "2:26:56", "remaining_time": "23:22:55"}
74
+ {"current_steps": 370, "total_steps": 3850, "loss": 0.3429, "lr": 3.833766233766234e-05, "epoch": 0.6733393994540491, "percentage": 9.61, "elapsed_time": "2:28:49", "remaining_time": "23:19:48"}
75
+ {"current_steps": 375, "total_steps": 3850, "loss": 0.3363, "lr": 3.885714285714286e-05, "epoch": 0.6824385805277525, "percentage": 9.74, "elapsed_time": "2:30:46", "remaining_time": "23:17:12"}
76
+ {"current_steps": 380, "total_steps": 3850, "loss": 0.3474, "lr": 3.937662337662338e-05, "epoch": 0.6915377616014559, "percentage": 9.87, "elapsed_time": "2:32:38", "remaining_time": "23:13:53"}
77
+ {"current_steps": 385, "total_steps": 3850, "loss": 0.3135, "lr": 3.98961038961039e-05, "epoch": 0.7006369426751592, "percentage": 10.0, "elapsed_time": "2:34:48", "remaining_time": "23:13:19"}
78
+ {"current_steps": 390, "total_steps": 3850, "loss": 0.3455, "lr": 3.999986847364818e-05, "epoch": 0.7097361237488626, "percentage": 10.13, "elapsed_time": "2:36:49", "remaining_time": "23:11:23"}
79
+ {"current_steps": 395, "total_steps": 3850, "loss": 0.3428, "lr": 3.999933415080877e-05, "epoch": 0.718835304822566, "percentage": 10.26, "elapsed_time": "2:38:58", "remaining_time": "23:10:34"}
80
+ {"current_steps": 400, "total_steps": 3850, "loss": 0.3347, "lr": 3.999838882205719e-05, "epoch": 0.7279344858962693, "percentage": 10.39, "elapsed_time": "2:41:02", "remaining_time": "23:08:56"}
81
+ {"current_steps": 405, "total_steps": 3850, "loss": 0.3471, "lr": 3.999703250682087e-05, "epoch": 0.7370336669699727, "percentage": 10.52, "elapsed_time": "2:44:05", "remaining_time": "23:15:49"}
82
+ {"current_steps": 410, "total_steps": 3850, "loss": 0.321, "lr": 3.9995265232973414e-05, "epoch": 0.7461328480436761, "percentage": 10.65, "elapsed_time": "2:46:16", "remaining_time": "23:15:05"}