3N3G committed on
Commit
fb9d75c
·
verified ·
1 Parent(s): b0c47d4

Training in progress, step 368

Browse files
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:096439a15e0b06aee20e3753c9fc04b16d480adc998310ef78cc635894ce0439
3
  size 4969539560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ceb02694688565e3a16da06ce91c5e882db4d780d31df5f10c2dea997b2c3ca
3
  size 4969539560
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:baf6e5b35338a330f50e7e5f5405f807ca31d11aeffe1893d6a171ddc95e8f71
3
  size 1912795688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6db59088a0fb0851b5830cd0eb2bea70eda5332580952aa7bc75acee5ac2887e
3
  size 1912795688
trainer_log.jsonl CHANGED
@@ -866,3 +866,20 @@
866
  {"current_steps": 367, "total_steps": 400, "loss": 0.6327, "lr": 1.1966285981663406e-08, "epoch": 91.87272727272727, "percentage": 91.75, "elapsed_time": "0:44:39", "remaining_time": "0:04:00"}
867
  {"current_steps": 368, "total_steps": 400, "loss": 0.6545, "lr": 1.1853111930931313e-08, "epoch": 92.0, "percentage": 92.0, "elapsed_time": "0:44:42", "remaining_time": "0:03:53"}
868
  {"current_steps": 368, "total_steps": 400, "eval_loss": 0.6371535062789917, "epoch": 92.0, "percentage": 92.0, "elapsed_time": "0:44:43", "remaining_time": "0:03:53"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
866
  {"current_steps": 367, "total_steps": 400, "loss": 0.6327, "lr": 1.1966285981663406e-08, "epoch": 91.87272727272727, "percentage": 91.75, "elapsed_time": "0:44:39", "remaining_time": "0:04:00"}
867
  {"current_steps": 368, "total_steps": 400, "loss": 0.6545, "lr": 1.1853111930931313e-08, "epoch": 92.0, "percentage": 92.0, "elapsed_time": "0:44:42", "remaining_time": "0:03:53"}
868
  {"current_steps": 368, "total_steps": 400, "eval_loss": 0.6371535062789917, "epoch": 92.0, "percentage": 92.0, "elapsed_time": "0:44:43", "remaining_time": "0:03:53"}
869
+ {"current_steps": 369, "total_steps": 400, "loss": 0.5913, "lr": 1.174322368277565e-08, "epoch": 92.2909090909091, "percentage": 92.25, "elapsed_time": "0:45:15", "remaining_time": "0:03:48"}
870
+ {"current_steps": 370, "total_steps": 400, "loss": 0.6869, "lr": 1.1636629605611967e-08, "epoch": 92.58181818181818, "percentage": 92.5, "elapsed_time": "0:45:22", "remaining_time": "0:03:40"}
871
+ {"current_steps": 371, "total_steps": 400, "loss": 0.6699, "lr": 1.1533337816991931e-08, "epoch": 92.87272727272727, "percentage": 92.75, "elapsed_time": "0:45:29", "remaining_time": "0:03:33"}
872
+ {"current_steps": 372, "total_steps": 400, "loss": 0.658, "lr": 1.1433356182985158e-08, "epoch": 93.0, "percentage": 93.0, "elapsed_time": "0:45:32", "remaining_time": "0:03:25"}
873
+ {"current_steps": 373, "total_steps": 400, "loss": 0.7064, "lr": 1.133669231758016e-08, "epoch": 93.2909090909091, "percentage": 93.25, "elapsed_time": "0:45:40", "remaining_time": "0:03:18"}
874
+ {"current_steps": 374, "total_steps": 400, "loss": 0.6268, "lr": 1.1243353582104555e-08, "epoch": 93.58181818181818, "percentage": 93.5, "elapsed_time": "0:45:46", "remaining_time": "0:03:10"}
875
+ {"current_steps": 375, "total_steps": 400, "loss": 0.6366, "lr": 1.115334708466442e-08, "epoch": 93.87272727272727, "percentage": 93.75, "elapsed_time": "0:45:53", "remaining_time": "0:03:03"}
876
+ {"current_steps": 376, "total_steps": 400, "loss": 0.5847, "lr": 1.1066679679602998e-08, "epoch": 94.0, "percentage": 94.0, "elapsed_time": "0:45:56", "remaining_time": "0:02:55"}
877
+ {"current_steps": 377, "total_steps": 400, "loss": 0.6578, "lr": 1.0983357966978745e-08, "epoch": 94.2909090909091, "percentage": 94.25, "elapsed_time": "0:46:03", "remaining_time": "0:02:48"}
878
+ {"current_steps": 378, "total_steps": 400, "loss": 0.6523, "lr": 1.0903388292062667e-08, "epoch": 94.58181818181818, "percentage": 94.5, "elapsed_time": "0:46:10", "remaining_time": "0:02:41"}
879
+ {"current_steps": 379, "total_steps": 400, "loss": 0.6582, "lr": 1.0826776744855121e-08, "epoch": 94.87272727272727, "percentage": 94.75, "elapsed_time": "0:46:17", "remaining_time": "0:02:33"}
880
+ {"current_steps": 380, "total_steps": 400, "loss": 0.6047, "lr": 1.0753529159622047e-08, "epoch": 95.0, "percentage": 95.0, "elapsed_time": "0:46:20", "remaining_time": "0:02:26"}
881
+ {"current_steps": 381, "total_steps": 400, "loss": 0.6078, "lr": 1.068365111445064e-08, "epoch": 95.2909090909091, "percentage": 95.25, "elapsed_time": "0:46:26", "remaining_time": "0:02:18"}
882
+ {"current_steps": 382, "total_steps": 400, "loss": 0.6347, "lr": 1.0617147930824585e-08, "epoch": 95.58181818181818, "percentage": 95.5, "elapsed_time": "0:46:34", "remaining_time": "0:02:11"}
883
+ {"current_steps": 383, "total_steps": 400, "loss": 0.6709, "lr": 1.0554024673218806e-08, "epoch": 95.87272727272727, "percentage": 95.75, "elapsed_time": "0:46:40", "remaining_time": "0:02:04"}
884
+ {"current_steps": 384, "total_steps": 400, "loss": 0.7126, "lr": 1.0494286148713743e-08, "epoch": 96.0, "percentage": 96.0, "elapsed_time": "0:46:43", "remaining_time": "0:01:56"}
885
+ {"current_steps": 384, "total_steps": 400, "eval_loss": 0.6363654732704163, "epoch": 96.0, "percentage": 96.0, "elapsed_time": "0:46:44", "remaining_time": "0:01:56"}