3N3G commited on
Commit
6f330d3
·
verified ·
1 Parent(s): 4395a23

Training in progress, step 224

Browse files
model-00001-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:50a7626c3332382c720b25d7028428e6e693206a85b1d278123f350e6447c549
3
  size 4969539560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f766264a80af3c2e0386eedf3905edbf56634837a038ce95c6038d7405eedfe
3
  size 4969539560
model-00002-of-00002.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:674ac2c674747082527a37e7013363c3374ff004d5b78edf91c3585792370cd4
3
  size 1912795688
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6e24e7e534a14d518b12200bfaba3ba2cedbbafce9b0fbda9c2aca6057ce604
3
  size 1912795688
trainer_log.jsonl CHANGED
@@ -713,3 +713,20 @@
713
  {"current_steps": 223, "total_steps": 400, "loss": 0.6684, "lr": 5.421464171032224e-08, "epoch": 55.872727272727275, "percentage": 55.75, "elapsed_time": "0:27:00", "remaining_time": "0:21:25"}
714
  {"current_steps": 224, "total_steps": 400, "loss": 0.7467, "lr": 5.382203732614572e-08, "epoch": 56.0, "percentage": 56.0, "elapsed_time": "0:27:02", "remaining_time": "0:21:15"}
715
  {"current_steps": 224, "total_steps": 400, "eval_loss": 0.6532977819442749, "epoch": 56.0, "percentage": 56.0, "elapsed_time": "0:27:03", "remaining_time": "0:21:15"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
713
  {"current_steps": 223, "total_steps": 400, "loss": 0.6684, "lr": 5.421464171032224e-08, "epoch": 55.872727272727275, "percentage": 55.75, "elapsed_time": "0:27:00", "remaining_time": "0:21:25"}
714
  {"current_steps": 224, "total_steps": 400, "loss": 0.7467, "lr": 5.382203732614572e-08, "epoch": 56.0, "percentage": 56.0, "elapsed_time": "0:27:02", "remaining_time": "0:21:15"}
715
  {"current_steps": 224, "total_steps": 400, "eval_loss": 0.6532977819442749, "epoch": 56.0, "percentage": 56.0, "elapsed_time": "0:27:03", "remaining_time": "0:21:15"}
716
+ {"current_steps": 225, "total_steps": 400, "loss": 0.7395, "lr": 5.342952264838747e-08, "epoch": 56.29090909090909, "percentage": 56.25, "elapsed_time": "0:27:35", "remaining_time": "0:21:27"}
717
+ {"current_steps": 226, "total_steps": 400, "loss": 0.7176, "lr": 5.303712756855988e-08, "epoch": 56.58181818181818, "percentage": 56.5, "elapsed_time": "0:27:42", "remaining_time": "0:21:19"}
718
+ {"current_steps": 227, "total_steps": 400, "loss": 0.5565, "lr": 5.264488196906752e-08, "epoch": 56.872727272727275, "percentage": 56.75, "elapsed_time": "0:27:49", "remaining_time": "0:21:12"}
719
+ {"current_steps": 228, "total_steps": 400, "loss": 0.7052, "lr": 5.225281572093143e-08, "epoch": 57.0, "percentage": 57.0, "elapsed_time": "0:27:52", "remaining_time": "0:21:01"}
720
+ {"current_steps": 229, "total_steps": 400, "loss": 0.6931, "lr": 5.1860958681514355e-08, "epoch": 57.29090909090909, "percentage": 57.25, "elapsed_time": "0:27:59", "remaining_time": "0:20:53"}
721
+ {"current_steps": 230, "total_steps": 400, "loss": 0.6126, "lr": 5.1469340692246985e-08, "epoch": 57.58181818181818, "percentage": 57.5, "elapsed_time": "0:28:06", "remaining_time": "0:20:46"}
722
+ {"current_steps": 231, "total_steps": 400, "loss": 0.7149, "lr": 5.107799157635537e-08, "epoch": 57.872727272727275, "percentage": 57.75, "elapsed_time": "0:28:12", "remaining_time": "0:20:38"}
723
+ {"current_steps": 232, "total_steps": 400, "loss": 0.6564, "lr": 5.068694113658992e-08, "epoch": 58.0, "percentage": 58.0, "elapsed_time": "0:28:16", "remaining_time": "0:20:28"}
724
+ {"current_steps": 233, "total_steps": 400, "loss": 0.6657, "lr": 5.02962191529556e-08, "epoch": 58.29090909090909, "percentage": 58.25, "elapsed_time": "0:28:22", "remaining_time": "0:20:20"}
725
+ {"current_steps": 234, "total_steps": 400, "loss": 0.7461, "lr": 4.9905855380444194e-08, "epoch": 58.58181818181818, "percentage": 58.5, "elapsed_time": "0:28:29", "remaining_time": "0:20:13"}
726
+ {"current_steps": 235, "total_steps": 400, "loss": 0.5924, "lr": 4.9515879546768366e-08, "epoch": 58.872727272727275, "percentage": 58.75, "elapsed_time": "0:28:36", "remaining_time": "0:20:05"}
727
+ {"current_steps": 236, "total_steps": 400, "loss": 0.6793, "lr": 4.912632135009769e-08, "epoch": 59.0, "percentage": 59.0, "elapsed_time": "0:28:39", "remaining_time": "0:19:55"}
728
+ {"current_steps": 237, "total_steps": 400, "loss": 0.6648, "lr": 4.873721045679706e-08, "epoch": 59.29090909090909, "percentage": 59.25, "elapsed_time": "0:28:46", "remaining_time": "0:19:47"}
729
+ {"current_steps": 238, "total_steps": 400, "loss": 0.6871, "lr": 4.8348576499167516e-08, "epoch": 59.58181818181818, "percentage": 59.5, "elapsed_time": "0:28:54", "remaining_time": "0:19:40"}
730
+ {"current_steps": 239, "total_steps": 400, "loss": 0.6136, "lr": 4.7960449073189604e-08, "epoch": 59.872727272727275, "percentage": 59.75, "elapsed_time": "0:29:00", "remaining_time": "0:19:32"}
731
+ {"current_steps": 240, "total_steps": 400, "loss": 0.7364, "lr": 4.75728577362695e-08, "epoch": 60.0, "percentage": 60.0, "elapsed_time": "0:29:03", "remaining_time": "0:19:22"}
732
+ {"current_steps": 240, "total_steps": 400, "eval_loss": 0.6488688588142395, "epoch": 60.0, "percentage": 60.0, "elapsed_time": "0:29:04", "remaining_time": "0:19:22"}