esfrankel17 commited on
Commit
a9b718f
·
verified ·
1 Parent(s): 0dde0bd

Training in progress, epoch 3

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dd8375c299cd303703eaa82d93dcb12a6166fddebeb767b6ed8e68b804d4f58d
3
  size 4976698672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9424903c8e1d977cafd776f2fb3c8f3c710ccd6f5df363f351b6d4d0ca456ae6
3
  size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:703e26711abc4d6ac566e22495ef15af12b8d04ba3730483ab905e16895ee6d0
3
  size 4999802720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba3b49b61df03a4e5f87786a7a4854c8eeccc9beefb750142179c7667726d3fd
3
  size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:31cb0c129728363d39cdbb9a62d99bdb872cc6d0fa532fd642944fcf2ab51f85
3
  size 4915916176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50c885824fd3f29de6f6912f35cbed63d712b19861e629ddb399f7187de8aa0c
3
  size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1632dbea5cfca5ad2d186b81bbcb0d471d4d772744c2396d600160ba8742fdc0
3
  size 1168138808
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec10705282830f55d566bfd8a90775e1d07fff661806d754bfbd1a19605e80c8
3
  size 1168138808
trainer_log.jsonl CHANGED
@@ -4,3 +4,7 @@
4
  {"current_steps": 30, "total_steps": 69, "loss": 0.9035, "learning_rate": 5e-06, "epoch": 1.3043478260869565, "percentage": 43.48, "elapsed_time": "2:17:38", "remaining_time": "2:58:56"}
5
  {"current_steps": 40, "total_steps": 69, "loss": 0.8651, "learning_rate": 5e-06, "epoch": 1.7391304347826086, "percentage": 57.97, "elapsed_time": "3:02:47", "remaining_time": "2:12:31"}
6
  {"current_steps": 46, "total_steps": 69, "eval_loss": 0.889980673789978, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "3:30:48", "remaining_time": "1:45:24"}
 
 
 
 
 
4
  {"current_steps": 30, "total_steps": 69, "loss": 0.9035, "learning_rate": 5e-06, "epoch": 1.3043478260869565, "percentage": 43.48, "elapsed_time": "2:17:38", "remaining_time": "2:58:56"}
5
  {"current_steps": 40, "total_steps": 69, "loss": 0.8651, "learning_rate": 5e-06, "epoch": 1.7391304347826086, "percentage": 57.97, "elapsed_time": "3:02:47", "remaining_time": "2:12:31"}
6
  {"current_steps": 46, "total_steps": 69, "eval_loss": 0.889980673789978, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "3:30:48", "remaining_time": "1:45:24"}
7
+ {"current_steps": 50, "total_steps": 69, "loss": 0.8334, "learning_rate": 5e-06, "epoch": 2.1739130434782608, "percentage": 72.46, "elapsed_time": "3:50:06", "remaining_time": "1:27:26"}
8
+ {"current_steps": 60, "total_steps": 69, "loss": 0.7988, "learning_rate": 5e-06, "epoch": 2.608695652173913, "percentage": 86.96, "elapsed_time": "4:35:14", "remaining_time": "0:41:17"}
9
+ {"current_steps": 69, "total_steps": 69, "eval_loss": 0.8782235980033875, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "5:17:58", "remaining_time": "0:00:00"}
10
+ {"current_steps": 69, "total_steps": 69, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "5:18:43", "remaining_time": "0:00:00"}