ryanmarten commited on
Commit
c3e3d07
·
verified ·
1 Parent(s): 05c265f

Training in progress, epoch 7

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2564c606514d795b9e64b4eedb55beb3ed5308579459e43049f59c9e0c31a0f7
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fc774e3f493ff6199a3bc1b1d7a5656a6f3447363ae0a8b33699a172c007628d
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae2b6e0c992f2feefd461738f0a518dd6450a8153e0ccaf39f7034c14114d558
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a13661ab0ee7c29184497b16df1a50f794688cf70b55f55a833ec217b5337b76
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:56b3d45c3a8393a016b32ac20e6cb57d3839532897a1c81a4b822f267508f223
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c60cdfdbef6d8bf886d2eac1980022746cc6ecaf4af64c4054328e400f16619b
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2903a97c9925a90ea89ea9acabcaf67dbea2da237b495c940c03ebda7e183597
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f8a26cf366c04e0fd7425ec6813d4bd66a8ace121e4dc1cac7523cbc09d1188b
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -65,3 +65,22 @@
65
  {"current_steps": 65, "total_steps": 117, "loss": 0.2782, "lr": 4.9252029649236835e-06, "epoch": 6.810126582278481, "percentage": 55.56, "elapsed_time": "0:31:34", "remaining_time": "0:25:15"}
66
  {"current_steps": 66, "total_steps": 117, "loss": 0.2408, "lr": 4.775675848247427e-06, "epoch": 6.911392405063291, "percentage": 56.41, "elapsed_time": "0:32:01", "remaining_time": "0:24:44"}
67
  {"current_steps": 67, "total_steps": 117, "loss": 0.2107, "lr": 4.626349532067879e-06, "epoch": 7.050632911392405, "percentage": 57.26, "elapsed_time": "0:33:17", "remaining_time": "0:24:50"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
65
  {"current_steps": 65, "total_steps": 117, "loss": 0.2782, "lr": 4.9252029649236835e-06, "epoch": 6.810126582278481, "percentage": 55.56, "elapsed_time": "0:31:34", "remaining_time": "0:25:15"}
66
  {"current_steps": 66, "total_steps": 117, "loss": 0.2408, "lr": 4.775675848247427e-06, "epoch": 6.911392405063291, "percentage": 56.41, "elapsed_time": "0:32:01", "remaining_time": "0:24:44"}
67
  {"current_steps": 67, "total_steps": 117, "loss": 0.2107, "lr": 4.626349532067879e-06, "epoch": 7.050632911392405, "percentage": 57.26, "elapsed_time": "0:33:17", "remaining_time": "0:24:50"}
68
+ {"current_steps": 68, "total_steps": 117, "loss": 0.2229, "lr": 4.477357683661734e-06, "epoch": 7.151898734177215, "percentage": 58.12, "elapsed_time": "0:33:37", "remaining_time": "0:24:13"}
69
+ {"current_steps": 69, "total_steps": 117, "loss": 0.1277, "lr": 4.3288336709117246e-06, "epoch": 7.253164556962025, "percentage": 58.97, "elapsed_time": "0:33:57", "remaining_time": "0:23:37"}
70
+ {"current_steps": 70, "total_steps": 117, "loss": 0.2897, "lr": 4.180910442924312e-06, "epoch": 7.3544303797468356, "percentage": 59.83, "elapsed_time": "0:34:27", "remaining_time": "0:23:08"}
71
+ {"current_steps": 71, "total_steps": 117, "loss": 0.2406, "lr": 4.033720411022235e-06, "epoch": 7.455696202531645, "percentage": 60.68, "elapsed_time": "0:34:54", "remaining_time": "0:22:36"}
72
+ {"current_steps": 72, "total_steps": 117, "loss": 0.1761, "lr": 3.887395330218429e-06, "epoch": 7.556962025316456, "percentage": 61.54, "elapsed_time": "0:35:20", "remaining_time": "0:22:05"}
73
+ {"current_steps": 73, "total_steps": 117, "loss": 0.1929, "lr": 3.7420661812774577e-06, "epoch": 7.658227848101266, "percentage": 62.39, "elapsed_time": "0:35:43", "remaining_time": "0:21:31"}
74
+ {"current_steps": 74, "total_steps": 117, "loss": 0.1819, "lr": 3.5978630534699873e-06, "epoch": 7.759493670886076, "percentage": 63.25, "elapsed_time": "0:36:03", "remaining_time": "0:20:57"}
75
+ {"current_steps": 75, "total_steps": 117, "loss": 0.2077, "lr": 3.4549150281252635e-06, "epoch": 7.860759493670886, "percentage": 64.1, "elapsed_time": "0:36:32", "remaining_time": "0:20:27"}
76
+ {"current_steps": 76, "total_steps": 117, "loss": 0.1836, "lr": 3.3133500630858507e-06, "epoch": 7.962025316455696, "percentage": 64.96, "elapsed_time": "0:36:54", "remaining_time": "0:19:54"}
77
+ {"current_steps": 77, "total_steps": 117, "loss": 0.1977, "lr": 3.173294878168025e-06, "epoch": 8.10126582278481, "percentage": 65.81, "elapsed_time": "0:38:28", "remaining_time": "0:19:59"}
78
+ {"current_steps": 78, "total_steps": 117, "loss": 0.158, "lr": 3.0348748417303826e-06, "epoch": 8.20253164556962, "percentage": 66.67, "elapsed_time": "0:38:52", "remaining_time": "0:19:26"}
79
+ {"current_steps": 79, "total_steps": 117, "loss": 0.1434, "lr": 2.8982138584521734e-06, "epoch": 8.30379746835443, "percentage": 67.52, "elapsed_time": "0:39:14", "remaining_time": "0:18:52"}
80
+ {"current_steps": 80, "total_steps": 117, "loss": 0.1397, "lr": 2.7634342584218364e-06, "epoch": 8.405063291139241, "percentage": 68.38, "elapsed_time": "0:39:34", "remaining_time": "0:18:17"}
81
+ {"current_steps": 81, "total_steps": 117, "loss": 0.2219, "lr": 2.6306566876350072e-06, "epoch": 8.50632911392405, "percentage": 69.23, "elapsed_time": "0:40:03", "remaining_time": "0:17:48"}
82
+ {"current_steps": 82, "total_steps": 117, "loss": 0.1362, "lr": 2.5000000000000015e-06, "epoch": 8.60759493670886, "percentage": 70.09, "elapsed_time": "0:40:28", "remaining_time": "0:17:16"}
83
+ {"current_steps": 83, "total_steps": 117, "loss": 0.1965, "lr": 2.371581150947476e-06, "epoch": 8.708860759493671, "percentage": 70.94, "elapsed_time": "0:40:54", "remaining_time": "0:16:45"}
84
+ {"current_steps": 84, "total_steps": 117, "loss": 0.2106, "lr": 2.245515092739488e-06, "epoch": 8.810126582278482, "percentage": 71.79, "elapsed_time": "0:41:29", "remaining_time": "0:16:17"}
85
+ {"current_steps": 85, "total_steps": 117, "loss": 0.151, "lr": 2.1219146715716332e-06, "epoch": 8.91139240506329, "percentage": 72.65, "elapsed_time": "0:41:44", "remaining_time": "0:15:42"}
86
+ {"current_steps": 86, "total_steps": 117, "loss": 0.1684, "lr": 2.0008905265604316e-06, "epoch": 9.050632911392405, "percentage": 73.5, "elapsed_time": "0:43:08", "remaining_time": "0:15:33"}