sedrickkeh commited on
Commit
9c7c52f
·
verified ·
1 Parent(s): 4ad06f3

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:92e7ec5c56c988d48e2263f6fdefeb750ed5120d86f540a15f00cabdaae06d43
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5640feb9ce63d00217e08262b97b74fc945e26c70aacdef2131ffd47f158192b
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1d737baca2dc81e1667e300d5b8bf07e102e24e99360c1e136d015b6ab6f2f85
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec25a652cbda1b84f04f4ec3592e555dd2cd2431fe58a48244378cf01cd918d3
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b561dd1099b98564a7714df65b29474b64c033be6a8afe2ae6bd71db5abdc6c4
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c794e3203c7d04155566418905c7e4dc2527ae0843cb5d74ddecb7e96f17de78
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:32a5df850156613f10caa3dffd731ea4ab1cbf03412a901e66c397aab1ed03a7
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73c8c1555f87907649eaa4618089a46566a0d7cf6d6d1d20c21d3cfb6f482f03
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -21,3 +21,24 @@
21
  {"current_steps": 21, "total_steps": 60, "loss": 1.2317, "lr": 8.213938048432697e-06, "epoch": 1.016, "percentage": 35.0, "elapsed_time": "0:20:43", "remaining_time": "0:38:29"}
22
  {"current_steps": 22, "total_steps": 60, "loss": 0.8934, "lr": 7.985792958513932e-06, "epoch": 1.064, "percentage": 36.67, "elapsed_time": "0:21:38", "remaining_time": "0:37:23"}
23
  {"current_steps": 23, "total_steps": 60, "loss": 0.991, "lr": 7.747544890354031e-06, "epoch": 1.112, "percentage": 38.33, "elapsed_time": "0:22:33", "remaining_time": "0:36:16"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
21
  {"current_steps": 21, "total_steps": 60, "loss": 1.2317, "lr": 8.213938048432697e-06, "epoch": 1.016, "percentage": 35.0, "elapsed_time": "0:20:43", "remaining_time": "0:38:29"}
22
  {"current_steps": 22, "total_steps": 60, "loss": 0.8934, "lr": 7.985792958513932e-06, "epoch": 1.064, "percentage": 36.67, "elapsed_time": "0:21:38", "remaining_time": "0:37:23"}
23
  {"current_steps": 23, "total_steps": 60, "loss": 0.991, "lr": 7.747544890354031e-06, "epoch": 1.112, "percentage": 38.33, "elapsed_time": "0:22:33", "remaining_time": "0:36:16"}
24
+ {"current_steps": 24, "total_steps": 60, "loss": 0.9389, "lr": 7.500000000000001e-06, "epoch": 1.16, "percentage": 40.0, "elapsed_time": "0:23:27", "remaining_time": "0:35:11"}
25
+ {"current_steps": 25, "total_steps": 60, "loss": 0.86, "lr": 7.243995901002312e-06, "epoch": 1.208, "percentage": 41.67, "elapsed_time": "0:24:25", "remaining_time": "0:34:11"}
26
+ {"current_steps": 26, "total_steps": 60, "loss": 0.9331, "lr": 6.980398830195785e-06, "epoch": 1.256, "percentage": 43.33, "elapsed_time": "0:25:21", "remaining_time": "0:33:09"}
27
+ {"current_steps": 27, "total_steps": 60, "loss": 0.9881, "lr": 6.710100716628345e-06, "epoch": 1.304, "percentage": 45.0, "elapsed_time": "0:26:13", "remaining_time": "0:32:02"}
28
+ {"current_steps": 28, "total_steps": 60, "loss": 0.9337, "lr": 6.434016163555452e-06, "epoch": 1.3519999999999999, "percentage": 46.67, "elapsed_time": "0:27:11", "remaining_time": "0:31:04"}
29
+ {"current_steps": 29, "total_steps": 60, "loss": 0.8651, "lr": 6.153079353712201e-06, "epoch": 1.4, "percentage": 48.33, "elapsed_time": "0:28:07", "remaining_time": "0:30:04"}
30
+ {"current_steps": 30, "total_steps": 60, "loss": 0.8596, "lr": 5.8682408883346535e-06, "epoch": 1.448, "percentage": 50.0, "elapsed_time": "0:28:57", "remaining_time": "0:28:57"}
31
+ {"current_steps": 31, "total_steps": 60, "loss": 0.8963, "lr": 5.5804645706261515e-06, "epoch": 1.496, "percentage": 51.67, "elapsed_time": "0:29:55", "remaining_time": "0:27:59"}
32
+ {"current_steps": 32, "total_steps": 60, "loss": 0.8475, "lr": 5.290724144552379e-06, "epoch": 1.544, "percentage": 53.33, "elapsed_time": "0:30:43", "remaining_time": "0:26:53"}
33
+ {"current_steps": 33, "total_steps": 60, "loss": 0.8904, "lr": 5e-06, "epoch": 1.592, "percentage": 55.0, "elapsed_time": "0:31:36", "remaining_time": "0:25:51"}
34
+ {"current_steps": 34, "total_steps": 60, "loss": 0.9363, "lr": 4.7092758554476215e-06, "epoch": 1.6400000000000001, "percentage": 56.67, "elapsed_time": "0:32:29", "remaining_time": "0:24:50"}
35
+ {"current_steps": 35, "total_steps": 60, "loss": 0.9859, "lr": 4.4195354293738484e-06, "epoch": 1.688, "percentage": 58.33, "elapsed_time": "0:33:32", "remaining_time": "0:23:57"}
36
+ {"current_steps": 36, "total_steps": 60, "loss": 0.7657, "lr": 4.131759111665349e-06, "epoch": 1.736, "percentage": 60.0, "elapsed_time": "0:34:22", "remaining_time": "0:22:55"}
37
+ {"current_steps": 37, "total_steps": 60, "loss": 0.9692, "lr": 3.8469206462878e-06, "epoch": 1.784, "percentage": 61.67, "elapsed_time": "0:35:21", "remaining_time": "0:21:58"}
38
+ {"current_steps": 38, "total_steps": 60, "loss": 0.894, "lr": 3.5659838364445505e-06, "epoch": 1.8319999999999999, "percentage": 63.33, "elapsed_time": "0:36:17", "remaining_time": "0:21:00"}
39
+ {"current_steps": 39, "total_steps": 60, "loss": 1.0476, "lr": 3.289899283371657e-06, "epoch": 1.88, "percentage": 65.0, "elapsed_time": "0:37:21", "remaining_time": "0:20:07"}
40
+ {"current_steps": 40, "total_steps": 60, "loss": 0.7547, "lr": 3.019601169804216e-06, "epoch": 1.928, "percentage": 66.67, "elapsed_time": "0:38:14", "remaining_time": "0:19:07"}
41
+ {"current_steps": 41, "total_steps": 60, "loss": 1.0386, "lr": 2.7560040989976894e-06, "epoch": 1.976, "percentage": 68.33, "elapsed_time": "0:39:11", "remaining_time": "0:18:09"}
42
+ {"current_steps": 42, "total_steps": 60, "loss": 1.0944, "lr": 2.5000000000000015e-06, "epoch": 2.032, "percentage": 70.0, "elapsed_time": "0:41:17", "remaining_time": "0:17:41"}
43
+ {"current_steps": 43, "total_steps": 60, "loss": 0.7287, "lr": 2.2524551096459703e-06, "epoch": 2.08, "percentage": 71.67, "elapsed_time": "0:42:03", "remaining_time": "0:16:37"}
44
+ {"current_steps": 44, "total_steps": 60, "loss": 0.9188, "lr": 2.0142070414860704e-06, "epoch": 2.128, "percentage": 73.33, "elapsed_time": "0:43:00", "remaining_time": "0:15:38"}