ryanmarten commited on
Commit
05c265f
·
verified ·
1 Parent(s): 70f0ccc

Training in progress, epoch 5

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:212e3c4b92abca77bbc1f748cb1759951fc305280e1a47ba2fd5330d154a4e7b
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2564c606514d795b9e64b4eedb55beb3ed5308579459e43049f59c9e0c31a0f7
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7c7a33598dd0f35b34c840983368eab97318abc550f06c37bd930ce5db206faa
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ae2b6e0c992f2feefd461738f0a518dd6450a8153e0ccaf39f7034c14114d558
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:668fa255d0e61491f5153196cfcb2c2ae0dbaa268a72b1c0a4a770f70f95c853
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56b3d45c3a8393a016b32ac20e6cb57d3839532897a1c81a4b822f267508f223
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a0e065e440ace5b107ef3e6813bb3dfead91cb4f1359b7f5c977eb41e5c1392
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2903a97c9925a90ea89ea9acabcaf67dbea2da237b495c940c03ebda7e183597
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -54,3 +54,14 @@
54
  {"current_steps": 54, "total_steps": 117, "loss": 0.2991, "lr": 6.545084971874738e-06, "epoch": 5.658227848101266, "percentage": 46.15, "elapsed_time": "0:26:02", "remaining_time": "0:30:22"}
55
  {"current_steps": 55, "total_steps": 117, "loss": 0.2762, "lr": 6.402136946530014e-06, "epoch": 5.759493670886076, "percentage": 47.01, "elapsed_time": "0:26:24", "remaining_time": "0:29:46"}
56
  {"current_steps": 56, "total_steps": 117, "loss": 0.2439, "lr": 6.257933818722544e-06, "epoch": 5.860759493670886, "percentage": 47.86, "elapsed_time": "0:26:43", "remaining_time": "0:29:07"}
 
 
 
 
 
 
 
 
 
 
 
 
54
  {"current_steps": 54, "total_steps": 117, "loss": 0.2991, "lr": 6.545084971874738e-06, "epoch": 5.658227848101266, "percentage": 46.15, "elapsed_time": "0:26:02", "remaining_time": "0:30:22"}
55
  {"current_steps": 55, "total_steps": 117, "loss": 0.2762, "lr": 6.402136946530014e-06, "epoch": 5.759493670886076, "percentage": 47.01, "elapsed_time": "0:26:24", "remaining_time": "0:29:46"}
56
  {"current_steps": 56, "total_steps": 117, "loss": 0.2439, "lr": 6.257933818722544e-06, "epoch": 5.860759493670886, "percentage": 47.86, "elapsed_time": "0:26:43", "remaining_time": "0:29:07"}
57
+ {"current_steps": 57, "total_steps": 117, "loss": 0.3137, "lr": 6.112604669781572e-06, "epoch": 5.962025316455696, "percentage": 48.72, "elapsed_time": "0:27:11", "remaining_time": "0:28:37"}
58
+ {"current_steps": 58, "total_steps": 117, "loss": 0.2574, "lr": 5.9662795889777666e-06, "epoch": 6.10126582278481, "percentage": 49.57, "elapsed_time": "0:28:39", "remaining_time": "0:29:09"}
59
+ {"current_steps": 59, "total_steps": 117, "loss": 0.1956, "lr": 5.819089557075689e-06, "epoch": 6.2025316455696204, "percentage": 50.43, "elapsed_time": "0:29:08", "remaining_time": "0:28:38"}
60
+ {"current_steps": 60, "total_steps": 117, "loss": 0.2565, "lr": 5.671166329088278e-06, "epoch": 6.30379746835443, "percentage": 51.28, "elapsed_time": "0:29:34", "remaining_time": "0:28:05"}
61
+ {"current_steps": 61, "total_steps": 117, "loss": 0.3037, "lr": 5.522642316338268e-06, "epoch": 6.405063291139241, "percentage": 52.14, "elapsed_time": "0:30:03", "remaining_time": "0:27:35"}
62
+ {"current_steps": 62, "total_steps": 117, "loss": 0.2369, "lr": 5.373650467932122e-06, "epoch": 6.506329113924051, "percentage": 52.99, "elapsed_time": "0:30:30", "remaining_time": "0:27:03"}
63
+ {"current_steps": 63, "total_steps": 117, "loss": 0.1729, "lr": 5.224324151752575e-06, "epoch": 6.6075949367088604, "percentage": 53.85, "elapsed_time": "0:30:47", "remaining_time": "0:26:23"}
64
+ {"current_steps": 64, "total_steps": 117, "loss": 0.2579, "lr": 5.074797035076319e-06, "epoch": 6.708860759493671, "percentage": 54.7, "elapsed_time": "0:31:09", "remaining_time": "0:25:48"}
65
+ {"current_steps": 65, "total_steps": 117, "loss": 0.2782, "lr": 4.9252029649236835e-06, "epoch": 6.810126582278481, "percentage": 55.56, "elapsed_time": "0:31:34", "remaining_time": "0:25:15"}
66
+ {"current_steps": 66, "total_steps": 117, "loss": 0.2408, "lr": 4.775675848247427e-06, "epoch": 6.911392405063291, "percentage": 56.41, "elapsed_time": "0:32:01", "remaining_time": "0:24:44"}
67
+ {"current_steps": 67, "total_steps": 117, "loss": 0.2107, "lr": 4.626349532067879e-06, "epoch": 7.050632911392405, "percentage": 57.26, "elapsed_time": "0:33:17", "remaining_time": "0:24:50"}