ryanmarten commited on
Commit
0d15886
·
verified ·
1 Parent(s): 0ff3cb3

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ffc51524d2cbed36d7f09dd98204ea2c3fe1bd41dc03584b0e9703c2865797e7
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:051d5668a04cc82311647f0e61fd60cf01d4d5e94004f6397c71d3a8a3da76c4
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a27e6c7e2874001c694c80f3941cf7d1cc17517692fc43514d7edac872860c23
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35ba29e4dfcdb83ec3838a8933550af71351c21be97e2dc957f374195a53b449
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0019fb69d9eb2fc5550f6088460ffcd1486455ba762b573b0a5e6c8177cef541
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79d8bef13c386a820ecc00732522b5e4e85e8e93cfba5a986264652edd9bb573
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aa66dac0e0adbc7994e83625ca0dcd74f4160cbc892185b56e23be8cf60216e8
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d538d8fa19241687206f65046e9ce847e7cd3028840eba86b1001974f2040ba1
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -80,3 +80,42 @@
80
  {"current_steps": 80, "total_steps": 190, "loss": 0.3866, "lr": 2.8701313729641467e-05, "epoch": 2.0844155844155843, "percentage": 42.11, "elapsed_time": "0:31:58", "remaining_time": "0:43:58"}
81
  {"current_steps": 81, "total_steps": 190, "loss": 0.3825, "lr": 2.8369023454079223e-05, "epoch": 2.1103896103896105, "percentage": 42.63, "elapsed_time": "0:32:18", "remaining_time": "0:43:29"}
82
  {"current_steps": 82, "total_steps": 190, "loss": 0.3714, "lr": 2.8033908493059394e-05, "epoch": 2.1363636363636362, "percentage": 43.16, "elapsed_time": "0:32:40", "remaining_time": "0:43:02"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
80
  {"current_steps": 80, "total_steps": 190, "loss": 0.3866, "lr": 2.8701313729641467e-05, "epoch": 2.0844155844155843, "percentage": 42.11, "elapsed_time": "0:31:58", "remaining_time": "0:43:58"}
81
  {"current_steps": 81, "total_steps": 190, "loss": 0.3825, "lr": 2.8369023454079223e-05, "epoch": 2.1103896103896105, "percentage": 42.63, "elapsed_time": "0:32:18", "remaining_time": "0:43:29"}
82
  {"current_steps": 82, "total_steps": 190, "loss": 0.3714, "lr": 2.8033908493059394e-05, "epoch": 2.1363636363636362, "percentage": 43.16, "elapsed_time": "0:32:40", "remaining_time": "0:43:02"}
83
+ {"current_steps": 83, "total_steps": 190, "loss": 0.3888, "lr": 2.7696081953488917e-05, "epoch": 2.1623376623376624, "percentage": 43.68, "elapsed_time": "0:33:03", "remaining_time": "0:42:37"}
84
+ {"current_steps": 84, "total_steps": 190, "loss": 0.3642, "lr": 2.735565785747787e-05, "epoch": 2.188311688311688, "percentage": 44.21, "elapsed_time": "0:33:25", "remaining_time": "0:42:11"}
85
+ {"current_steps": 85, "total_steps": 190, "loss": 0.3783, "lr": 2.7012751103855092e-05, "epoch": 2.2142857142857144, "percentage": 44.74, "elapsed_time": "0:33:47", "remaining_time": "0:41:44"}
86
+ {"current_steps": 86, "total_steps": 190, "loss": 0.3754, "lr": 2.6667477429387915e-05, "epoch": 2.24025974025974, "percentage": 45.26, "elapsed_time": "0:34:08", "remaining_time": "0:41:17"}
87
+ {"current_steps": 87, "total_steps": 190, "loss": 0.3473, "lr": 2.6319953369719057e-05, "epoch": 2.2662337662337664, "percentage": 45.79, "elapsed_time": "0:34:34", "remaining_time": "0:40:56"}
88
+ {"current_steps": 88, "total_steps": 190, "loss": 0.3471, "lr": 2.5970296220033894e-05, "epoch": 2.292207792207792, "percentage": 46.32, "elapsed_time": "0:35:01", "remaining_time": "0:40:35"}
89
+ {"current_steps": 89, "total_steps": 190, "loss": 0.3837, "lr": 2.5618623995471394e-05, "epoch": 2.3181818181818183, "percentage": 46.84, "elapsed_time": "0:35:22", "remaining_time": "0:40:08"}
90
+ {"current_steps": 90, "total_steps": 190, "loss": 0.3528, "lr": 2.5265055391291986e-05, "epoch": 2.344155844155844, "percentage": 47.37, "elapsed_time": "0:35:47", "remaining_time": "0:39:45"}
91
+ {"current_steps": 91, "total_steps": 190, "loss": 0.3649, "lr": 2.4909709742815986e-05, "epoch": 2.3701298701298703, "percentage": 47.89, "elapsed_time": "0:36:13", "remaining_time": "0:39:24"}
92
+ {"current_steps": 92, "total_steps": 190, "loss": 0.3669, "lr": 2.4552706985145873e-05, "epoch": 2.396103896103896, "percentage": 48.42, "elapsed_time": "0:36:31", "remaining_time": "0:38:54"}
93
+ {"current_steps": 93, "total_steps": 190, "loss": 0.3532, "lr": 2.4194167612686208e-05, "epoch": 2.4220779220779223, "percentage": 48.95, "elapsed_time": "0:36:50", "remaining_time": "0:38:25"}
94
+ {"current_steps": 94, "total_steps": 190, "loss": 0.3657, "lr": 2.3834212638474773e-05, "epoch": 2.448051948051948, "percentage": 49.47, "elapsed_time": "0:37:10", "remaining_time": "0:37:58"}
95
+ {"current_steps": 95, "total_steps": 190, "loss": 0.3621, "lr": 2.3472963553338614e-05, "epoch": 2.474025974025974, "percentage": 50.0, "elapsed_time": "0:37:29", "remaining_time": "0:37:29"}
96
+ {"current_steps": 96, "total_steps": 190, "loss": 0.3467, "lr": 2.3110542284888866e-05, "epoch": 2.5, "percentage": 50.53, "elapsed_time": "0:37:46", "remaining_time": "0:36:59"}
97
+ {"current_steps": 97, "total_steps": 190, "loss": 0.3624, "lr": 2.2747071156368166e-05, "epoch": 2.525974025974026, "percentage": 51.05, "elapsed_time": "0:38:12", "remaining_time": "0:36:38"}
98
+ {"current_steps": 98, "total_steps": 190, "loss": 0.3564, "lr": 2.2382672845364474e-05, "epoch": 2.551948051948052, "percentage": 51.58, "elapsed_time": "0:38:34", "remaining_time": "0:36:13"}
99
+ {"current_steps": 99, "total_steps": 190, "loss": 0.3658, "lr": 2.201747034240537e-05, "epoch": 2.5779220779220777, "percentage": 52.11, "elapsed_time": "0:38:59", "remaining_time": "0:35:50"}
100
+ {"current_steps": 100, "total_steps": 190, "loss": 0.3473, "lr": 2.165158690944665e-05, "epoch": 2.603896103896104, "percentage": 52.63, "elapsed_time": "0:39:20", "remaining_time": "0:35:24"}
101
+ {"current_steps": 101, "total_steps": 190, "loss": 0.3416, "lr": 2.1285146038269406e-05, "epoch": 2.62987012987013, "percentage": 53.16, "elapsed_time": "0:39:46", "remaining_time": "0:35:03"}
102
+ {"current_steps": 102, "total_steps": 190, "loss": 0.3448, "lr": 2.091827140879944e-05, "epoch": 2.655844155844156, "percentage": 53.68, "elapsed_time": "0:40:17", "remaining_time": "0:34:45"}
103
+ {"current_steps": 103, "total_steps": 190, "loss": 0.3433, "lr": 2.0551086847363245e-05, "epoch": 2.6818181818181817, "percentage": 54.21, "elapsed_time": "0:40:40", "remaining_time": "0:34:21"}
104
+ {"current_steps": 104, "total_steps": 190, "loss": 0.3467, "lr": 2.0183716284894533e-05, "epoch": 2.707792207792208, "percentage": 54.74, "elapsed_time": "0:41:00", "remaining_time": "0:33:54"}
105
+ {"current_steps": 105, "total_steps": 190, "loss": 0.3482, "lr": 1.9816283715105474e-05, "epoch": 2.7337662337662336, "percentage": 55.26, "elapsed_time": "0:41:19", "remaining_time": "0:33:27"}
106
+ {"current_steps": 106, "total_steps": 190, "loss": 0.3545, "lr": 1.9448913152636765e-05, "epoch": 2.75974025974026, "percentage": 55.79, "elapsed_time": "0:41:39", "remaining_time": "0:33:00"}
107
+ {"current_steps": 107, "total_steps": 190, "loss": 0.3666, "lr": 1.9081728591200565e-05, "epoch": 2.7857142857142856, "percentage": 56.32, "elapsed_time": "0:42:00", "remaining_time": "0:32:35"}
108
+ {"current_steps": 108, "total_steps": 190, "loss": 0.344, "lr": 1.87148539617306e-05, "epoch": 2.811688311688312, "percentage": 56.84, "elapsed_time": "0:42:21", "remaining_time": "0:32:09"}
109
+ {"current_steps": 109, "total_steps": 190, "loss": 0.3387, "lr": 1.8348413090553356e-05, "epoch": 2.8376623376623376, "percentage": 57.37, "elapsed_time": "0:42:39", "remaining_time": "0:31:41"}
110
+ {"current_steps": 110, "total_steps": 190, "loss": 0.3604, "lr": 1.7982529657594637e-05, "epoch": 2.8636363636363638, "percentage": 57.89, "elapsed_time": "0:43:01", "remaining_time": "0:31:17"}
111
+ {"current_steps": 111, "total_steps": 190, "loss": 0.3363, "lr": 1.761732715463553e-05, "epoch": 2.8896103896103895, "percentage": 58.42, "elapsed_time": "0:43:19", "remaining_time": "0:30:50"}
112
+ {"current_steps": 112, "total_steps": 190, "loss": 0.3546, "lr": 1.7252928843631838e-05, "epoch": 2.9155844155844157, "percentage": 58.95, "elapsed_time": "0:43:39", "remaining_time": "0:30:24"}
113
+ {"current_steps": 113, "total_steps": 190, "loss": 0.3486, "lr": 1.6889457715111144e-05, "epoch": 2.9415584415584415, "percentage": 59.47, "elapsed_time": "0:44:08", "remaining_time": "0:30:04"}
114
+ {"current_steps": 114, "total_steps": 190, "loss": 0.3352, "lr": 1.6527036446661396e-05, "epoch": 2.9675324675324677, "percentage": 60.0, "elapsed_time": "0:44:28", "remaining_time": "0:29:39"}
115
+ {"current_steps": 115, "total_steps": 190, "loss": 0.3593, "lr": 1.6165787361525237e-05, "epoch": 2.9935064935064934, "percentage": 60.53, "elapsed_time": "0:44:51", "remaining_time": "0:29:15"}
116
+ {"current_steps": 116, "total_steps": 190, "loss": 0.2407, "lr": 1.5805832387313795e-05, "epoch": 3.022727272727273, "percentage": 61.05, "elapsed_time": "0:46:11", "remaining_time": "0:29:28"}
117
+ {"current_steps": 117, "total_steps": 190, "loss": 0.1911, "lr": 1.544729301485414e-05, "epoch": 3.0487012987012987, "percentage": 61.58, "elapsed_time": "0:46:30", "remaining_time": "0:29:01"}
118
+ {"current_steps": 118, "total_steps": 190, "loss": 0.1896, "lr": 1.5090290257184019e-05, "epoch": 3.074675324675325, "percentage": 62.11, "elapsed_time": "0:46:49", "remaining_time": "0:28:34"}
119
+ {"current_steps": 119, "total_steps": 190, "loss": 0.2093, "lr": 1.4734944608708022e-05, "epoch": 3.1006493506493507, "percentage": 62.63, "elapsed_time": "0:47:12", "remaining_time": "0:28:10"}
120
+ {"current_steps": 120, "total_steps": 190, "loss": 0.2057, "lr": 1.4381376004528616e-05, "epoch": 3.1266233766233764, "percentage": 63.16, "elapsed_time": "0:47:36", "remaining_time": "0:27:46"}
121
+ {"current_steps": 121, "total_steps": 190, "loss": 0.1884, "lr": 1.4029703779966116e-05, "epoch": 3.1525974025974026, "percentage": 63.68, "elapsed_time": "0:47:53", "remaining_time": "0:27:18"}