gsmyrnis commited on
Commit
d802dcf
·
verified ·
1 Parent(s): 5320b49

Training in progress, epoch 1

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:585a71b995bf71e75c6bdca54ae005bf4f9c31a2ca2077a6bde649c91248c4ab
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40f38a285767f7686e72c50f455741c77f9deedbe105578804c8d6d46f8c0bdf
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3f7c2b87e185fa451bb775ca1f1df1259af945283a770593c819af428bdde332
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0409cc62d5b17b02e76042416c02256037e7779755228ef58c064f33f5e68ccc
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:36a9edd4463485fe8aaecbf4f4208244a06b14f8b4838cf3c0d6841452c56fd4
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6aeaa421c8a78e3d50140d2c04608a44a2b1080982dd51529e56e9cfa6103a2e
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:30ab721db5f33777ba77f9a80f0e9ffa216e77899e6db06fbdcc5217ef16ae5a
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9272e0f4fcce8b5ba3aaba56a0f832b45e9beb921fa0216a92af4eb7c52508b2
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -88,3 +88,80 @@
88
  {"current_steps": 88, "total_steps": 234, "loss": 0.7596, "lr": 7.87808532842837e-06, "epoch": 1.123404255319149, "percentage": 37.61, "elapsed_time": "0:21:34", "remaining_time": "0:35:47"}
89
  {"current_steps": 89, "total_steps": 234, "loss": 0.7416, "lr": 7.81660029031811e-06, "epoch": 1.1361702127659574, "percentage": 38.03, "elapsed_time": "0:21:45", "remaining_time": "0:35:26"}
90
  {"current_steps": 90, "total_steps": 234, "loss": 0.688, "lr": 7.754484907260513e-06, "epoch": 1.148936170212766, "percentage": 38.46, "elapsed_time": "0:21:58", "remaining_time": "0:35:09"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
88
  {"current_steps": 88, "total_steps": 234, "loss": 0.7596, "lr": 7.87808532842837e-06, "epoch": 1.123404255319149, "percentage": 37.61, "elapsed_time": "0:21:34", "remaining_time": "0:35:47"}
89
  {"current_steps": 89, "total_steps": 234, "loss": 0.7416, "lr": 7.81660029031811e-06, "epoch": 1.1361702127659574, "percentage": 38.03, "elapsed_time": "0:21:45", "remaining_time": "0:35:26"}
90
  {"current_steps": 90, "total_steps": 234, "loss": 0.688, "lr": 7.754484907260513e-06, "epoch": 1.148936170212766, "percentage": 38.46, "elapsed_time": "0:21:58", "remaining_time": "0:35:09"}
91
+ {"current_steps": 91, "total_steps": 234, "loss": 0.7427, "lr": 7.691753080453413e-06, "epoch": 1.1617021276595745, "percentage": 38.89, "elapsed_time": "0:22:12", "remaining_time": "0:34:54"}
92
+ {"current_steps": 92, "total_steps": 234, "loss": 0.7761, "lr": 7.628418849052523e-06, "epoch": 1.174468085106383, "percentage": 39.32, "elapsed_time": "0:22:23", "remaining_time": "0:34:34"}
93
+ {"current_steps": 93, "total_steps": 234, "loss": 0.8177, "lr": 7.564496387029532e-06, "epoch": 1.1872340425531915, "percentage": 39.74, "elapsed_time": "0:22:39", "remaining_time": "0:34:20"}
94
+ {"current_steps": 94, "total_steps": 234, "loss": 0.731, "lr": 7.500000000000001e-06, "epoch": 1.2, "percentage": 40.17, "elapsed_time": "0:22:52", "remaining_time": "0:34:03"}
95
+ {"current_steps": 95, "total_steps": 234, "loss": 0.7076, "lr": 7.434944122021837e-06, "epoch": 1.2127659574468086, "percentage": 40.6, "elapsed_time": "0:23:08", "remaining_time": "0:33:51"}
96
+ {"current_steps": 96, "total_steps": 234, "loss": 0.7707, "lr": 7.369343312364994e-06, "epoch": 1.225531914893617, "percentage": 41.03, "elapsed_time": "0:23:20", "remaining_time": "0:33:33"}
97
+ {"current_steps": 97, "total_steps": 234, "loss": 0.7246, "lr": 7.303212252253163e-06, "epoch": 1.2382978723404254, "percentage": 41.45, "elapsed_time": "0:23:36", "remaining_time": "0:33:20"}
98
+ {"current_steps": 98, "total_steps": 234, "loss": 0.8116, "lr": 7.236565741578163e-06, "epoch": 1.251063829787234, "percentage": 41.88, "elapsed_time": "0:23:51", "remaining_time": "0:33:06"}
99
+ {"current_steps": 99, "total_steps": 234, "loss": 0.7499, "lr": 7.169418695587791e-06, "epoch": 1.2638297872340425, "percentage": 42.31, "elapsed_time": "0:24:06", "remaining_time": "0:32:52"}
100
+ {"current_steps": 100, "total_steps": 234, "loss": 0.7554, "lr": 7.101786141547829e-06, "epoch": 1.2765957446808511, "percentage": 42.74, "elapsed_time": "0:24:19", "remaining_time": "0:32:35"}
101
+ {"current_steps": 101, "total_steps": 234, "loss": 0.6596, "lr": 7.033683215379002e-06, "epoch": 1.2893617021276595, "percentage": 43.16, "elapsed_time": "0:24:32", "remaining_time": "0:32:19"}
102
+ {"current_steps": 102, "total_steps": 234, "loss": 0.8226, "lr": 6.965125158269619e-06, "epoch": 1.302127659574468, "percentage": 43.59, "elapsed_time": "0:24:46", "remaining_time": "0:32:04"}
103
+ {"current_steps": 103, "total_steps": 234, "loss": 0.8034, "lr": 6.896127313264643e-06, "epoch": 1.3148936170212766, "percentage": 44.02, "elapsed_time": "0:25:01", "remaining_time": "0:31:49"}
104
+ {"current_steps": 104, "total_steps": 234, "loss": 0.7348, "lr": 6.8267051218319766e-06, "epoch": 1.327659574468085, "percentage": 44.44, "elapsed_time": "0:25:15", "remaining_time": "0:31:33"}
105
+ {"current_steps": 105, "total_steps": 234, "loss": 0.7203, "lr": 6.7568741204067145e-06, "epoch": 1.3404255319148937, "percentage": 44.87, "elapsed_time": "0:25:25", "remaining_time": "0:31:14"}
106
+ {"current_steps": 106, "total_steps": 234, "loss": 0.7419, "lr": 6.686649936914151e-06, "epoch": 1.353191489361702, "percentage": 45.3, "elapsed_time": "0:25:39", "remaining_time": "0:30:59"}
107
+ {"current_steps": 107, "total_steps": 234, "loss": 0.7898, "lr": 6.616048287272301e-06, "epoch": 1.3659574468085105, "percentage": 45.73, "elapsed_time": "0:25:55", "remaining_time": "0:30:46"}
108
+ {"current_steps": 108, "total_steps": 234, "loss": 0.8062, "lr": 6.545084971874738e-06, "epoch": 1.3787234042553191, "percentage": 46.15, "elapsed_time": "0:26:11", "remaining_time": "0:30:33"}
109
+ {"current_steps": 109, "total_steps": 234, "loss": 0.8034, "lr": 6.473775872054522e-06, "epoch": 1.3914893617021278, "percentage": 46.58, "elapsed_time": "0:26:25", "remaining_time": "0:30:18"}
110
+ {"current_steps": 110, "total_steps": 234, "loss": 0.7673, "lr": 6.402136946530014e-06, "epoch": 1.4042553191489362, "percentage": 47.01, "elapsed_time": "0:26:40", "remaining_time": "0:30:03"}
111
+ {"current_steps": 111, "total_steps": 234, "loss": 0.6315, "lr": 6.330184227833376e-06, "epoch": 1.4170212765957446, "percentage": 47.44, "elapsed_time": "0:26:56", "remaining_time": "0:29:50"}
112
+ {"current_steps": 112, "total_steps": 234, "loss": 0.7698, "lr": 6.257933818722544e-06, "epoch": 1.4297872340425533, "percentage": 47.86, "elapsed_time": "0:27:10", "remaining_time": "0:29:35"}
113
+ {"current_steps": 113, "total_steps": 234, "loss": 0.8267, "lr": 6.185401888577488e-06, "epoch": 1.4425531914893617, "percentage": 48.29, "elapsed_time": "0:27:24", "remaining_time": "0:29:20"}
114
+ {"current_steps": 114, "total_steps": 234, "loss": 0.6971, "lr": 6.112604669781572e-06, "epoch": 1.4553191489361703, "percentage": 48.72, "elapsed_time": "0:27:39", "remaining_time": "0:29:06"}
115
+ {"current_steps": 115, "total_steps": 234, "loss": 0.8687, "lr": 6.039558454088796e-06, "epoch": 1.4680851063829787, "percentage": 49.15, "elapsed_time": "0:27:54", "remaining_time": "0:28:52"}
116
+ {"current_steps": 116, "total_steps": 234, "loss": 0.732, "lr": 5.9662795889777666e-06, "epoch": 1.4808510638297872, "percentage": 49.57, "elapsed_time": "0:28:09", "remaining_time": "0:28:38"}
117
+ {"current_steps": 117, "total_steps": 234, "loss": 0.6502, "lr": 5.892784473993184e-06, "epoch": 1.4936170212765958, "percentage": 50.0, "elapsed_time": "0:28:21", "remaining_time": "0:28:21"}
118
+ {"current_steps": 118, "total_steps": 234, "loss": 0.7959, "lr": 5.819089557075689e-06, "epoch": 1.5063829787234042, "percentage": 50.43, "elapsed_time": "0:28:35", "remaining_time": "0:28:06"}
119
+ {"current_steps": 119, "total_steps": 234, "loss": 0.7351, "lr": 5.745211330880872e-06, "epoch": 1.5191489361702128, "percentage": 50.85, "elapsed_time": "0:28:47", "remaining_time": "0:27:49"}
120
+ {"current_steps": 120, "total_steps": 234, "loss": 0.7528, "lr": 5.671166329088278e-06, "epoch": 1.5319148936170213, "percentage": 51.28, "elapsed_time": "0:28:59", "remaining_time": "0:27:32"}
121
+ {"current_steps": 121, "total_steps": 234, "loss": 0.8955, "lr": 5.596971122701221e-06, "epoch": 1.5446808510638297, "percentage": 51.71, "elapsed_time": "0:29:14", "remaining_time": "0:27:18"}
122
+ {"current_steps": 122, "total_steps": 234, "loss": 0.7261, "lr": 5.522642316338268e-06, "epoch": 1.5574468085106383, "percentage": 52.14, "elapsed_time": "0:29:29", "remaining_time": "0:27:04"}
123
+ {"current_steps": 123, "total_steps": 234, "loss": 0.7679, "lr": 5.448196544517168e-06, "epoch": 1.570212765957447, "percentage": 52.56, "elapsed_time": "0:29:44", "remaining_time": "0:26:50"}
124
+ {"current_steps": 124, "total_steps": 234, "loss": 0.7638, "lr": 5.373650467932122e-06, "epoch": 1.5829787234042554, "percentage": 52.99, "elapsed_time": "0:30:01", "remaining_time": "0:26:38"}
125
+ {"current_steps": 125, "total_steps": 234, "loss": 0.787, "lr": 5.299020769725172e-06, "epoch": 1.5957446808510638, "percentage": 53.42, "elapsed_time": "0:30:18", "remaining_time": "0:26:25"}
126
+ {"current_steps": 126, "total_steps": 234, "loss": 0.8122, "lr": 5.224324151752575e-06, "epoch": 1.6085106382978722, "percentage": 53.85, "elapsed_time": "0:30:33", "remaining_time": "0:26:11"}
127
+ {"current_steps": 127, "total_steps": 234, "loss": 0.7534, "lr": 5.1495773308469935e-06, "epoch": 1.6212765957446809, "percentage": 54.27, "elapsed_time": "0:30:48", "remaining_time": "0:25:57"}
128
+ {"current_steps": 128, "total_steps": 234, "loss": 0.7181, "lr": 5.074797035076319e-06, "epoch": 1.6340425531914895, "percentage": 54.7, "elapsed_time": "0:31:03", "remaining_time": "0:25:42"}
129
+ {"current_steps": 129, "total_steps": 234, "loss": 0.892, "lr": 5e-06, "epoch": 1.646808510638298, "percentage": 55.13, "elapsed_time": "0:31:19", "remaining_time": "0:25:29"}
130
+ {"current_steps": 130, "total_steps": 234, "loss": 0.7209, "lr": 4.9252029649236835e-06, "epoch": 1.6595744680851063, "percentage": 55.56, "elapsed_time": "0:31:32", "remaining_time": "0:25:14"}
131
+ {"current_steps": 131, "total_steps": 234, "loss": 0.7289, "lr": 4.850422669153009e-06, "epoch": 1.6723404255319148, "percentage": 55.98, "elapsed_time": "0:31:48", "remaining_time": "0:25:00"}
132
+ {"current_steps": 132, "total_steps": 234, "loss": 0.7493, "lr": 4.775675848247427e-06, "epoch": 1.6851063829787234, "percentage": 56.41, "elapsed_time": "0:32:00", "remaining_time": "0:24:43"}
133
+ {"current_steps": 133, "total_steps": 234, "loss": 0.6385, "lr": 4.700979230274829e-06, "epoch": 1.697872340425532, "percentage": 56.84, "elapsed_time": "0:32:13", "remaining_time": "0:24:28"}
134
+ {"current_steps": 134, "total_steps": 234, "loss": 0.868, "lr": 4.626349532067879e-06, "epoch": 1.7106382978723405, "percentage": 57.26, "elapsed_time": "0:32:28", "remaining_time": "0:24:13"}
135
+ {"current_steps": 135, "total_steps": 234, "loss": 0.7627, "lr": 4.551803455482833e-06, "epoch": 1.7234042553191489, "percentage": 57.69, "elapsed_time": "0:32:43", "remaining_time": "0:24:00"}
136
+ {"current_steps": 136, "total_steps": 234, "loss": 0.7253, "lr": 4.477357683661734e-06, "epoch": 1.7361702127659573, "percentage": 58.12, "elapsed_time": "0:32:57", "remaining_time": "0:23:45"}
137
+ {"current_steps": 137, "total_steps": 234, "loss": 0.7586, "lr": 4.4030288772987795e-06, "epoch": 1.748936170212766, "percentage": 58.55, "elapsed_time": "0:33:11", "remaining_time": "0:23:29"}
138
+ {"current_steps": 138, "total_steps": 234, "loss": 0.808, "lr": 4.3288336709117246e-06, "epoch": 1.7617021276595746, "percentage": 58.97, "elapsed_time": "0:33:25", "remaining_time": "0:23:14"}
139
+ {"current_steps": 139, "total_steps": 234, "loss": 0.7702, "lr": 4.254788669119127e-06, "epoch": 1.774468085106383, "percentage": 59.4, "elapsed_time": "0:33:34", "remaining_time": "0:22:56"}
140
+ {"current_steps": 140, "total_steps": 234, "loss": 0.7557, "lr": 4.180910442924312e-06, "epoch": 1.7872340425531914, "percentage": 59.83, "elapsed_time": "0:33:49", "remaining_time": "0:22:42"}
141
+ {"current_steps": 141, "total_steps": 234, "loss": 0.7419, "lr": 4.107215526006818e-06, "epoch": 1.8, "percentage": 60.26, "elapsed_time": "0:34:03", "remaining_time": "0:22:27"}
142
+ {"current_steps": 142, "total_steps": 234, "loss": 0.666, "lr": 4.033720411022235e-06, "epoch": 1.8127659574468085, "percentage": 60.68, "elapsed_time": "0:34:15", "remaining_time": "0:22:11"}
143
+ {"current_steps": 143, "total_steps": 234, "loss": 0.772, "lr": 3.960441545911205e-06, "epoch": 1.825531914893617, "percentage": 61.11, "elapsed_time": "0:34:29", "remaining_time": "0:21:57"}
144
+ {"current_steps": 144, "total_steps": 234, "loss": 0.7972, "lr": 3.887395330218429e-06, "epoch": 1.8382978723404255, "percentage": 61.54, "elapsed_time": "0:34:42", "remaining_time": "0:21:41"}
145
+ {"current_steps": 145, "total_steps": 234, "loss": 0.6953, "lr": 3.8145981114225135e-06, "epoch": 1.851063829787234, "percentage": 61.97, "elapsed_time": "0:34:58", "remaining_time": "0:21:27"}
146
+ {"current_steps": 146, "total_steps": 234, "loss": 0.8309, "lr": 3.7420661812774577e-06, "epoch": 1.8638297872340426, "percentage": 62.39, "elapsed_time": "0:35:11", "remaining_time": "0:21:12"}
147
+ {"current_steps": 147, "total_steps": 234, "loss": 0.6375, "lr": 3.669815772166625e-06, "epoch": 1.8765957446808512, "percentage": 62.82, "elapsed_time": "0:35:22", "remaining_time": "0:20:55"}
148
+ {"current_steps": 148, "total_steps": 234, "loss": 0.7718, "lr": 3.5978630534699873e-06, "epoch": 1.8893617021276596, "percentage": 63.25, "elapsed_time": "0:35:34", "remaining_time": "0:20:40"}
149
+ {"current_steps": 149, "total_steps": 234, "loss": 0.7586, "lr": 3.526224127945479e-06, "epoch": 1.902127659574468, "percentage": 63.68, "elapsed_time": "0:35:49", "remaining_time": "0:20:26"}
150
+ {"current_steps": 150, "total_steps": 234, "loss": 0.8194, "lr": 3.4549150281252635e-06, "epoch": 1.9148936170212765, "percentage": 64.1, "elapsed_time": "0:36:05", "remaining_time": "0:20:12"}
151
+ {"current_steps": 151, "total_steps": 234, "loss": 0.7998, "lr": 3.383951712727701e-06, "epoch": 1.9276595744680851, "percentage": 64.53, "elapsed_time": "0:36:22", "remaining_time": "0:19:59"}
152
+ {"current_steps": 152, "total_steps": 234, "loss": 0.7879, "lr": 3.3133500630858507e-06, "epoch": 1.9404255319148938, "percentage": 64.96, "elapsed_time": "0:36:37", "remaining_time": "0:19:45"}
153
+ {"current_steps": 153, "total_steps": 234, "loss": 0.7206, "lr": 3.2431258795932863e-06, "epoch": 1.9531914893617022, "percentage": 65.38, "elapsed_time": "0:36:48", "remaining_time": "0:19:29"}
154
+ {"current_steps": 154, "total_steps": 234, "loss": 0.7528, "lr": 3.173294878168025e-06, "epoch": 1.9659574468085106, "percentage": 65.81, "elapsed_time": "0:36:59", "remaining_time": "0:19:13"}
155
+ {"current_steps": 155, "total_steps": 234, "loss": 0.7817, "lr": 3.1038726867353587e-06, "epoch": 1.978723404255319, "percentage": 66.24, "elapsed_time": "0:37:16", "remaining_time": "0:18:59"}
156
+ {"current_steps": 156, "total_steps": 234, "loss": 0.7491, "lr": 3.0348748417303826e-06, "epoch": 1.9914893617021276, "percentage": 66.67, "elapsed_time": "0:37:29", "remaining_time": "0:18:44"}
157
+ {"current_steps": 157, "total_steps": 234, "loss": 1.2112, "lr": 2.966316784621e-06, "epoch": 2.0042553191489363, "percentage": 67.09, "elapsed_time": "0:38:51", "remaining_time": "0:19:03"}
158
+ {"current_steps": 158, "total_steps": 234, "loss": 0.6694, "lr": 2.8982138584521734e-06, "epoch": 2.0170212765957447, "percentage": 67.52, "elapsed_time": "0:39:04", "remaining_time": "0:18:47"}
159
+ {"current_steps": 159, "total_steps": 234, "loss": 0.7556, "lr": 2.83058130441221e-06, "epoch": 2.029787234042553, "percentage": 67.95, "elapsed_time": "0:39:21", "remaining_time": "0:18:33"}
160
+ {"current_steps": 160, "total_steps": 234, "loss": 0.6236, "lr": 2.7634342584218364e-06, "epoch": 2.0425531914893615, "percentage": 68.38, "elapsed_time": "0:39:35", "remaining_time": "0:18:18"}
161
+ {"current_steps": 161, "total_steps": 234, "loss": 0.8026, "lr": 2.6967877477468394e-06, "epoch": 2.0553191489361704, "percentage": 68.8, "elapsed_time": "0:39:52", "remaining_time": "0:18:04"}
162
+ {"current_steps": 162, "total_steps": 234, "loss": 0.693, "lr": 2.6306566876350072e-06, "epoch": 2.068085106382979, "percentage": 69.23, "elapsed_time": "0:40:06", "remaining_time": "0:17:49"}
163
+ {"current_steps": 163, "total_steps": 234, "loss": 0.695, "lr": 2.5650558779781635e-06, "epoch": 2.0808510638297872, "percentage": 69.66, "elapsed_time": "0:40:21", "remaining_time": "0:17:34"}
164
+ {"current_steps": 164, "total_steps": 234, "loss": 0.6958, "lr": 2.5000000000000015e-06, "epoch": 2.0936170212765957, "percentage": 70.09, "elapsed_time": "0:40:33", "remaining_time": "0:17:18"}
165
+ {"current_steps": 165, "total_steps": 234, "loss": 0.6422, "lr": 2.43550361297047e-06, "epoch": 2.106382978723404, "percentage": 70.51, "elapsed_time": "0:40:46", "remaining_time": "0:17:03"}
166
+ {"current_steps": 166, "total_steps": 234, "loss": 0.7221, "lr": 2.371581150947476e-06, "epoch": 2.119148936170213, "percentage": 70.94, "elapsed_time": "0:41:00", "remaining_time": "0:16:47"}
167
+ {"current_steps": 167, "total_steps": 234, "loss": 0.6881, "lr": 2.3082469195465893e-06, "epoch": 2.1319148936170214, "percentage": 71.37, "elapsed_time": "0:41:13", "remaining_time": "0:16:32"}