nornor02 commited on
Commit
27ff10d
·
verified ·
1 Parent(s): 2926ef8

Training in progress, step 2000

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:88f21ae7654fa3e1a55aedae15338758b336a6131838f1a6a7399a419b26d1bc
3
  size 328693404
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd5eee1d3a1a8a8ea109ef9c1f112b86b07b4f693c5152dd541b7610680596a3
3
  size 328693404
runs/Jan17_23-12-05_52cbc9ada374/events.out.tfevents.1705533128.52cbc9ada374.26.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b668852176943c09a25fcdaf9f84e212bb0518c611f5b22ee674045c5802aead
3
- size 4836
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:affd098891ff5b3a304e2225991415319ded4222ab358ee016b05371e56d1026
3
+ size 4993
wandb/debug-internal.log CHANGED
@@ -193,3 +193,44 @@
193
  2024-01-17 23:17:11,204 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
194
  2024-01-17 23:17:13,355 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
195
  2024-01-17 23:17:16,204 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
193
  2024-01-17 23:17:11,204 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
194
  2024-01-17 23:17:13,355 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
195
  2024-01-17 23:17:16,204 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
196
+ 2024-01-17 23:17:18,356 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
197
+ 2024-01-17 23:17:21,205 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
198
+ 2024-01-17 23:17:23,357 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
199
+ 2024-01-17 23:17:24,928 DEBUG SenderThread:103 [sender.py:send():382] send: stats
200
+ 2024-01-17 23:17:26,208 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
201
+ 2024-01-17 23:17:28,929 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
202
+ 2024-01-17 23:17:31,211 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
203
+ 2024-01-17 23:17:33,930 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
204
+ 2024-01-17 23:17:36,212 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
205
+ 2024-01-17 23:17:38,930 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
206
+ 2024-01-17 23:17:41,213 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
207
+ 2024-01-17 23:17:43,931 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
208
+ 2024-01-17 23:17:46,215 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
209
+ 2024-01-17 23:17:48,932 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
210
+ 2024-01-17 23:17:51,217 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
211
+ 2024-01-17 23:17:53,933 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
212
+ 2024-01-17 23:17:54,931 DEBUG SenderThread:103 [sender.py:send():382] send: stats
213
+ 2024-01-17 23:17:56,218 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
214
+ 2024-01-17 23:17:59,932 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
215
+ 2024-01-17 23:18:01,225 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
216
+ 2024-01-17 23:18:04,933 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
217
+ 2024-01-17 23:18:06,226 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
218
+ 2024-01-17 23:18:09,933 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
219
+ 2024-01-17 23:18:11,234 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
220
+ 2024-01-17 23:18:14,934 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
221
+ 2024-01-17 23:18:16,236 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
222
+ 2024-01-17 23:18:19,935 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
223
+ 2024-01-17 23:18:21,237 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
224
+ 2024-01-17 23:18:24,930 DEBUG SenderThread:103 [sender.py:send():382] send: stats
225
+ 2024-01-17 23:18:25,931 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
226
+ 2024-01-17 23:18:26,238 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
227
+ 2024-01-17 23:18:28,971 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: partial_history
228
+ 2024-01-17 23:18:28,972 DEBUG SenderThread:103 [sender.py:send():382] send: history
229
+ 2024-01-17 23:18:28,972 DEBUG SenderThread:103 [sender.py:send_request():409] send_request: summary_record
230
+ 2024-01-17 23:18:28,973 INFO SenderThread:103 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
231
+ 2024-01-17 23:18:29,946 INFO Thread-12 :103 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240117_231223-wasc5lj5/files/wandb-summary.json
232
+ 2024-01-17 23:18:30,973 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
233
+ 2024-01-17 23:18:31,375 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
234
+ 2024-01-17 23:18:33,948 INFO Thread-12 :103 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240117_231223-wasc5lj5/files/output.log
235
+ 2024-01-17 23:18:36,256 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
236
+ 2024-01-17 23:18:36,381 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
wandb/run-20240117_231223-wasc5lj5/files/output.log CHANGED
@@ -5,4 +5,6 @@ You're using a PreTrainedTokenizerFast tokenizer. Please note that with a fast t
5
  warnings.warn('Was asked to gather along dimension 0, but all '
6
  /opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.
7
  warnings.warn('Was asked to gather along dimension 0, but all '
 
 
8
  /opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.
 
5
  warnings.warn('Was asked to gather along dimension 0, but all '
6
  /opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.
7
  warnings.warn('Was asked to gather along dimension 0, but all '
8
+ /opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.
9
+ warnings.warn('Was asked to gather along dimension 0, but all '
10
  /opt/conda/lib/python3.10/site-packages/torch/nn/parallel/_functions.py:68: UserWarning: Was asked to gather along dimension 0, but all input tensors were scalars; will instead unsqueeze and return a vector.
wandb/run-20240117_231223-wasc5lj5/files/wandb-summary.json CHANGED
@@ -1 +1 @@
1
- {"train/loss": 1.6212, "train/learning_rate": 8.461538461538462e-06, "train/epoch": 115.38, "train/global_step": 1500, "_timestamp": 1705533425.1149898, "_runtime": 281.1206748485565, "_step": 2}
 
1
+ {"train/loss": 1.2988, "train/learning_rate": 4.615384615384616e-06, "train/epoch": 153.85, "train/global_step": 2000, "_timestamp": 1705533508.9709108, "_runtime": 364.9765958786011, "_step": 3}
wandb/run-20240117_231223-wasc5lj5/logs/debug-internal.log CHANGED
@@ -193,3 +193,44 @@
193
  2024-01-17 23:17:11,204 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
194
  2024-01-17 23:17:13,355 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
195
  2024-01-17 23:17:16,204 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
193
  2024-01-17 23:17:11,204 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
194
  2024-01-17 23:17:13,355 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
195
  2024-01-17 23:17:16,204 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
196
+ 2024-01-17 23:17:18,356 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
197
+ 2024-01-17 23:17:21,205 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
198
+ 2024-01-17 23:17:23,357 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
199
+ 2024-01-17 23:17:24,928 DEBUG SenderThread:103 [sender.py:send():382] send: stats
200
+ 2024-01-17 23:17:26,208 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
201
+ 2024-01-17 23:17:28,929 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
202
+ 2024-01-17 23:17:31,211 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
203
+ 2024-01-17 23:17:33,930 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
204
+ 2024-01-17 23:17:36,212 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
205
+ 2024-01-17 23:17:38,930 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
206
+ 2024-01-17 23:17:41,213 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
207
+ 2024-01-17 23:17:43,931 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
208
+ 2024-01-17 23:17:46,215 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
209
+ 2024-01-17 23:17:48,932 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
210
+ 2024-01-17 23:17:51,217 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
211
+ 2024-01-17 23:17:53,933 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
212
+ 2024-01-17 23:17:54,931 DEBUG SenderThread:103 [sender.py:send():382] send: stats
213
+ 2024-01-17 23:17:56,218 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
214
+ 2024-01-17 23:17:59,932 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
215
+ 2024-01-17 23:18:01,225 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
216
+ 2024-01-17 23:18:04,933 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
217
+ 2024-01-17 23:18:06,226 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
218
+ 2024-01-17 23:18:09,933 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
219
+ 2024-01-17 23:18:11,234 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
220
+ 2024-01-17 23:18:14,934 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
221
+ 2024-01-17 23:18:16,236 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
222
+ 2024-01-17 23:18:19,935 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
223
+ 2024-01-17 23:18:21,237 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
224
+ 2024-01-17 23:18:24,930 DEBUG SenderThread:103 [sender.py:send():382] send: stats
225
+ 2024-01-17 23:18:25,931 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
226
+ 2024-01-17 23:18:26,238 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
227
+ 2024-01-17 23:18:28,971 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: partial_history
228
+ 2024-01-17 23:18:28,972 DEBUG SenderThread:103 [sender.py:send():382] send: history
229
+ 2024-01-17 23:18:28,972 DEBUG SenderThread:103 [sender.py:send_request():409] send_request: summary_record
230
+ 2024-01-17 23:18:28,973 INFO SenderThread:103 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
231
+ 2024-01-17 23:18:29,946 INFO Thread-12 :103 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240117_231223-wasc5lj5/files/wandb-summary.json
232
+ 2024-01-17 23:18:30,973 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
233
+ 2024-01-17 23:18:31,375 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
234
+ 2024-01-17 23:18:33,948 INFO Thread-12 :103 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240117_231223-wasc5lj5/files/output.log
235
+ 2024-01-17 23:18:36,256 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: status_report
236
+ 2024-01-17 23:18:36,381 DEBUG HandlerThread:103 [handler.py:handle_request():146] handle_request: keepalive
wandb/run-20240117_231223-wasc5lj5/run-wasc5lj5.wandb CHANGED
Binary files a/wandb/run-20240117_231223-wasc5lj5/run-wasc5lj5.wandb and b/wandb/run-20240117_231223-wasc5lj5/run-wasc5lj5.wandb differ