sharukat commited on
Commit
9351061
·
verified ·
1 Parent(s): 1e08120

Training in progress, epoch 4

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7429b3e2d9bf032cfab32114ff902416c8f69be1f9fcc8df0c815a004a4b4c9c
3
  size 502675828
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf8d0dc39fc554f5133aeee0a32cbdb4ea4ab932c17eb8e076cc9b9be62d7115
3
  size 502675828
runs/Apr10_15-06-31_9088970cc926/events.out.tfevents.1712761592.9088970cc926.34.1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ccfd8060db458ccc4d8c76a88c71af79dfde5854105b9e2630301ee3b7b4b96
3
- size 7211
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a670c62bf143f8838a31fb99666f1e27be401d52b09911f10d139cfc1df676d7
3
+ size 7894
wandb/debug-internal.log CHANGED
@@ -391,3 +391,38 @@ subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after
391
  2024-04-10 15:09:59,273 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
392
  2024-04-10 15:10:00,833 DEBUG SenderThread:100 [sender.py:send():379] send: stats
393
  2024-04-10 15:10:04,835 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
391
  2024-04-10 15:09:59,273 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
392
  2024-04-10 15:10:00,833 DEBUG SenderThread:100 [sender.py:send():379] send: stats
393
  2024-04-10 15:10:04,835 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
394
+ 2024-04-10 15:10:09,835 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
395
+ 2024-04-10 15:10:11,984 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
396
+ 2024-04-10 15:10:11,998 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
397
+ 2024-04-10 15:10:11,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
398
+ 2024-04-10 15:10:15,227 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
399
+ 2024-04-10 15:10:20,228 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
400
+ 2024-04-10 15:10:25,229 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
401
+ 2024-04-10 15:10:26,984 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
402
+ 2024-04-10 15:10:26,998 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
403
+ 2024-04-10 15:10:26,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
404
+ 2024-04-10 15:10:30,264 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
405
+ 2024-04-10 15:10:30,834 DEBUG SenderThread:100 [sender.py:send():379] send: stats
406
+ 2024-04-10 15:10:33,546 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: partial_history
407
+ 2024-04-10 15:10:33,547 DEBUG SenderThread:100 [sender.py:send():379] send: history
408
+ 2024-04-10 15:10:33,547 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: summary_record
409
+ 2024-04-10 15:10:33,548 INFO SenderThread:100 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
410
+ 2024-04-10 15:10:33,859 INFO Thread-12 :100 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_150123-cuua991r/files/wandb-summary.json
411
+ 2024-04-10 15:10:35,548 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
412
+ 2024-04-10 15:10:36,404 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: partial_history
413
+ 2024-04-10 15:10:36,405 DEBUG SenderThread:100 [sender.py:send():379] send: history
414
+ 2024-04-10 15:10:36,406 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: summary_record
415
+ 2024-04-10 15:10:36,406 INFO SenderThread:100 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
416
+ 2024-04-10 15:10:36,861 INFO Thread-12 :100 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_150123-cuua991r/files/wandb-summary.json
417
+ 2024-04-10 15:10:38,862 INFO Thread-12 :100 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_150123-cuua991r/files/output.log
418
+ 2024-04-10 15:10:41,408 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
419
+ 2024-04-10 15:10:41,984 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
420
+ 2024-04-10 15:10:41,998 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
421
+ 2024-04-10 15:10:41,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
422
+ 2024-04-10 15:10:47,266 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
423
+ 2024-04-10 15:10:52,267 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
424
+ 2024-04-10 15:10:56,998 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
425
+ 2024-04-10 15:10:56,999 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
426
+ 2024-04-10 15:10:56,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
427
+ 2024-04-10 15:10:58,184 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
428
+ 2024-04-10 15:11:00,835 DEBUG SenderThread:100 [sender.py:send():379] send: stats
wandb/run-20240410_150123-cuua991r/files/output.log CHANGED
@@ -15,4 +15,6 @@ dataloader_config = DataLoaderConfiguration(dispatch_batches=None, split_batches
15
  _warn_prf(average, modifier, msg_start, len(result))
16
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
17
  _warn_prf(average, modifier, msg_start, len(result))
 
 
18
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
 
15
  _warn_prf(average, modifier, msg_start, len(result))
16
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
17
  _warn_prf(average, modifier, msg_start, len(result))
18
+ /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
19
+ _warn_prf(average, modifier, msg_start, len(result))
20
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
wandb/run-20240410_150123-cuua991r/files/wandb-summary.json CHANGED
@@ -1 +1 @@
1
- {"train/loss": 1.8499, "train/grad_norm": 8.081238746643066, "train/learning_rate": 7.016949152542374e-06, "train/epoch": 3.0, "train/global_step": 354, "_timestamp": 1712761773.6414328, "_runtime": 490.09070086479187, "_step": 13, "eval/loss": 1.8500417470932007, "eval/accuracy": 0.3028169014084507, "eval/precision": 0.15226251402682664, "eval/recall": 0.3028169014084507, "eval/f1": 0.19308999089624623, "eval/runtime": 2.8399, "eval/samples_per_second": 50.001, "eval/steps_per_second": 6.338}
 
1
+ {"train/loss": 1.8157, "train/grad_norm": 8.839205741882324, "train/learning_rate": 6.0169491525423725e-06, "train/epoch": 4.0, "train/global_step": 472, "_timestamp": 1712761836.404062, "_runtime": 552.8533301353455, "_step": 15, "eval/loss": 1.847446084022522, "eval/accuracy": 0.28169014084507044, "eval/precision": 0.14118326831447664, "eval/recall": 0.28169014084507044, "eval/f1": 0.1868000687049124, "eval/runtime": 2.8541, "eval/samples_per_second": 49.753, "eval/steps_per_second": 6.307}
wandb/run-20240410_150123-cuua991r/logs/debug-internal.log CHANGED
@@ -391,3 +391,38 @@ subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after
391
  2024-04-10 15:09:59,273 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
392
  2024-04-10 15:10:00,833 DEBUG SenderThread:100 [sender.py:send():379] send: stats
393
  2024-04-10 15:10:04,835 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
391
  2024-04-10 15:09:59,273 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
392
  2024-04-10 15:10:00,833 DEBUG SenderThread:100 [sender.py:send():379] send: stats
393
  2024-04-10 15:10:04,835 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
394
+ 2024-04-10 15:10:09,835 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
395
+ 2024-04-10 15:10:11,984 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
396
+ 2024-04-10 15:10:11,998 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
397
+ 2024-04-10 15:10:11,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
398
+ 2024-04-10 15:10:15,227 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
399
+ 2024-04-10 15:10:20,228 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
400
+ 2024-04-10 15:10:25,229 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
401
+ 2024-04-10 15:10:26,984 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
402
+ 2024-04-10 15:10:26,998 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
403
+ 2024-04-10 15:10:26,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
404
+ 2024-04-10 15:10:30,264 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
405
+ 2024-04-10 15:10:30,834 DEBUG SenderThread:100 [sender.py:send():379] send: stats
406
+ 2024-04-10 15:10:33,546 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: partial_history
407
+ 2024-04-10 15:10:33,547 DEBUG SenderThread:100 [sender.py:send():379] send: history
408
+ 2024-04-10 15:10:33,547 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: summary_record
409
+ 2024-04-10 15:10:33,548 INFO SenderThread:100 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
410
+ 2024-04-10 15:10:33,859 INFO Thread-12 :100 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_150123-cuua991r/files/wandb-summary.json
411
+ 2024-04-10 15:10:35,548 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
412
+ 2024-04-10 15:10:36,404 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: partial_history
413
+ 2024-04-10 15:10:36,405 DEBUG SenderThread:100 [sender.py:send():379] send: history
414
+ 2024-04-10 15:10:36,406 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: summary_record
415
+ 2024-04-10 15:10:36,406 INFO SenderThread:100 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
416
+ 2024-04-10 15:10:36,861 INFO Thread-12 :100 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_150123-cuua991r/files/wandb-summary.json
417
+ 2024-04-10 15:10:38,862 INFO Thread-12 :100 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_150123-cuua991r/files/output.log
418
+ 2024-04-10 15:10:41,408 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
419
+ 2024-04-10 15:10:41,984 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
420
+ 2024-04-10 15:10:41,998 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
421
+ 2024-04-10 15:10:41,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
422
+ 2024-04-10 15:10:47,266 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
423
+ 2024-04-10 15:10:52,267 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
424
+ 2024-04-10 15:10:56,998 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
425
+ 2024-04-10 15:10:56,999 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
426
+ 2024-04-10 15:10:56,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
427
+ 2024-04-10 15:10:58,184 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
428
+ 2024-04-10 15:11:00,835 DEBUG SenderThread:100 [sender.py:send():379] send: stats
wandb/run-20240410_150123-cuua991r/run-cuua991r.wandb CHANGED
Binary files a/wandb/run-20240410_150123-cuua991r/run-cuua991r.wandb and b/wandb/run-20240410_150123-cuua991r/run-cuua991r.wandb differ