sharukat commited on
Commit
2c0d046
·
verified ·
1 Parent(s): 9351061

Training in progress, epoch 5

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf8d0dc39fc554f5133aeee0a32cbdb4ea4ab932c17eb8e076cc9b9be62d7115
3
  size 502675828
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:67a4cb420958d75a3bb4a7ce6dc06955cc986e3d340535eadfc1a5407026e1a6
3
  size 502675828
runs/Apr10_15-06-31_9088970cc926/events.out.tfevents.1712761592.9088970cc926.34.1 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a670c62bf143f8838a31fb99666f1e27be401d52b09911f10d139cfc1df676d7
3
- size 7894
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:55818385261a9228fe7718644c8078ac2604992eb45db2fda25a43443b285848
3
+ size 8577
wandb/debug-internal.log CHANGED
@@ -426,3 +426,38 @@ subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after
426
  2024-04-10 15:10:56,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
427
  2024-04-10 15:10:58,184 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
428
  2024-04-10 15:11:00,835 DEBUG SenderThread:100 [sender.py:send():379] send: stats
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
426
  2024-04-10 15:10:56,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
427
  2024-04-10 15:10:58,184 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
428
  2024-04-10 15:11:00,835 DEBUG SenderThread:100 [sender.py:send():379] send: stats
429
+ 2024-04-10 15:11:03,836 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
430
+ 2024-04-10 15:11:08,837 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
431
+ 2024-04-10 15:11:11,991 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
432
+ 2024-04-10 15:11:11,999 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
433
+ 2024-04-10 15:11:11,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
434
+ 2024-04-10 15:11:14,251 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
435
+ 2024-04-10 15:11:19,252 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
436
+ 2024-04-10 15:11:24,253 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
437
+ 2024-04-10 15:11:26,991 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
438
+ 2024-04-10 15:11:27,000 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
439
+ 2024-04-10 15:11:27,000 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
440
+ 2024-04-10 15:11:30,239 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
441
+ 2024-04-10 15:11:30,836 DEBUG SenderThread:100 [sender.py:send():379] send: stats
442
+ 2024-04-10 15:11:34,816 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: partial_history
443
+ 2024-04-10 15:11:34,817 DEBUG SenderThread:100 [sender.py:send():379] send: history
444
+ 2024-04-10 15:11:34,818 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: summary_record
445
+ 2024-04-10 15:11:34,818 INFO SenderThread:100 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
446
+ 2024-04-10 15:11:34,883 INFO Thread-12 :100 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_150123-cuua991r/files/wandb-summary.json
447
+ 2024-04-10 15:11:35,819 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
448
+ 2024-04-10 15:11:37,666 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: partial_history
449
+ 2024-04-10 15:11:37,667 DEBUG SenderThread:100 [sender.py:send():379] send: history
450
+ 2024-04-10 15:11:37,668 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: summary_record
451
+ 2024-04-10 15:11:37,668 INFO SenderThread:100 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
452
+ 2024-04-10 15:11:37,884 INFO Thread-12 :100 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_150123-cuua991r/files/wandb-summary.json
453
+ 2024-04-10 15:11:38,885 INFO Thread-12 :100 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_150123-cuua991r/files/output.log
454
+ 2024-04-10 15:11:41,669 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
455
+ 2024-04-10 15:11:41,991 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
456
+ 2024-04-10 15:11:42,000 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
457
+ 2024-04-10 15:11:42,000 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
458
+ 2024-04-10 15:11:47,192 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
459
+ 2024-04-10 15:11:52,193 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
460
+ 2024-04-10 15:11:56,991 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
461
+ 2024-04-10 15:11:57,000 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
462
+ 2024-04-10 15:11:57,000 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
463
+ 2024-04-10 15:11:57,236 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
wandb/run-20240410_150123-cuua991r/files/output.log CHANGED
@@ -17,4 +17,6 @@ dataloader_config = DataLoaderConfiguration(dispatch_batches=None, split_batches
17
  _warn_prf(average, modifier, msg_start, len(result))
18
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
19
  _warn_prf(average, modifier, msg_start, len(result))
 
 
20
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
 
17
  _warn_prf(average, modifier, msg_start, len(result))
18
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
19
  _warn_prf(average, modifier, msg_start, len(result))
20
+ /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
21
+ _warn_prf(average, modifier, msg_start, len(result))
22
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
wandb/run-20240410_150123-cuua991r/files/wandb-summary.json CHANGED
@@ -1 +1 @@
1
- {"train/loss": 1.8157, "train/grad_norm": 8.839205741882324, "train/learning_rate": 6.0169491525423725e-06, "train/epoch": 4.0, "train/global_step": 472, "_timestamp": 1712761836.404062, "_runtime": 552.8533301353455, "_step": 15, "eval/loss": 1.847446084022522, "eval/accuracy": 0.28169014084507044, "eval/precision": 0.14118326831447664, "eval/recall": 0.28169014084507044, "eval/f1": 0.1868000687049124, "eval/runtime": 2.8541, "eval/samples_per_second": 49.753, "eval/steps_per_second": 6.307}
 
1
+ {"train/loss": 1.778, "train/grad_norm": 7.37423038482666, "train/learning_rate": 5.016949152542373e-06, "train/epoch": 5.0, "train/global_step": 590, "_timestamp": 1712761897.6655517, "_runtime": 614.1148197650909, "_step": 17, "eval/loss": 1.8340991735458374, "eval/accuracy": 0.2605633802816901, "eval/precision": 0.16817207593386405, "eval/recall": 0.2605633802816901, "eval/f1": 0.18793666033701997, "eval/runtime": 2.8447, "eval/samples_per_second": 49.918, "eval/steps_per_second": 6.328}
wandb/run-20240410_150123-cuua991r/logs/debug-internal.log CHANGED
@@ -426,3 +426,38 @@ subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after
426
  2024-04-10 15:10:56,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
427
  2024-04-10 15:10:58,184 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
428
  2024-04-10 15:11:00,835 DEBUG SenderThread:100 [sender.py:send():379] send: stats
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
426
  2024-04-10 15:10:56,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
427
  2024-04-10 15:10:58,184 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
428
  2024-04-10 15:11:00,835 DEBUG SenderThread:100 [sender.py:send():379] send: stats
429
+ 2024-04-10 15:11:03,836 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
430
+ 2024-04-10 15:11:08,837 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
431
+ 2024-04-10 15:11:11,991 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
432
+ 2024-04-10 15:11:11,999 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
433
+ 2024-04-10 15:11:11,999 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
434
+ 2024-04-10 15:11:14,251 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
435
+ 2024-04-10 15:11:19,252 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
436
+ 2024-04-10 15:11:24,253 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
437
+ 2024-04-10 15:11:26,991 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
438
+ 2024-04-10 15:11:27,000 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
439
+ 2024-04-10 15:11:27,000 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
440
+ 2024-04-10 15:11:30,239 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
441
+ 2024-04-10 15:11:30,836 DEBUG SenderThread:100 [sender.py:send():379] send: stats
442
+ 2024-04-10 15:11:34,816 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: partial_history
443
+ 2024-04-10 15:11:34,817 DEBUG SenderThread:100 [sender.py:send():379] send: history
444
+ 2024-04-10 15:11:34,818 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: summary_record
445
+ 2024-04-10 15:11:34,818 INFO SenderThread:100 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
446
+ 2024-04-10 15:11:34,883 INFO Thread-12 :100 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_150123-cuua991r/files/wandb-summary.json
447
+ 2024-04-10 15:11:35,819 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
448
+ 2024-04-10 15:11:37,666 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: partial_history
449
+ 2024-04-10 15:11:37,667 DEBUG SenderThread:100 [sender.py:send():379] send: history
450
+ 2024-04-10 15:11:37,668 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: summary_record
451
+ 2024-04-10 15:11:37,668 INFO SenderThread:100 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
452
+ 2024-04-10 15:11:37,884 INFO Thread-12 :100 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_150123-cuua991r/files/wandb-summary.json
453
+ 2024-04-10 15:11:38,885 INFO Thread-12 :100 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_150123-cuua991r/files/output.log
454
+ 2024-04-10 15:11:41,669 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
455
+ 2024-04-10 15:11:41,991 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
456
+ 2024-04-10 15:11:42,000 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
457
+ 2024-04-10 15:11:42,000 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
458
+ 2024-04-10 15:11:47,192 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
459
+ 2024-04-10 15:11:52,193 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report
460
+ 2024-04-10 15:11:56,991 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: internal_messages
461
+ 2024-04-10 15:11:57,000 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: stop_status
462
+ 2024-04-10 15:11:57,000 DEBUG SenderThread:100 [sender.py:send_request():406] send_request: stop_status
463
+ 2024-04-10 15:11:57,236 DEBUG HandlerThread:100 [handler.py:handle_request():146] handle_request: status_report