sharukat commited on
Commit
c8b80d8
·
verified ·
1 Parent(s): 2b369dc

Training in progress, epoch 3

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6c3dd47b4c910468e268d03db7d5f3bef3a00253c6ade9204cfd15cf73968149
3
  size 502675828
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a57e47fb384faf33138a4416f9e5a2be79f2b4be384456bdcb3d266154cfa06b
3
  size 502675828
runs/Mar06_15-06-49_41759fa8e6ad/events.out.tfevents.1709737609.41759fa8e6ad.34.4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:997076216899c04f517674f013430d160c7582ddfa4cc8c986d74d9741ca7ec2
3
- size 6510
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d161e64b9478e067452d03d91fc62fce3591d774f8a60eaddbffb678e0cc370c
3
+ size 7180
wandb/debug-internal.log CHANGED
@@ -739,3 +739,33 @@
739
  2024-03-06 15:08:05,345 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
740
  2024-03-06 15:08:07,431 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
741
  2024-03-06 15:08:09,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
739
  2024-03-06 15:08:05,345 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
740
  2024-03-06 15:08:07,431 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
741
  2024-03-06 15:08:09,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
742
+ 2024-03-06 15:08:10,347 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
743
+ 2024-03-06 15:08:12,438 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
744
+ 2024-03-06 15:08:14,803 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
745
+ 2024-03-06 15:08:15,348 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
746
+ 2024-03-06 15:08:17,439 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
747
+ 2024-03-06 15:08:19,804 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
748
+ 2024-03-06 15:08:20,348 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
749
+ 2024-03-06 15:08:22,392 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
750
+ 2024-03-06 15:08:22,393 DEBUG SenderThread:137 [sender.py:send():382] send: history
751
+ 2024-03-06 15:08:22,393 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
752
+ 2024-03-06 15:08:22,393 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
753
+ 2024-03-06 15:08:22,443 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
754
+ 2024-03-06 15:08:23,065 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
755
+ 2024-03-06 15:08:23,507 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
756
+ 2024-03-06 15:08:23,508 DEBUG SenderThread:137 [sender.py:send():382] send: history
757
+ 2024-03-06 15:08:23,509 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
758
+ 2024-03-06 15:08:23,509 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
759
+ 2024-03-06 15:08:24,066 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
760
+ 2024-03-06 15:08:25,349 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
761
+ 2024-03-06 15:08:25,510 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
762
+ 2024-03-06 15:08:26,066 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/output.log
763
+ 2024-03-06 15:08:26,800 DEBUG SenderThread:137 [sender.py:send():382] send: stats
764
+ 2024-03-06 15:08:27,494 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
765
+ 2024-03-06 15:08:30,350 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
766
+ 2024-03-06 15:08:30,801 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
767
+ 2024-03-06 15:08:32,495 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
768
+ 2024-03-06 15:08:35,351 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
769
+ 2024-03-06 15:08:35,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
770
+ 2024-03-06 15:08:37,496 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
771
+ 2024-03-06 15:08:40,352 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
wandb/run-20240306_145424-trm7fvg4/logs/debug-internal.log CHANGED
@@ -790,3 +790,33 @@ wandb.errors.AuthenticationError: The API key you provided is either invalid or
790
  2024-03-06 15:08:05,345 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
791
  2024-03-06 15:08:07,431 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
792
  2024-03-06 15:08:09,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
790
  2024-03-06 15:08:05,345 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
791
  2024-03-06 15:08:07,431 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
792
  2024-03-06 15:08:09,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
793
+ 2024-03-06 15:08:10,347 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
794
+ 2024-03-06 15:08:12,438 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
795
+ 2024-03-06 15:08:14,803 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
796
+ 2024-03-06 15:08:15,348 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
797
+ 2024-03-06 15:08:17,439 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
798
+ 2024-03-06 15:08:19,804 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
799
+ 2024-03-06 15:08:20,348 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
800
+ 2024-03-06 15:08:22,392 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
801
+ 2024-03-06 15:08:22,393 DEBUG SenderThread:137 [sender.py:send():382] send: history
802
+ 2024-03-06 15:08:22,393 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
803
+ 2024-03-06 15:08:22,393 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
804
+ 2024-03-06 15:08:22,443 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
805
+ 2024-03-06 15:08:23,065 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
806
+ 2024-03-06 15:08:23,507 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
807
+ 2024-03-06 15:08:23,508 DEBUG SenderThread:137 [sender.py:send():382] send: history
808
+ 2024-03-06 15:08:23,509 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
809
+ 2024-03-06 15:08:23,509 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
810
+ 2024-03-06 15:08:24,066 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
811
+ 2024-03-06 15:08:25,349 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
812
+ 2024-03-06 15:08:25,510 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
813
+ 2024-03-06 15:08:26,066 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/output.log
814
+ 2024-03-06 15:08:26,800 DEBUG SenderThread:137 [sender.py:send():382] send: stats
815
+ 2024-03-06 15:08:27,494 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
816
+ 2024-03-06 15:08:30,350 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
817
+ 2024-03-06 15:08:30,801 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
818
+ 2024-03-06 15:08:32,495 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
819
+ 2024-03-06 15:08:35,351 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
820
+ 2024-03-06 15:08:35,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
821
+ 2024-03-06 15:08:37,496 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
822
+ 2024-03-06 15:08:40,352 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
wandb/run-20240306_145455-h1uv5tyi/files/output.log CHANGED
@@ -39,3 +39,5 @@ You should probably TRAIN this model on a down-stream task to be able to use it
39
  _warn_prf(average, modifier, msg_start, len(result))
40
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
41
  _warn_prf(average, modifier, msg_start, len(result))
 
 
 
39
  _warn_prf(average, modifier, msg_start, len(result))
40
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
41
  _warn_prf(average, modifier, msg_start, len(result))
42
+ Checkpoint destination directory /kaggle/working/checkpoint-62 already exists and is non-empty. Saving will proceed but saved results may be invalid.
43
+ /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json CHANGED
@@ -1 +1 @@
1
- {"train/loss": 1.7527, "train/grad_norm": 5.8667988777160645, "train/learning_rate": 2.4e-05, "train/epoch": 2.0, "train/global_step": 62, "_timestamp": 1709737671.3031292, "_runtime": 775.5843722820282, "_step": 29, "eval/loss": 1.773923397064209, "eval/accuracy": 0.34545454545454546, "eval/precision": 0.11933884297520661, "eval/recall": 0.34545454545454546, "eval/f1": 0.17739557739557738, "eval/runtime": 1.1095, "eval/samples_per_second": 49.57, "eval/steps_per_second": 3.605, "train/train_runtime": 237.4526, "train/train_samples_per_second": 10.339, "train/train_steps_per_second": 1.306, "train/total_flos": 645966638976000.0, "train/train_loss": 1.7031736066264491}
 
1
+ {"train/loss": 1.7018, "train/grad_norm": 5.185774326324463, "train/learning_rate": 2.1e-05, "train/epoch": 3.0, "train/global_step": 93, "_timestamp": 1709737703.506952, "_runtime": 807.7881951332092, "_step": 31, "eval/loss": 1.739591121673584, "eval/accuracy": 0.34545454545454546, "eval/precision": 0.18308668076109938, "eval/recall": 0.34545454545454546, "eval/f1": 0.23284457478005866, "eval/runtime": 1.1118, "eval/samples_per_second": 49.471, "eval/steps_per_second": 3.598, "train/train_runtime": 237.4526, "train/train_samples_per_second": 10.339, "train/train_steps_per_second": 1.306, "train/total_flos": 645966638976000.0, "train/train_loss": 1.7031736066264491}
wandb/run-20240306_145455-h1uv5tyi/logs/debug-internal.log CHANGED
@@ -739,3 +739,33 @@
739
  2024-03-06 15:08:05,345 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
740
  2024-03-06 15:08:07,431 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
741
  2024-03-06 15:08:09,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
739
  2024-03-06 15:08:05,345 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
740
  2024-03-06 15:08:07,431 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
741
  2024-03-06 15:08:09,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
742
+ 2024-03-06 15:08:10,347 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
743
+ 2024-03-06 15:08:12,438 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
744
+ 2024-03-06 15:08:14,803 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
745
+ 2024-03-06 15:08:15,348 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
746
+ 2024-03-06 15:08:17,439 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
747
+ 2024-03-06 15:08:19,804 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
748
+ 2024-03-06 15:08:20,348 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
749
+ 2024-03-06 15:08:22,392 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
750
+ 2024-03-06 15:08:22,393 DEBUG SenderThread:137 [sender.py:send():382] send: history
751
+ 2024-03-06 15:08:22,393 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
752
+ 2024-03-06 15:08:22,393 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
753
+ 2024-03-06 15:08:22,443 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
754
+ 2024-03-06 15:08:23,065 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
755
+ 2024-03-06 15:08:23,507 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
756
+ 2024-03-06 15:08:23,508 DEBUG SenderThread:137 [sender.py:send():382] send: history
757
+ 2024-03-06 15:08:23,509 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
758
+ 2024-03-06 15:08:23,509 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
759
+ 2024-03-06 15:08:24,066 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
760
+ 2024-03-06 15:08:25,349 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
761
+ 2024-03-06 15:08:25,510 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
762
+ 2024-03-06 15:08:26,066 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/output.log
763
+ 2024-03-06 15:08:26,800 DEBUG SenderThread:137 [sender.py:send():382] send: stats
764
+ 2024-03-06 15:08:27,494 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
765
+ 2024-03-06 15:08:30,350 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
766
+ 2024-03-06 15:08:30,801 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
767
+ 2024-03-06 15:08:32,495 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
768
+ 2024-03-06 15:08:35,351 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
769
+ 2024-03-06 15:08:35,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
770
+ 2024-03-06 15:08:37,496 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
771
+ 2024-03-06 15:08:40,352 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report