Training in progress, epoch 2
Browse files- model.safetensors +1 -1
- runs/Mar06_15-06-49_41759fa8e6ad/events.out.tfevents.1709737609.41759fa8e6ad.34.4 +2 -2
- wandb/debug-internal.log +32 -0
- wandb/run-20240306_145424-trm7fvg4/logs/debug-internal.log +32 -0
- wandb/run-20240306_145455-h1uv5tyi/files/output.log +3 -0
- wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json +1 -1
- wandb/run-20240306_145455-h1uv5tyi/logs/debug-internal.log +32 -0
- wandb/run-20240306_145455-h1uv5tyi/run-h1uv5tyi.wandb +0 -0
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 502675828
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6c3dd47b4c910468e268d03db7d5f3bef3a00253c6ade9204cfd15cf73968149
|
| 3 |
size 502675828
|
runs/Mar06_15-06-49_41759fa8e6ad/events.out.tfevents.1709737609.41759fa8e6ad.34.4
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:997076216899c04f517674f013430d160c7582ddfa4cc8c986d74d9741ca7ec2
|
| 3 |
+
size 6510
|
wandb/debug-internal.log
CHANGED
|
@@ -707,3 +707,35 @@
|
|
| 707 |
2024-03-06 15:07:31,922 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 708 |
2024-03-06 15:07:33,800 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 709 |
2024-03-06 15:07:35,340 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 707 |
2024-03-06 15:07:31,922 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 708 |
2024-03-06 15:07:33,800 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 709 |
2024-03-06 15:07:35,340 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 710 |
+
2024-03-06 15:07:36,923 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 711 |
+
2024-03-06 15:07:38,801 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 712 |
+
2024-03-06 15:07:40,341 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 713 |
+
2024-03-06 15:07:41,924 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 714 |
+
2024-03-06 15:07:43,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 715 |
+
2024-03-06 15:07:45,343 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 716 |
+
2024-03-06 15:07:46,925 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 717 |
+
2024-03-06 15:07:48,803 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 718 |
+
2024-03-06 15:07:50,190 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
|
| 719 |
+
2024-03-06 15:07:50,191 DEBUG SenderThread:137 [sender.py:send():382] send: history
|
| 720 |
+
2024-03-06 15:07:50,191 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
|
| 721 |
+
2024-03-06 15:07:50,192 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
|
| 722 |
+
2024-03-06 15:07:50,343 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 723 |
+
2024-03-06 15:07:51,049 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
|
| 724 |
+
2024-03-06 15:07:51,303 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
|
| 725 |
+
2024-03-06 15:07:51,305 DEBUG SenderThread:137 [sender.py:send():382] send: history
|
| 726 |
+
2024-03-06 15:07:51,305 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
|
| 727 |
+
2024-03-06 15:07:51,306 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
|
| 728 |
+
2024-03-06 15:07:52,049 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
|
| 729 |
+
2024-03-06 15:07:52,385 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 730 |
+
2024-03-06 15:07:54,050 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/output.log
|
| 731 |
+
2024-03-06 15:07:54,308 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 732 |
+
2024-03-06 15:07:55,344 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 733 |
+
2024-03-06 15:07:56,799 DEBUG SenderThread:137 [sender.py:send():382] send: stats
|
| 734 |
+
2024-03-06 15:07:57,427 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 735 |
+
2024-03-06 15:07:59,800 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 736 |
+
2024-03-06 15:08:00,345 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 737 |
+
2024-03-06 15:08:02,430 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 738 |
+
2024-03-06 15:08:04,801 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 739 |
+
2024-03-06 15:08:05,345 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 740 |
+
2024-03-06 15:08:07,431 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 741 |
+
2024-03-06 15:08:09,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
wandb/run-20240306_145424-trm7fvg4/logs/debug-internal.log
CHANGED
|
@@ -758,3 +758,35 @@ wandb.errors.AuthenticationError: The API key you provided is either invalid or
|
|
| 758 |
2024-03-06 15:07:31,922 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 759 |
2024-03-06 15:07:33,800 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 760 |
2024-03-06 15:07:35,340 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 758 |
2024-03-06 15:07:31,922 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 759 |
2024-03-06 15:07:33,800 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 760 |
2024-03-06 15:07:35,340 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 761 |
+
2024-03-06 15:07:36,923 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 762 |
+
2024-03-06 15:07:38,801 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 763 |
+
2024-03-06 15:07:40,341 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 764 |
+
2024-03-06 15:07:41,924 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 765 |
+
2024-03-06 15:07:43,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 766 |
+
2024-03-06 15:07:45,343 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 767 |
+
2024-03-06 15:07:46,925 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 768 |
+
2024-03-06 15:07:48,803 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 769 |
+
2024-03-06 15:07:50,190 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
|
| 770 |
+
2024-03-06 15:07:50,191 DEBUG SenderThread:137 [sender.py:send():382] send: history
|
| 771 |
+
2024-03-06 15:07:50,191 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
|
| 772 |
+
2024-03-06 15:07:50,192 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
|
| 773 |
+
2024-03-06 15:07:50,343 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 774 |
+
2024-03-06 15:07:51,049 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
|
| 775 |
+
2024-03-06 15:07:51,303 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
|
| 776 |
+
2024-03-06 15:07:51,305 DEBUG SenderThread:137 [sender.py:send():382] send: history
|
| 777 |
+
2024-03-06 15:07:51,305 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
|
| 778 |
+
2024-03-06 15:07:51,306 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
|
| 779 |
+
2024-03-06 15:07:52,049 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
|
| 780 |
+
2024-03-06 15:07:52,385 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 781 |
+
2024-03-06 15:07:54,050 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/output.log
|
| 782 |
+
2024-03-06 15:07:54,308 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 783 |
+
2024-03-06 15:07:55,344 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 784 |
+
2024-03-06 15:07:56,799 DEBUG SenderThread:137 [sender.py:send():382] send: stats
|
| 785 |
+
2024-03-06 15:07:57,427 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 786 |
+
2024-03-06 15:07:59,800 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 787 |
+
2024-03-06 15:08:00,345 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 788 |
+
2024-03-06 15:08:02,430 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 789 |
+
2024-03-06 15:08:04,801 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 790 |
+
2024-03-06 15:08:05,345 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 791 |
+
2024-03-06 15:08:07,431 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 792 |
+
2024-03-06 15:08:09,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
wandb/run-20240306_145455-h1uv5tyi/files/output.log
CHANGED
|
@@ -36,3 +36,6 @@ You should probably TRAIN this model on a down-stream task to be able to use it
|
|
| 36 |
Some weights of MegatronBertForSequenceClassification were not initialized from the model checkpoint at mmukh/SOBertBase and are newly initialized: ['bert.embeddings.token_type_embeddings.weight', 'bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
|
| 37 |
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
|
| 38 |
/opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
|
|
|
|
|
|
|
|
|
|
|
|
| 36 |
Some weights of MegatronBertForSequenceClassification were not initialized from the model checkpoint at mmukh/SOBertBase and are newly initialized: ['bert.embeddings.token_type_embeddings.weight', 'bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'classifier.bias', 'classifier.weight']
|
| 37 |
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
|
| 38 |
/opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
|
| 39 |
+
_warn_prf(average, modifier, msg_start, len(result))
|
| 40 |
+
/opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
|
| 41 |
+
_warn_prf(average, modifier, msg_start, len(result))
|
wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"train/loss": 1.
|
|
|
|
| 1 |
+
{"train/loss": 1.7527, "train/grad_norm": 5.8667988777160645, "train/learning_rate": 2.4e-05, "train/epoch": 2.0, "train/global_step": 62, "_timestamp": 1709737671.3031292, "_runtime": 775.5843722820282, "_step": 29, "eval/loss": 1.773923397064209, "eval/accuracy": 0.34545454545454546, "eval/precision": 0.11933884297520661, "eval/recall": 0.34545454545454546, "eval/f1": 0.17739557739557738, "eval/runtime": 1.1095, "eval/samples_per_second": 49.57, "eval/steps_per_second": 3.605, "train/train_runtime": 237.4526, "train/train_samples_per_second": 10.339, "train/train_steps_per_second": 1.306, "train/total_flos": 645966638976000.0, "train/train_loss": 1.7031736066264491}
|
wandb/run-20240306_145455-h1uv5tyi/logs/debug-internal.log
CHANGED
|
@@ -707,3 +707,35 @@
|
|
| 707 |
2024-03-06 15:07:31,922 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 708 |
2024-03-06 15:07:33,800 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 709 |
2024-03-06 15:07:35,340 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 707 |
2024-03-06 15:07:31,922 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 708 |
2024-03-06 15:07:33,800 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 709 |
2024-03-06 15:07:35,340 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 710 |
+
2024-03-06 15:07:36,923 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 711 |
+
2024-03-06 15:07:38,801 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 712 |
+
2024-03-06 15:07:40,341 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 713 |
+
2024-03-06 15:07:41,924 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 714 |
+
2024-03-06 15:07:43,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 715 |
+
2024-03-06 15:07:45,343 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 716 |
+
2024-03-06 15:07:46,925 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 717 |
+
2024-03-06 15:07:48,803 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 718 |
+
2024-03-06 15:07:50,190 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
|
| 719 |
+
2024-03-06 15:07:50,191 DEBUG SenderThread:137 [sender.py:send():382] send: history
|
| 720 |
+
2024-03-06 15:07:50,191 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
|
| 721 |
+
2024-03-06 15:07:50,192 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
|
| 722 |
+
2024-03-06 15:07:50,343 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 723 |
+
2024-03-06 15:07:51,049 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
|
| 724 |
+
2024-03-06 15:07:51,303 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
|
| 725 |
+
2024-03-06 15:07:51,305 DEBUG SenderThread:137 [sender.py:send():382] send: history
|
| 726 |
+
2024-03-06 15:07:51,305 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
|
| 727 |
+
2024-03-06 15:07:51,306 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
|
| 728 |
+
2024-03-06 15:07:52,049 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
|
| 729 |
+
2024-03-06 15:07:52,385 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 730 |
+
2024-03-06 15:07:54,050 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/output.log
|
| 731 |
+
2024-03-06 15:07:54,308 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 732 |
+
2024-03-06 15:07:55,344 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 733 |
+
2024-03-06 15:07:56,799 DEBUG SenderThread:137 [sender.py:send():382] send: stats
|
| 734 |
+
2024-03-06 15:07:57,427 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 735 |
+
2024-03-06 15:07:59,800 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 736 |
+
2024-03-06 15:08:00,345 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 737 |
+
2024-03-06 15:08:02,430 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 738 |
+
2024-03-06 15:08:04,801 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 739 |
+
2024-03-06 15:08:05,345 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
| 740 |
+
2024-03-06 15:08:07,431 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
|
| 741 |
+
2024-03-06 15:08:09,802 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
|
wandb/run-20240306_145455-h1uv5tyi/run-h1uv5tyi.wandb
CHANGED
|
Binary files a/wandb/run-20240306_145455-h1uv5tyi/run-h1uv5tyi.wandb and b/wandb/run-20240306_145455-h1uv5tyi/run-h1uv5tyi.wandb differ
|
|
|