sharukat commited on
Commit
aa5ce0c
·
verified ·
1 Parent(s): f3051d3

Training in progress, epoch 8

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0b05656e1052c5e5de8c3917d0744cf96448312e8f81f3380e15eccb74fc9808
3
  size 502675828
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eb455317e6e44818cd5895c227773b809a3117630c09ddc603402ced97e4add0
3
  size 502675828
runs/Mar06_15-06-49_41759fa8e6ad/events.out.tfevents.1709737609.41759fa8e6ad.34.4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82727860d80623db1233da432c77b672064d01dedddfcbfd300b54688f9deeb2
3
- size 9899
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0cb13f81c94f361a52ad50c0947a690717d63f5cfbe2275abd652e9e02fff9a1
3
+ size 10582
wandb/debug-internal.log CHANGED
@@ -896,3 +896,35 @@
896
  2024-03-06 15:10:48,908 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
897
  2024-03-06 15:10:50,376 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
898
  2024-03-06 15:10:50,877 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
896
  2024-03-06 15:10:48,908 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
897
  2024-03-06 15:10:50,376 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
898
  2024-03-06 15:10:50,877 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
899
+ 2024-03-06 15:10:53,909 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
900
+ 2024-03-06 15:10:55,377 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
901
+ 2024-03-06 15:10:55,878 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
902
+ 2024-03-06 15:10:56,804 DEBUG SenderThread:137 [sender.py:send():382] send: stats
903
+ 2024-03-06 15:10:58,910 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
904
+ 2024-03-06 15:11:00,378 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
905
+ 2024-03-06 15:11:01,806 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
906
+ 2024-03-06 15:11:03,911 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
907
+ 2024-03-06 15:11:05,379 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
908
+ 2024-03-06 15:11:06,806 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
909
+ 2024-03-06 15:11:07,830 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
910
+ 2024-03-06 15:11:07,831 DEBUG SenderThread:137 [sender.py:send():382] send: history
911
+ 2024-03-06 15:11:07,832 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
912
+ 2024-03-06 15:11:07,832 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
913
+ 2024-03-06 15:11:08,137 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
914
+ 2024-03-06 15:11:08,912 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
915
+ 2024-03-06 15:11:08,947 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
916
+ 2024-03-06 15:11:08,949 DEBUG SenderThread:137 [sender.py:send():382] send: history
917
+ 2024-03-06 15:11:08,949 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
918
+ 2024-03-06 15:11:08,950 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
919
+ 2024-03-06 15:11:09,137 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
920
+ 2024-03-06 15:11:10,138 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/output.log
921
+ 2024-03-06 15:11:10,380 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
922
+ 2024-03-06 15:11:11,951 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
923
+ 2024-03-06 15:11:13,975 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
924
+ 2024-03-06 15:11:15,380 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
925
+ 2024-03-06 15:11:16,952 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
926
+ 2024-03-06 15:11:19,031 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
927
+ 2024-03-06 15:11:20,381 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
928
+ 2024-03-06 15:11:21,953 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
929
+ 2024-03-06 15:11:24,032 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
930
+ 2024-03-06 15:11:25,382 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
wandb/run-20240306_145424-trm7fvg4/logs/debug-internal.log CHANGED
@@ -947,3 +947,35 @@ wandb.errors.AuthenticationError: The API key you provided is either invalid or
947
  2024-03-06 15:10:48,908 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
948
  2024-03-06 15:10:50,376 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
949
  2024-03-06 15:10:50,877 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
947
  2024-03-06 15:10:48,908 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
948
  2024-03-06 15:10:50,376 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
949
  2024-03-06 15:10:50,877 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
950
+ 2024-03-06 15:10:53,909 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
951
+ 2024-03-06 15:10:55,377 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
952
+ 2024-03-06 15:10:55,878 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
953
+ 2024-03-06 15:10:56,804 DEBUG SenderThread:137 [sender.py:send():382] send: stats
954
+ 2024-03-06 15:10:58,910 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
955
+ 2024-03-06 15:11:00,378 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
956
+ 2024-03-06 15:11:01,806 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
957
+ 2024-03-06 15:11:03,911 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
958
+ 2024-03-06 15:11:05,379 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
959
+ 2024-03-06 15:11:06,806 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
960
+ 2024-03-06 15:11:07,830 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
961
+ 2024-03-06 15:11:07,831 DEBUG SenderThread:137 [sender.py:send():382] send: history
962
+ 2024-03-06 15:11:07,832 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
963
+ 2024-03-06 15:11:07,832 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
964
+ 2024-03-06 15:11:08,137 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
965
+ 2024-03-06 15:11:08,912 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
966
+ 2024-03-06 15:11:08,947 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
967
+ 2024-03-06 15:11:08,949 DEBUG SenderThread:137 [sender.py:send():382] send: history
968
+ 2024-03-06 15:11:08,949 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
969
+ 2024-03-06 15:11:08,950 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
970
+ 2024-03-06 15:11:09,137 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
971
+ 2024-03-06 15:11:10,138 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/output.log
972
+ 2024-03-06 15:11:10,380 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
973
+ 2024-03-06 15:11:11,951 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
974
+ 2024-03-06 15:11:13,975 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
975
+ 2024-03-06 15:11:15,380 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
976
+ 2024-03-06 15:11:16,952 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
977
+ 2024-03-06 15:11:19,031 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
978
+ 2024-03-06 15:11:20,381 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
979
+ 2024-03-06 15:11:21,953 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
980
+ 2024-03-06 15:11:24,032 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
981
+ 2024-03-06 15:11:25,382 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
wandb/run-20240306_145455-h1uv5tyi/files/output.log CHANGED
@@ -51,3 +51,6 @@ Checkpoint destination directory /kaggle/working/checkpoint-124 already exists a
51
  _warn_prf(average, modifier, msg_start, len(result))
52
  Checkpoint destination directory /kaggle/working/checkpoint-186 already exists and is non-empty. Saving will proceed but saved results may be invalid.
53
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
 
 
 
 
51
  _warn_prf(average, modifier, msg_start, len(result))
52
  Checkpoint destination directory /kaggle/working/checkpoint-186 already exists and is non-empty. Saving will proceed but saved results may be invalid.
53
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
54
+ _warn_prf(average, modifier, msg_start, len(result))
55
+ /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
56
+ _warn_prf(average, modifier, msg_start, len(result))
wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json CHANGED
@@ -1 +1 @@
1
- {"train/loss": 1.4789, "train/grad_norm": 6.611419677734375, "train/learning_rate": 9.096774193548387e-06, "train/epoch": 7.0, "train/global_step": 217, "_timestamp": 1709737835.8675447, "_runtime": 940.1487877368927, "_step": 39, "eval/loss": 1.7304738759994507, "eval/accuracy": 0.4, "eval/precision": 0.3062720225510923, "eval/recall": 0.4, "eval/f1": 0.30165060745705913, "eval/runtime": 1.113, "eval/samples_per_second": 49.416, "eval/steps_per_second": 3.594, "train/train_runtime": 237.4526, "train/train_samples_per_second": 10.339, "train/train_steps_per_second": 1.306, "train/total_flos": 645966638976000.0, "train/train_loss": 1.7031736066264491}
 
1
+ {"train/loss": 1.4226, "train/grad_norm": 6.0385541915893555, "train/learning_rate": 6.096774193548387e-06, "train/epoch": 8.0, "train/global_step": 248, "_timestamp": 1709737868.9472039, "_runtime": 973.2284469604492, "_step": 41, "eval/loss": 1.7184381484985352, "eval/accuracy": 0.41818181818181815, "eval/precision": 0.37482517482517486, "eval/recall": 0.41818181818181815, "eval/f1": 0.3393939393939394, "eval/runtime": 1.1132, "eval/samples_per_second": 49.406, "eval/steps_per_second": 3.593, "train/train_runtime": 237.4526, "train/train_samples_per_second": 10.339, "train/train_steps_per_second": 1.306, "train/total_flos": 645966638976000.0, "train/train_loss": 1.7031736066264491}
wandb/run-20240306_145455-h1uv5tyi/logs/debug-internal.log CHANGED
@@ -896,3 +896,35 @@
896
  2024-03-06 15:10:48,908 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
897
  2024-03-06 15:10:50,376 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
898
  2024-03-06 15:10:50,877 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
896
  2024-03-06 15:10:48,908 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
897
  2024-03-06 15:10:50,376 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
898
  2024-03-06 15:10:50,877 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
899
+ 2024-03-06 15:10:53,909 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
900
+ 2024-03-06 15:10:55,377 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
901
+ 2024-03-06 15:10:55,878 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
902
+ 2024-03-06 15:10:56,804 DEBUG SenderThread:137 [sender.py:send():382] send: stats
903
+ 2024-03-06 15:10:58,910 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
904
+ 2024-03-06 15:11:00,378 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
905
+ 2024-03-06 15:11:01,806 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
906
+ 2024-03-06 15:11:03,911 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
907
+ 2024-03-06 15:11:05,379 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
908
+ 2024-03-06 15:11:06,806 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
909
+ 2024-03-06 15:11:07,830 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
910
+ 2024-03-06 15:11:07,831 DEBUG SenderThread:137 [sender.py:send():382] send: history
911
+ 2024-03-06 15:11:07,832 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
912
+ 2024-03-06 15:11:07,832 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
913
+ 2024-03-06 15:11:08,137 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
914
+ 2024-03-06 15:11:08,912 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
915
+ 2024-03-06 15:11:08,947 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: partial_history
916
+ 2024-03-06 15:11:08,949 DEBUG SenderThread:137 [sender.py:send():382] send: history
917
+ 2024-03-06 15:11:08,949 DEBUG SenderThread:137 [sender.py:send_request():409] send_request: summary_record
918
+ 2024-03-06 15:11:08,950 INFO SenderThread:137 [sender.py:_save_file():1403] saving file wandb-summary.json with policy end
919
+ 2024-03-06 15:11:09,137 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/wandb-summary.json
920
+ 2024-03-06 15:11:10,138 INFO Thread-18 :137 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240306_145455-h1uv5tyi/files/output.log
921
+ 2024-03-06 15:11:10,380 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
922
+ 2024-03-06 15:11:11,951 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
923
+ 2024-03-06 15:11:13,975 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
924
+ 2024-03-06 15:11:15,380 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
925
+ 2024-03-06 15:11:16,952 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
926
+ 2024-03-06 15:11:19,031 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
927
+ 2024-03-06 15:11:20,381 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
928
+ 2024-03-06 15:11:21,953 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report
929
+ 2024-03-06 15:11:24,032 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: keepalive
930
+ 2024-03-06 15:11:25,382 DEBUG HandlerThread:137 [handler.py:handle_request():146] handle_request: status_report