sharukat commited on
Commit
4e982c1
·
verified ·
1 Parent(s): 563e70d

Training in progress, epoch 2

Browse files
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7f32bd9201f86bc9fb8c4e9d255d1b876209f641dbd6b9464fded038413d3c76
3
  size 596114452
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc9377fc78fec87d4d2a3e3ee34912159c9f3a17e95f81b6df19d0cc5f1250fb
3
  size 596114452
runs/Apr10_16-17-22_ae604480b8c9/events.out.tfevents.1712765843.ae604480b8c9.34.4 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:00e26802e615e75e71a61425bab2310dfd2f53924b9f6c49f39ea6051d4c68ce
3
- size 5966
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15cdd3b337bd2d705f1ad71a9615b390dc8b69a9bb14a22a4eb1f85fab853d2d
3
+ size 6636
wandb/debug-internal.log CHANGED
@@ -1459,3 +1459,40 @@ subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after
1459
  2024-04-10 16:18:37,716 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: stop_status
1460
  2024-04-10 16:18:37,716 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: stop_status
1461
  2024-04-10 16:18:40,900 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1459
  2024-04-10 16:18:37,716 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: stop_status
1460
  2024-04-10 16:18:37,716 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: stop_status
1461
  2024-04-10 16:18:40,900 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1462
+ 2024-04-10 16:18:45,910 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1463
+ 2024-04-10 16:18:46,727 INFO Thread-12 :98 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_155650-albqrbhg/files/config.yaml
1464
+ 2024-04-10 16:18:51,046 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1465
+ 2024-04-10 16:18:51,878 DEBUG SenderThread:98 [sender.py:send():379] send: stats
1466
+ 2024-04-10 16:18:52,440 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: internal_messages
1467
+ 2024-04-10 16:18:52,716 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: stop_status
1468
+ 2024-04-10 16:18:52,716 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: stop_status
1469
+ 2024-04-10 16:18:56,868 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1470
+ 2024-04-10 16:19:01,869 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1471
+ 2024-04-10 16:19:06,870 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1472
+ 2024-04-10 16:19:07,448 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: internal_messages
1473
+ 2024-04-10 16:19:07,716 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: stop_status
1474
+ 2024-04-10 16:19:07,716 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: stop_status
1475
+ 2024-04-10 16:19:12,803 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1476
+ 2024-04-10 16:19:17,150 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: partial_history
1477
+ 2024-04-10 16:19:17,152 DEBUG SenderThread:98 [sender.py:send():379] send: history
1478
+ 2024-04-10 16:19:17,152 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: summary_record
1479
+ 2024-04-10 16:19:17,154 INFO SenderThread:98 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
1480
+ 2024-04-10 16:19:17,739 INFO Thread-12 :98 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_155650-albqrbhg/files/wandb-summary.json
1481
+ 2024-04-10 16:19:18,154 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1482
+ 2024-04-10 16:19:21,879 DEBUG SenderThread:98 [sender.py:send():379] send: stats
1483
+ 2024-04-10 16:19:22,447 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: internal_messages
1484
+ 2024-04-10 16:19:22,493 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: partial_history
1485
+ 2024-04-10 16:19:22,495 DEBUG SenderThread:98 [sender.py:send():379] send: history
1486
+ 2024-04-10 16:19:22,495 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: summary_record
1487
+ 2024-04-10 16:19:22,495 INFO SenderThread:98 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
1488
+ 2024-04-10 16:19:22,716 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: stop_status
1489
+ 2024-04-10 16:19:22,717 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: stop_status
1490
+ 2024-04-10 16:19:22,742 INFO Thread-12 :98 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_155650-albqrbhg/files/wandb-summary.json
1491
+ 2024-04-10 16:19:23,742 INFO Thread-12 :98 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_155650-albqrbhg/files/output.log
1492
+ 2024-04-10 16:19:23,808 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1493
+ 2024-04-10 16:19:28,809 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1494
+ 2024-04-10 16:19:33,811 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1495
+ 2024-04-10 16:19:37,447 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: internal_messages
1496
+ 2024-04-10 16:19:37,716 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: stop_status
1497
+ 2024-04-10 16:19:37,717 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: stop_status
1498
+ 2024-04-10 16:19:38,846 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
wandb/run-20240410_155650-albqrbhg/files/config.yaml CHANGED
@@ -74,6 +74,38 @@ _wandb:
74
  5: 1
75
  6:
76
  - 1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
77
  return_dict:
78
  desc: null
79
  value: true
 
74
  5: 1
75
  6:
76
  - 1
77
+ - 1: eval/loss
78
+ 5: 1
79
+ 6:
80
+ - 1
81
+ - 1: eval/accuracy
82
+ 5: 1
83
+ 6:
84
+ - 1
85
+ - 1: eval/precision
86
+ 5: 1
87
+ 6:
88
+ - 1
89
+ - 1: eval/recall
90
+ 5: 1
91
+ 6:
92
+ - 1
93
+ - 1: eval/f1
94
+ 5: 1
95
+ 6:
96
+ - 1
97
+ - 1: eval/runtime
98
+ 5: 1
99
+ 6:
100
+ - 1
101
+ - 1: eval/samples_per_second
102
+ 5: 1
103
+ 6:
104
+ - 1
105
+ - 1: eval/steps_per_second
106
+ 5: 1
107
+ 6:
108
+ - 1
109
  return_dict:
110
  desc: null
111
  value: true
wandb/run-20240410_155650-albqrbhg/files/output.log CHANGED
@@ -84,4 +84,6 @@ You should probably TRAIN this model on a down-stream task to be able to use it
84
  /opt/conda/lib/python3.10/site-packages/accelerate/accelerator.py:432: FutureWarning: Passing the following arguments to `Accelerator` is deprecated and will be removed in version 1.0 of Accelerate: dict_keys(['dispatch_batches', 'split_batches', 'even_batches', 'use_seedable_sampler']). Please pass an `accelerate.DataLoaderConfiguration` instead:
85
  dataloader_config = DataLoaderConfiguration(dispatch_batches=None, split_batches=False, even_batches=True, use_seedable_sampler=True)
86
  warnings.warn(
 
 
87
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
 
84
  /opt/conda/lib/python3.10/site-packages/accelerate/accelerator.py:432: FutureWarning: Passing the following arguments to `Accelerator` is deprecated and will be removed in version 1.0 of Accelerate: dict_keys(['dispatch_batches', 'split_batches', 'even_batches', 'use_seedable_sampler']). Please pass an `accelerate.DataLoaderConfiguration` instead:
85
  dataloader_config = DataLoaderConfiguration(dispatch_batches=None, split_batches=False, even_batches=True, use_seedable_sampler=True)
86
  warnings.warn(
87
+ /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
88
+ _warn_prf(average, modifier, msg_start, len(result))
89
  /opt/conda/lib/python3.10/site-packages/sklearn/metrics/_classification.py:1344: UndefinedMetricWarning: Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples. Use `zero_division` parameter to control this behavior.
wandb/run-20240410_155650-albqrbhg/files/wandb-summary.json CHANGED
@@ -1 +1 @@
1
- {"train/loss": 1.9459, "train/grad_norm": 6.674560546875, "train/learning_rate": 8.000000000000001e-06, "train/epoch": 1.0, "train/global_step": 59, "_timestamp": 1712765900.9632816, "_runtime": 1290.6948807239532, "_step": 3, "eval/loss": 1.9451844692230225, "eval/accuracy": 0.2112676056338028, "eval/precision": 0.030181086519114688, "eval/recall": 0.14285714285714285, "eval/f1": 0.04983388704318937, "eval/runtime": 5.393, "eval/samples_per_second": 26.33, "eval/steps_per_second": 1.669}
 
1
+ {"train/loss": 1.9323, "train/grad_norm": 6.981883525848389, "train/learning_rate": 6e-06, "train/epoch": 2.0, "train/global_step": 118, "_timestamp": 1712765962.4548702, "_runtime": 1352.1864693164825, "_step": 5, "eval/loss": 1.9262523651123047, "eval/accuracy": 0.19718309859154928, "eval/precision": 0.02816901408450704, "eval/recall": 0.14285714285714285, "eval/f1": 0.047058823529411764, "eval/runtime": 5.3003, "eval/samples_per_second": 26.791, "eval/steps_per_second": 1.698}
wandb/run-20240410_155650-albqrbhg/logs/debug-internal.log CHANGED
@@ -1459,3 +1459,40 @@ subprocess.TimeoutExpired: Command '['conda', 'env', 'export']' timed out after
1459
  2024-04-10 16:18:37,716 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: stop_status
1460
  2024-04-10 16:18:37,716 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: stop_status
1461
  2024-04-10 16:18:40,900 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1459
  2024-04-10 16:18:37,716 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: stop_status
1460
  2024-04-10 16:18:37,716 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: stop_status
1461
  2024-04-10 16:18:40,900 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1462
+ 2024-04-10 16:18:45,910 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1463
+ 2024-04-10 16:18:46,727 INFO Thread-12 :98 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_155650-albqrbhg/files/config.yaml
1464
+ 2024-04-10 16:18:51,046 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1465
+ 2024-04-10 16:18:51,878 DEBUG SenderThread:98 [sender.py:send():379] send: stats
1466
+ 2024-04-10 16:18:52,440 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: internal_messages
1467
+ 2024-04-10 16:18:52,716 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: stop_status
1468
+ 2024-04-10 16:18:52,716 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: stop_status
1469
+ 2024-04-10 16:18:56,868 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1470
+ 2024-04-10 16:19:01,869 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1471
+ 2024-04-10 16:19:06,870 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1472
+ 2024-04-10 16:19:07,448 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: internal_messages
1473
+ 2024-04-10 16:19:07,716 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: stop_status
1474
+ 2024-04-10 16:19:07,716 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: stop_status
1475
+ 2024-04-10 16:19:12,803 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1476
+ 2024-04-10 16:19:17,150 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: partial_history
1477
+ 2024-04-10 16:19:17,152 DEBUG SenderThread:98 [sender.py:send():379] send: history
1478
+ 2024-04-10 16:19:17,152 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: summary_record
1479
+ 2024-04-10 16:19:17,154 INFO SenderThread:98 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
1480
+ 2024-04-10 16:19:17,739 INFO Thread-12 :98 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_155650-albqrbhg/files/wandb-summary.json
1481
+ 2024-04-10 16:19:18,154 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1482
+ 2024-04-10 16:19:21,879 DEBUG SenderThread:98 [sender.py:send():379] send: stats
1483
+ 2024-04-10 16:19:22,447 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: internal_messages
1484
+ 2024-04-10 16:19:22,493 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: partial_history
1485
+ 2024-04-10 16:19:22,495 DEBUG SenderThread:98 [sender.py:send():379] send: history
1486
+ 2024-04-10 16:19:22,495 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: summary_record
1487
+ 2024-04-10 16:19:22,495 INFO SenderThread:98 [sender.py:_save_file():1390] saving file wandb-summary.json with policy end
1488
+ 2024-04-10 16:19:22,716 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: stop_status
1489
+ 2024-04-10 16:19:22,717 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: stop_status
1490
+ 2024-04-10 16:19:22,742 INFO Thread-12 :98 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_155650-albqrbhg/files/wandb-summary.json
1491
+ 2024-04-10 16:19:23,742 INFO Thread-12 :98 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240410_155650-albqrbhg/files/output.log
1492
+ 2024-04-10 16:19:23,808 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1493
+ 2024-04-10 16:19:28,809 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1494
+ 2024-04-10 16:19:33,811 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report
1495
+ 2024-04-10 16:19:37,447 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: internal_messages
1496
+ 2024-04-10 16:19:37,716 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: stop_status
1497
+ 2024-04-10 16:19:37,717 DEBUG SenderThread:98 [sender.py:send_request():406] send_request: stop_status
1498
+ 2024-04-10 16:19:38,846 DEBUG HandlerThread:98 [handler.py:handle_request():146] handle_request: status_report