Model save
Browse files- README.md +2 -2
- model.safetensors +1 -1
- runs/Jan10_17-10-35_6af31f6f7309/events.out.tfevents.1704906635.6af31f6f7309.124.0 +2 -2
- wandb/debug-internal.log +25 -0
- wandb/run-20240110_171048-v6i8wmgc/files/config.yaml +20 -0
- wandb/run-20240110_171048-v6i8wmgc/files/wandb-summary.json +1 -1
- wandb/run-20240110_171048-v6i8wmgc/logs/debug-internal.log +25 -0
- wandb/run-20240110_171048-v6i8wmgc/run-v6i8wmgc.wandb +0 -0
README.md
CHANGED
|
@@ -38,7 +38,7 @@ The following hyperparameters were used during training:
|
|
| 38 |
- seed: 42
|
| 39 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
| 40 |
- lr_scheduler_type: linear
|
| 41 |
-
- num_epochs:
|
| 42 |
|
| 43 |
### Training results
|
| 44 |
|
|
@@ -46,7 +46,7 @@ The following hyperparameters were used during training:
|
|
| 46 |
|
| 47 |
### Framework versions
|
| 48 |
|
| 49 |
-
- Transformers 4.
|
| 50 |
- Pytorch 2.0.0
|
| 51 |
- Datasets 2.1.0
|
| 52 |
- Tokenizers 0.15.0
|
|
|
|
| 38 |
- seed: 42
|
| 39 |
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
| 40 |
- lr_scheduler_type: linear
|
| 41 |
+
- num_epochs: 400
|
| 42 |
|
| 43 |
### Training results
|
| 44 |
|
|
|
|
| 46 |
|
| 47 |
### Framework versions
|
| 48 |
|
| 49 |
+
- Transformers 4.36.0
|
| 50 |
- Pytorch 2.0.0
|
| 51 |
- Datasets 2.1.0
|
| 52 |
- Tokenizers 0.15.0
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 328693404
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:50e6785a073d3266714b3d0d0d226a3d53b500603c5680210689eb12c347361b
|
| 3 |
size 328693404
|
runs/Jan10_17-10-35_6af31f6f7309/events.out.tfevents.1704906635.6af31f6f7309.124.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:465099456e557eb26ae661ffa8c39187fb529a2b4fff03aa21653f97a094a32e
|
| 3 |
+
size 6289
|
wandb/debug-internal.log
CHANGED
|
@@ -484,3 +484,28 @@
|
|
| 484 |
2024-01-10 17:25:18,660 DEBUG SenderThread:290 [sender.py:send():382] send: stats
|
| 485 |
2024-01-10 17:25:21,551 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 486 |
2024-01-10 17:25:21,661 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 484 |
2024-01-10 17:25:18,660 DEBUG SenderThread:290 [sender.py:send():382] send: stats
|
| 485 |
2024-01-10 17:25:21,551 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 486 |
2024-01-10 17:25:21,661 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 487 |
+
2024-01-10 17:25:26,554 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 488 |
+
2024-01-10 17:25:26,662 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 489 |
+
2024-01-10 17:25:31,555 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 490 |
+
2024-01-10 17:25:31,662 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 491 |
+
2024-01-10 17:25:36,557 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 492 |
+
2024-01-10 17:25:36,663 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 493 |
+
2024-01-10 17:25:41,558 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 494 |
+
2024-01-10 17:25:41,664 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 495 |
+
2024-01-10 17:25:43,532 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: partial_history
|
| 496 |
+
2024-01-10 17:25:43,562 DEBUG SenderThread:290 [sender.py:send():382] send: metric
|
| 497 |
+
2024-01-10 17:25:43,562 DEBUG SenderThread:290 [sender.py:send():382] send: metric
|
| 498 |
+
2024-01-10 17:25:43,563 DEBUG SenderThread:290 [sender.py:send():382] send: metric
|
| 499 |
+
2024-01-10 17:25:43,563 DEBUG SenderThread:290 [sender.py:send():382] send: metric
|
| 500 |
+
2024-01-10 17:25:43,563 DEBUG SenderThread:290 [sender.py:send():382] send: metric
|
| 501 |
+
2024-01-10 17:25:43,564 DEBUG SenderThread:290 [sender.py:send():382] send: history
|
| 502 |
+
2024-01-10 17:25:43,564 DEBUG SenderThread:290 [sender.py:send_request():409] send_request: summary_record
|
| 503 |
+
2024-01-10 17:25:43,564 INFO SenderThread:290 [sender.py:_save_file():1392] saving file wandb-summary.json with policy end
|
| 504 |
+
2024-01-10 17:25:43,843 INFO Thread-12 :290 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240110_171048-v6i8wmgc/files/wandb-summary.json
|
| 505 |
+
2024-01-10 17:25:46,594 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 506 |
+
2024-01-10 17:25:47,571 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 507 |
+
2024-01-10 17:25:47,844 INFO Thread-12 :290 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240110_171048-v6i8wmgc/files/config.yaml
|
| 508 |
+
2024-01-10 17:25:48,661 DEBUG SenderThread:290 [sender.py:send():382] send: stats
|
| 509 |
+
2024-01-10 17:25:51,595 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 510 |
+
2024-01-10 17:25:53,662 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 511 |
+
2024-01-10 17:25:56,596 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
wandb/run-20240110_171048-v6i8wmgc/files/config.yaml
CHANGED
|
@@ -66,6 +66,26 @@ _wandb:
|
|
| 66 |
5: 1
|
| 67 |
6:
|
| 68 |
- 1
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 69 |
return_dict:
|
| 70 |
desc: null
|
| 71 |
value: true
|
|
|
|
| 66 |
5: 1
|
| 67 |
6:
|
| 68 |
- 1
|
| 69 |
+
- 1: train/train_runtime
|
| 70 |
+
5: 1
|
| 71 |
+
6:
|
| 72 |
+
- 1
|
| 73 |
+
- 1: train/train_samples_per_second
|
| 74 |
+
5: 1
|
| 75 |
+
6:
|
| 76 |
+
- 1
|
| 77 |
+
- 1: train/train_steps_per_second
|
| 78 |
+
5: 1
|
| 79 |
+
6:
|
| 80 |
+
- 1
|
| 81 |
+
- 1: train/total_flos
|
| 82 |
+
5: 1
|
| 83 |
+
6:
|
| 84 |
+
- 1
|
| 85 |
+
- 1: train/train_loss
|
| 86 |
+
5: 1
|
| 87 |
+
6:
|
| 88 |
+
- 1
|
| 89 |
return_dict:
|
| 90 |
desc: null
|
| 91 |
value: true
|
wandb/run-20240110_171048-v6i8wmgc/files/wandb-summary.json
CHANGED
|
@@ -1 +1 @@
|
|
| 1 |
-
{"train/loss": 0.4506, "train/learning_rate": 7.692307692307694e-07, "train/epoch":
|
|
|
|
| 1 |
+
{"train/loss": 0.4506, "train/learning_rate": 7.692307692307694e-07, "train/epoch": 400.0, "train/global_step": 5200, "_timestamp": 1704907543.531435, "_runtime": 895.5191690921783, "_step": 10, "train/train_runtime": 907.945, "train/train_samples_per_second": 88.111, "train/train_steps_per_second": 5.727, "train/total_flos": 998967541507056.0, "train/train_loss": 1.1194059283916766}
|
wandb/run-20240110_171048-v6i8wmgc/logs/debug-internal.log
CHANGED
|
@@ -484,3 +484,28 @@
|
|
| 484 |
2024-01-10 17:25:18,660 DEBUG SenderThread:290 [sender.py:send():382] send: stats
|
| 485 |
2024-01-10 17:25:21,551 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 486 |
2024-01-10 17:25:21,661 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 484 |
2024-01-10 17:25:18,660 DEBUG SenderThread:290 [sender.py:send():382] send: stats
|
| 485 |
2024-01-10 17:25:21,551 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 486 |
2024-01-10 17:25:21,661 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 487 |
+
2024-01-10 17:25:26,554 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 488 |
+
2024-01-10 17:25:26,662 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 489 |
+
2024-01-10 17:25:31,555 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 490 |
+
2024-01-10 17:25:31,662 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 491 |
+
2024-01-10 17:25:36,557 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 492 |
+
2024-01-10 17:25:36,663 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 493 |
+
2024-01-10 17:25:41,558 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 494 |
+
2024-01-10 17:25:41,664 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 495 |
+
2024-01-10 17:25:43,532 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: partial_history
|
| 496 |
+
2024-01-10 17:25:43,562 DEBUG SenderThread:290 [sender.py:send():382] send: metric
|
| 497 |
+
2024-01-10 17:25:43,562 DEBUG SenderThread:290 [sender.py:send():382] send: metric
|
| 498 |
+
2024-01-10 17:25:43,563 DEBUG SenderThread:290 [sender.py:send():382] send: metric
|
| 499 |
+
2024-01-10 17:25:43,563 DEBUG SenderThread:290 [sender.py:send():382] send: metric
|
| 500 |
+
2024-01-10 17:25:43,563 DEBUG SenderThread:290 [sender.py:send():382] send: metric
|
| 501 |
+
2024-01-10 17:25:43,564 DEBUG SenderThread:290 [sender.py:send():382] send: history
|
| 502 |
+
2024-01-10 17:25:43,564 DEBUG SenderThread:290 [sender.py:send_request():409] send_request: summary_record
|
| 503 |
+
2024-01-10 17:25:43,564 INFO SenderThread:290 [sender.py:_save_file():1392] saving file wandb-summary.json with policy end
|
| 504 |
+
2024-01-10 17:25:43,843 INFO Thread-12 :290 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240110_171048-v6i8wmgc/files/wandb-summary.json
|
| 505 |
+
2024-01-10 17:25:46,594 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 506 |
+
2024-01-10 17:25:47,571 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 507 |
+
2024-01-10 17:25:47,844 INFO Thread-12 :290 [dir_watcher.py:_on_file_modified():288] file/dir modified: /kaggle/working/wandb/run-20240110_171048-v6i8wmgc/files/config.yaml
|
| 508 |
+
2024-01-10 17:25:48,661 DEBUG SenderThread:290 [sender.py:send():382] send: stats
|
| 509 |
+
2024-01-10 17:25:51,595 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
| 510 |
+
2024-01-10 17:25:53,662 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: status_report
|
| 511 |
+
2024-01-10 17:25:56,596 DEBUG HandlerThread:290 [handler.py:handle_request():146] handle_request: keepalive
|
wandb/run-20240110_171048-v6i8wmgc/run-v6i8wmgc.wandb
CHANGED
|
Binary files a/wandb/run-20240110_171048-v6i8wmgc/run-v6i8wmgc.wandb and b/wandb/run-20240110_171048-v6i8wmgc/run-v6i8wmgc.wandb differ
|
|
|