Commit ·
deee812
1
Parent(s): 31f3c0b
Training in progress, epoch 1
Browse files- model.safetensors +1 -1
- run-3/checkpoint-272/model.safetensors +1 -1
- run-3/checkpoint-272/optimizer.pt +1 -1
- run-3/checkpoint-272/rng_state.pth +2 -2
- run-3/checkpoint-272/scheduler.pt +1 -1
- run-3/checkpoint-272/tokenizer.json +2 -2
- run-3/checkpoint-272/tokenizer_config.json +1 -1
- run-3/checkpoint-272/trainer_state.json +10 -10
- run-3/checkpoint-272/training_args.bin +1 -1
- runs/Dec01_22-15-05_9632749e57d1/events.out.tfevents.1701469520.9632749e57d1.10239.3 +3 -0
- training_args.bin +1 -1
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 498692800
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f18a9c17794dcc64794600f514a20ec18ee99383447802910963fbc3fbd74a5
|
| 3 |
size 498692800
|
run-3/checkpoint-272/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 498692800
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1f18a9c17794dcc64794600f514a20ec18ee99383447802910963fbc3fbd74a5
|
| 3 |
size 498692800
|
run-3/checkpoint-272/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 997505402
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b25566a8dc0ae19360e446f27c6cff0afae23e4afeeaa3cf14ea0e99b9857a3b
|
| 3 |
size 997505402
|
run-3/checkpoint-272/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3646b4cdcd364d917497fd74fcfe29f7162e919c3f979cdb24aebb68f1f7cf36
|
| 3 |
+
size 14308
|
run-3/checkpoint-272/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:79a25765cf01b8c285d64615aacbe0ee01a4e20cc23d32d1d6fed0a37344b0cc
|
| 3 |
size 1064
|
run-3/checkpoint-272/tokenizer.json
CHANGED
|
@@ -2,13 +2,13 @@
|
|
| 2 |
"version": "1.0",
|
| 3 |
"truncation": {
|
| 4 |
"direction": "Right",
|
| 5 |
-
"max_length":
|
| 6 |
"strategy": "LongestFirst",
|
| 7 |
"stride": 0
|
| 8 |
},
|
| 9 |
"padding": {
|
| 10 |
"strategy": {
|
| 11 |
-
"Fixed":
|
| 12 |
},
|
| 13 |
"direction": "Right",
|
| 14 |
"pad_to_multiple_of": null,
|
|
|
|
| 2 |
"version": "1.0",
|
| 3 |
"truncation": {
|
| 4 |
"direction": "Right",
|
| 5 |
+
"max_length": 128,
|
| 6 |
"strategy": "LongestFirst",
|
| 7 |
"stride": 0
|
| 8 |
},
|
| 9 |
"padding": {
|
| 10 |
"strategy": {
|
| 11 |
+
"Fixed": 128
|
| 12 |
},
|
| 13 |
"direction": "Right",
|
| 14 |
"pad_to_multiple_of": null,
|
run-3/checkpoint-272/tokenizer_config.json
CHANGED
|
@@ -49,7 +49,7 @@
|
|
| 49 |
"eos_token": "</s>",
|
| 50 |
"errors": "replace",
|
| 51 |
"mask_token": "<mask>",
|
| 52 |
-
"model_max_length":
|
| 53 |
"pad_token": "<pad>",
|
| 54 |
"sep_token": "</s>",
|
| 55 |
"tokenizer_class": "RobertaTokenizer",
|
|
|
|
| 49 |
"eos_token": "</s>",
|
| 50 |
"errors": "replace",
|
| 51 |
"mask_token": "<mask>",
|
| 52 |
+
"model_max_length": 128,
|
| 53 |
"pad_token": "<pad>",
|
| 54 |
"sep_token": "</s>",
|
| 55 |
"tokenizer_class": "RobertaTokenizer",
|
run-3/checkpoint-272/trainer_state.json
CHANGED
|
@@ -11,23 +11,23 @@
|
|
| 11 |
{
|
| 12 |
"epoch": 1.0,
|
| 13 |
"eval_f1": 0.0,
|
| 14 |
-
"eval_loss": 0.
|
| 15 |
-
"eval_runtime":
|
| 16 |
-
"eval_samples_per_second":
|
| 17 |
-
"eval_steps_per_second":
|
| 18 |
"step": 272
|
| 19 |
}
|
| 20 |
],
|
| 21 |
"logging_steps": 500,
|
| 22 |
-
"max_steps":
|
| 23 |
-
"num_train_epochs":
|
| 24 |
"save_steps": 500,
|
| 25 |
"total_flos": 0,
|
| 26 |
"trial_name": null,
|
| 27 |
"trial_params": {
|
| 28 |
-
"learning_rate":
|
| 29 |
-
"num_train_epochs":
|
| 30 |
-
"per_device_train_batch_size":
|
| 31 |
-
"seed":
|
| 32 |
}
|
| 33 |
}
|
|
|
|
| 11 |
{
|
| 12 |
"epoch": 1.0,
|
| 13 |
"eval_f1": 0.0,
|
| 14 |
+
"eval_loss": 0.15121705830097198,
|
| 15 |
+
"eval_runtime": 1.7687,
|
| 16 |
+
"eval_samples_per_second": 153.22,
|
| 17 |
+
"eval_steps_per_second": 1.131,
|
| 18 |
"step": 272
|
| 19 |
}
|
| 20 |
],
|
| 21 |
"logging_steps": 500,
|
| 22 |
+
"max_steps": 272,
|
| 23 |
+
"num_train_epochs": 1,
|
| 24 |
"save_steps": 500,
|
| 25 |
"total_flos": 0,
|
| 26 |
"trial_name": null,
|
| 27 |
"trial_params": {
|
| 28 |
+
"learning_rate": 3.4549942125392434e-05,
|
| 29 |
+
"num_train_epochs": 1,
|
| 30 |
+
"per_device_train_batch_size": 8,
|
| 31 |
+
"seed": 32
|
| 32 |
}
|
| 33 |
}
|
run-3/checkpoint-272/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4600
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a860ef08b878fc8a841fef69af13e56850d256386ceb720646e3b321efbbe86b
|
| 3 |
size 4600
|
runs/Dec01_22-15-05_9632749e57d1/events.out.tfevents.1701469520.9632749e57d1.10239.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:65e7551c3de41ea0f263bb3bdfb4bc35cf1a3072cc23a1ef12e69a26d9dee0d7
|
| 3 |
+
size 6092
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4600
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a860ef08b878fc8a841fef69af13e56850d256386ceb720646e3b321efbbe86b
|
| 3 |
size 4600
|