Saving weights and logs of step 5000
Browse files
- config.json +1 -1
- events.out.tfevents.1639431874.t1v-n-ccbf3e94-w-0.1053519.3.v2 +3 -0
- flax_model.msgpack +1 -1
- run_w5_long.sh +3 -1
config.json
CHANGED
@@ -1,5 +1,5 @@
 {
-"_name_or_path": "
+"_name_or_path": "./",
 "architectures": [
 "RobertaForMaskedLM"
 ],
events.out.tfevents.1639431874.t1v-n-ccbf3e94-w-0.1053519.3.v2
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:68887780af1577a229cee0ce20bb9da8be2c8465ca4f2b6508402c6256754f4a
+size 735136
flax_model.msgpack
CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:
+oid sha256:9ff2cd2aa2ccf0aa8ecc9af3e713ed51b9f3814590547b10d550c380ee3bc0df
 size 498796983
run_w5_long.sh
CHANGED
@@ -3,8 +3,9 @@
 --model_type="roberta" \
 --config_name="./" \
 --tokenizer_name="./" \
---train_file="/mnt/disks/flaxdisk/corpus/
+--train_file="/mnt/disks/flaxdisk/corpus/long_train.json" \
 --validation_file="/mnt/disks/flaxdisk/corpus/validation-shard-0001-of-0001.json" \
+--cache_dir="/mnt/disks/flaxdisk/cache/" \
 --max_seq_length="128" \
 --weight_decay="0.01" \
 --per_device_train_batch_size="128" \
@@ -18,4 +19,5 @@
 --logging_steps="5000" \
 --save_steps="5000" \
 --eval_steps="5000" \
+--preprocessing_num_workers="64" \
 --push_to_hub