pere committed on
Commit
3103067
·
1 Parent(s): 96275ea

Saving weights and logs of step 5000

Browse files
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": ".",
3
  "architectures": [
4
  "RobertaForMaskedLM"
5
  ],
 
1
  {
2
+ "_name_or_path": "./",
3
  "architectures": [
4
  "RobertaForMaskedLM"
5
  ],
events.out.tfevents.1639431874.t1v-n-ccbf3e94-w-0.1053519.3.v2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68887780af1577a229cee0ce20bb9da8be2c8465ca4f2b6508402c6256754f4a
3
+ size 735136
flax_model.msgpack CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a993bcaf3ce549644ccbe6e0640cf03169148e4fbf4700be812d6e5a0b11164
3
  size 498796983
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ff2cd2aa2ccf0aa8ecc9af3e713ed51b9f3814590547b10d550c380ee3bc0df
3
  size 498796983
run_w5_long.sh CHANGED
@@ -3,8 +3,9 @@
3
  --model_type="roberta" \
4
  --config_name="./" \
5
  --tokenizer_name="./" \
6
- --train_file="/mnt/disks/flaxdisk/corpus/train-shard-0001-of-0001.json" \
7
  --validation_file="/mnt/disks/flaxdisk/corpus/validation-shard-0001-of-0001.json" \
 
8
  --max_seq_length="128" \
9
  --weight_decay="0.01" \
10
  --per_device_train_batch_size="128" \
@@ -18,4 +19,5 @@
18
  --logging_steps="5000" \
19
  --save_steps="5000" \
20
  --eval_steps="5000" \
 
21
  --push_to_hub
 
3
  --model_type="roberta" \
4
  --config_name="./" \
5
  --tokenizer_name="./" \
6
+ --train_file="/mnt/disks/flaxdisk/corpus/long_train.json" \
7
  --validation_file="/mnt/disks/flaxdisk/corpus/validation-shard-0001-of-0001.json" \
8
+ --cache_dir="/mnt/disks/flaxdisk/cache/" \
9
  --max_seq_length="128" \
10
  --weight_decay="0.01" \
11
  --per_device_train_batch_size="128" \
 
19
  --logging_steps="5000" \
20
  --save_steps="5000" \
21
  --eval_steps="5000" \
22
+ --preprocessing_num_workers="64" \
23
  --push_to_hub