NbAiLab
/

roberta_des_ada_128

Model card Files Files and versions

Metrics Training metrics Community

pere committed on Dec 31, 2021

Commit

682b4fd

·

1 Parent(s): 7f2a9ca

update

Files changed (1) hide show

run_step1.sh +7 -6

run_step1.sh CHANGED Viewed

@@ -3,16 +3,17 @@
     --model_type="roberta" \
     --config_name="./" \
     --tokenizer_name="./" \
-    --dataset_name="NbAiLab/nbailab_extended" \
     --cache_dir="/mnt/disks/flaxdisk/cache/" \
     --max_seq_length="128" \
     --weight_decay="0.01" \
-    --per_device_train_batch_size="256" \
-    --per_device_eval_batch_size="256" \
-    --learning_rate="6e-4" \
     --warmup_steps="10000" \
     --overwrite_output_dir \
-    --num_train_epochs="1000" \
     --adam_beta1="0.9" \
     --adam_beta2="0.98" \
     --logging_steps="10000" \
@@ -21,6 +22,6 @@
     --preprocessing_num_workers="64" \
     --auth_token="True" \
     --static_learning_rate="True" \
-    --dtype="bloat16" \
     --adafactor \
     --push_to_hub

     --model_type="roberta" \
     --config_name="./" \
     --tokenizer_name="./" \
+    --train_file /mnt/disks/flaxdisk/corpus/train_1_4.json \
+    --validation_file /mnt/disks/flaxdisk/corpus/validation.json \
     --cache_dir="/mnt/disks/flaxdisk/cache/" \
     --max_seq_length="128" \
     --weight_decay="0.01" \
+    --per_device_train_batch_size="200" \
+    --per_device_eval_batch_size="200" \
+    --learning_rate="4e-4" \
     --warmup_steps="10000" \
     --overwrite_output_dir \
+    --num_train_epochs="2" \
     --adam_beta1="0.9" \
     --adam_beta2="0.98" \
     --logging_steps="10000" \
     --preprocessing_num_workers="64" \
     --auth_token="True" \
     --static_learning_rate="True" \
+    --dtype="bfloat16" \
     --adafactor \
     --push_to_hub