# Launch run_translation_t5_flax.py with a fixed set of command-line flags.
#
# Values passed:
#   - model and tokenizer: NbAiLab/nb-t5-base
#   - data files:          nb_nn_nb.json (train),
#                          parallel_src_tgt_dev.json (validation),
#                          parallel_src_tgt_test.json (test)
#   - output directory:    "." (the current working directory)
#
# NOTE(review): the exact meaning of each flag is defined by
# run_translation_t5_flax.py, which is not shown here -- confirm against it.
#
# The whole invocation is ONE shell command. Every line except the last must
# end with a bare backslash immediately followed by the newline; any character
# after the backslash (even a space) breaks the continuation.
python run_translation_t5_flax.py \
  --output_dir "." \
  --model_name_or_path NbAiLab/nb-t5-base \
  --tokenizer_name NbAiLab/nb-t5-base \
  --train_file nb_nn_nb.json \
  --validation_file parallel_src_tgt_dev.json \
  --test_file parallel_src_tgt_test.json \
  --do_train --do_eval --do_predict \
  --predict_with_generate \
  --num_train_epochs 10 \
  --learning_rate 7e-4 \
  --warmup_steps 3000 \
  --per_device_train_batch_size 8 \
  --per_device_eval_batch_size 8 \
  --overwrite_output_dir \
  --max_source_length 512 \
  --max_target_length 512 \
  --adafactor