#!/usr/bin/env bash
#
# Launches ./run_summarization_flax.py to train, evaluate and run prediction
# for a summarization model, starting from the checkpoint named in MODEL.
#
# Usage: run from the directory that contains run_summarization_flax.py
# (the script path is relative to the current working directory).
#
# The dataset paths below are absolute and machine-specific; edit them to
# point at your own train/validation/test JSON files.

# Abort on the first failing command, on use of an unset variable, and on a
# failure in any pipeline stage, so training never starts after a failed setup.
set -euo pipefail

# Expose only the CUDA device with index 1 to the Python process.
export CUDA_VISIBLE_DEVICES="1"

readonly MODEL="flax-community/t5-base-dutch"
readonly OUTPUT="./output"
readonly TRAIN="/home/yeb/Developer/data/cnnuxsum/cnnuxsum_train.json"
readonly VAL="/home/yeb/Developer/data/cnnuxsum/cnnuxsum_val.json"
readonly TEST="/home/yeb/Developer/data/cnnuxsum/cnnuxsum_test.json"

mkdir -p "${OUTPUT}"

# Arguments are collected in an array so that individual options can be
# commented in or out without breaking backslash line continuations.
args=(
  # Model and optimizer settings.
  --model_name_or_path "${MODEL}"
  --learning_rate "5e-4"
  --warmup_steps 500

  # Phases to run.
  --do_train
  --do_predict
  --do_eval

  # Input data and the JSON fields holding the article and its summary.
  --train_file "${TRAIN}"
  --validation_file "${VAL}"
  --test_file "${TEST}"
  --max_train_samples 1366592
  # NOTE(review): eval/predict sample caps are very small; presumably a
  # debugging configuration (see --prediction_debug below) -- confirm.
  --max_eval_samples 32
  --max_predict_samples 8
  --text_column "complete_text"
  --summary_column "summary_text"
  --max_source_length 1024
  --max_target_length 142

  # Output location, batch sizes and schedule.
  --output_dir "${OUTPUT}"
  --per_device_train_batch_size=8
  --per_device_eval_batch_size=8
  --overwrite_output_dir
  --num_train_epochs="1"
  --logging_steps="100"
  --save_steps="20000"
  --eval_steps="5000"

  # Generation settings used during evaluation/prediction.
  --num_beams 4
  --prediction_debug
  --predict_with_generate

  # Disabled in the original script; uncomment to pass a source prefix.
  # --source_prefix "summarize: "
)

python ./run_summarization_flax.py "${args[@]}"