#!/usr/bin/env bash
#
# Fine-tune, evaluate and predict with DeBERTa on the GLUE CoLA task by
# launching the DeBERTa.apps.run module with a fixed set of arguments.
#
# Inputs read by this script:
#   HOME         - used to build the CUDA MPS pipe/log directory paths.
#   config.json  - passed as a relative path via --model_config.
#
# NOTE: this script only exports the CUDA MPS directory variables; it does not
# create those directories or start an MPS control daemon.

set -euo pipefail

# No trailing slash here: the paths below add their own separator, which
# avoids producing "/tmp/DeBERTa//glue_tasks/...".
cache_dir=/tmp/DeBERTa
base_model=deberta-v3-base
task=CoLA

# Directories used by CUDA MPS for its pipes and logs.
export CUDA_MPS_PIPE_DIRECTORY="${HOME}/mps_pipe"
export CUDA_MPS_LOG_DIRECTORY="${HOME}/mps_log"

# Optional: print to verify.
printf 'MPS Pipe at: %s\n' "$CUDA_MPS_PIPE_DIRECTORY"

# Arguments are collected in an array so every value stays a single word and
# no fragile backslash line continuations are needed.
run_args=(
  --model_config config.json
  --tag "$base_model"

  # Phases to run.
  --do_train
  --do_eval
  --do_predict

  # Training settings.
  --max_seq_len 64
  --dump_interval 100
  --num_train_epochs 34
  --fp16 True
  --warmup 100
  # NOTE(review): 9e-3 looks very high for fine-tuning a pretrained model;
  # confirm this value is intentional.
  --learning_rate 9e-3
  --train_batch_size 32
  --cls_drop_out 0.1

  # Task, data and output locations.
  --task_name "$task"
  --data_dir "${cache_dir}/glue_tasks/${task}"
  --init_model "$base_model"
  --output_dir "${cache_dir}/outputs/${base_model}/${task}"

  # Evaluation / prediction batch sizes.
  --eval_batch_size 256
  --predict_batch_size 256
)

python -m DeBERTa.apps.run "${run_args[@]}"