HRA / nlu /experiments /glue /cola.sh
nvan13's picture
Add files using upload-large-folder tool
ab0f6ec verified
#!/bin/bash
# Settings for the CoLA run; the training command later in this script reads
# task, base_model and cache_dir.
task=CoLA
base_model=deberta-v3-base
cache_dir=/tmp/DeBERTa/

# Place the CUDA MPS pipe and log directories under the current user's home,
# then export both so child processes inherit them.
CUDA_MPS_PIPE_DIRECTORY="${HOME}/mps_pipe"
CUDA_MPS_LOG_DIRECTORY="${HOME}/mps_log"
export CUDA_MPS_PIPE_DIRECTORY CUDA_MPS_LOG_DIRECTORY

# Optional: print the pipe location so it can be verified in the job output.
printf 'MPS Pipe at: %s\n' "$CUDA_MPS_PIPE_DIRECTORY"
# Run DeBERTa.apps.run with training, evaluation and prediction enabled for
# $task, reading data from under $cache_dir/glue_tasks and writing results
# under $cache_dir/outputs.
# Every expansion is double-quoted so that a model name or path containing
# whitespace or glob characters still reaches the program as one argument.
# NOTE(review): the last option line ends with a continuation backslash, so
# any text placed directly after it becomes part of this command.
python -m DeBERTa.apps.run --model_config config.json \
  --tag "$base_model" \
  --do_train \
  --do_eval \
  --do_predict \
  --max_seq_len 64 \
  --dump_interval 100 \
  --num_train_epochs 34 \
  --fp16 True \
  --warmup 100 \
  --learning_rate 9e-3 \
  --train_batch_size 32 \
  --cls_drop_out 0.1 \
  --task_name "$task" \
  --data_dir "$cache_dir/glue_tasks/$task" \
  --init_model "$base_model" \
  --output_dir "$cache_dir/outputs/$base_model/$task" \
  --eval_batch_size 256 \
  --predict_batch_size 256 \