| #SBATCH --job-name=dmmi-rcc50 | |
| #SBATCH --partition=a6000 | |
| #SBATCH --nodelist=node07 | |
| #SBATCH --gres=gpu:2 | |
| #SBATCH --time=12-00:00:00 # d-hh:mm:ss, job time limit | |
| #SBATCH --mem=40000 # cpu memory size | |
| #SBATCH --cpus-per-task=6 | |
| #SBATCH --output=./trainlog_filter/refcoco/ACE_rcc_m10_tmp007_proj_thr070_bs24.log | |
| ml purge | |
| ml load cuda/11.8 | |
| eval "$(conda shell.bash hook)" | |
| conda activate risall | |
| cd /data2/projects/chaeyun/RIS-DMMI | |
| export NCCL_P2P_DISABLE=1 | |
| export NVIDIA_TF32_OVERRIDE=0 | |
| GPUS=2 | |
| OUTPUT_DIR=$1 | |
| EXP_NAME=$2 | |
| MARGIN=$3 | |
| TEMP=$4 | |
| MODE=$5 | |
| MASTER_PORT=1927 | |
| FILTER_THRES=0.7 | |
| # TRAIN | |
| # hardpos_only, hardpos_only_rev | |
| python_args="--model dmmi_swin_hardpos_only \ | |
| --dataset refcoco \ | |
| --splitBy unc \ | |
| --output_dir ${OUTPUT_DIR} \ | |
| --model_id ${EXP_NAME} \ | |
| --batch-size 12 \ | |
| --lr 0.00005 \ | |
| --wd 1e-2 \ | |
| --window12 \ | |
| --swin_type base \ | |
| --pretrained_backbone /data2/projects/chaeyun/LAVT-RIS/pretrained_weights/swin_base_patch4_window12_384_22k.pth \ | |
| --epochs 40 \ | |
| --img_size 480 \ | |
| --metric_learning \ | |
| --margin_value ${MARGIN} \ | |
| --filter_thres ${FILTER_THRES} \ | |
| --temperature ${TEMP} \ | |
| --metric_mode ${MODE} \ | |
| --exclude_multiobj " | |
| CUDA_VISIBLE_DEVICES=0,1 torchrun --nproc_per_node=$GPUS --master_port=$MASTER_PORT train_rev_refcocop.py $python_args | |
| # sbatch train_ace_rcconly.sh ./experiments/dmmi_rcc_ace_filtered/ACE_rcc_m10_tmp007_thr050_bs24 ACE_rcc_m10_tmp007_thr050_bs24 10 0.07 hardpos_only_refined | |