MRaCL / RIS-DMMI /train_ace_rcconly.sh
dianecy's picture
Upload folder using huggingface_hub
1120a2f verified
#!/bin/bash
#SBATCH --job-name=dmmi-rcc50
#SBATCH --partition=a6000
#SBATCH --nodelist=node07
#SBATCH --gres=gpu:2
#SBATCH --time=12-00:00:00 # d-hh:mm:ss, job time limit
#SBATCH --mem=40000 # cpu memory size
#SBATCH --cpus-per-task=6
#SBATCH --output=./trainlog_filter/refcoco/ACE_rcc_m10_tmp007_proj_thr070_bs24.log
ml purge
ml load cuda/11.8
eval "$(conda shell.bash hook)"
conda activate risall
cd /data2/projects/chaeyun/RIS-DMMI
export NCCL_P2P_DISABLE=1
export NVIDIA_TF32_OVERRIDE=0
GPUS=2
OUTPUT_DIR=$1
EXP_NAME=$2
MARGIN=$3
TEMP=$4
MODE=$5
MASTER_PORT=1927
FILTER_THRES=0.7
# TRAIN
# hardpos_only, hardpos_only_rev
python_args="--model dmmi_swin_hardpos_only \
--dataset refcoco \
--splitBy unc \
--output_dir ${OUTPUT_DIR} \
--model_id ${EXP_NAME} \
--batch-size 12 \
--lr 0.00005 \
--wd 1e-2 \
--window12 \
--swin_type base \
--pretrained_backbone /data2/projects/chaeyun/LAVT-RIS/pretrained_weights/swin_base_patch4_window12_384_22k.pth \
--epochs 40 \
--img_size 480 \
--metric_learning \
--margin_value ${MARGIN} \
--filter_thres ${FILTER_THRES} \
--temperature ${TEMP} \
--metric_mode ${MODE} \
--exclude_multiobj "
CUDA_VISIBLE_DEVICES=0,1 torchrun --nproc_per_node=$GPUS --master_port=$MASTER_PORT train_rev_refcocop.py $python_args
# sbatch train_ace_rcconly.sh ./experiments/dmmi_rcc_ace_filtered/ACE_rcc_m10_tmp007_thr050_bs24 ACE_rcc_m10_tmp007_thr050_bs24 10 0.07 hardpos_only_refined