#!/usr/bin/env bash
#
# Launch ./smiles/train.py with a fixed set of GPUs and hyperparameters.
#
# Usage: run from the directory that contains `smiles/`; the script path and
# the checkpoint directory below are both relative to the current directory.
#
# NOTE(review): the meaning of each flag is defined by train.py, which is not
# visible here — confirm against its argument parser before changing values.

# Expose only these device indices to CUDA. This must be its own statement:
# when the python command shares the line with `export`, its words are parsed
# as additional names to export and the training script never runs.
export CUDA_VISIBLE_DEVICES=3,4,5,6

# -u keeps Python's stdout/stderr unbuffered so log lines appear immediately.
# Each continuation backslash must be the last character on its line;
# a backslash followed by a space escapes the space instead of joining lines.
python -u ./smiles/train.py \
  --validity_weight 200 \
  --gamma 2.0 \
  --epochs 5 \
  --learning_rate 1e-4 \
  --weight_decay 1e-5 \
  --model_dim 768 \
  --n_heads 8 \
  --n_layers 8 \
  --checkpoint_dir ./smiles/ckpt