Qwen_save3 / train /run89.sh
Yaning1001's picture
Add files using upload-large-folder tool
8333a01 verified
#!/bin/bash
# Sequential single-GPU training runs using the train_qwen_72B_* scripts.
# Every torchrun call below runs in the foreground, so each run starts only
# after the previous one has exited. There is no `set -e`, so a failed run
# does not prevent the following ones from starting.
# Each run is pinned to one GPU via CUDA_VISIBLE_DEVICES and gets its own
# --master_port value.

# Run 1: shuffle_control on GPU 0
CUDA_VISIBLE_DEVICES=0 torchrun --nproc_per_node 1 --master_port=22239 train_qwen_72B_shuffle.py --perturbation shuffle_control --train_set 10M --batch_size 1 --epoch 2 --seed 0
# Run 2 (after run 1 has finished): shuffle_nondeterministic on GPU 1
CUDA_VISIBLE_DEVICES=1 torchrun --nproc_per_node 1 --master_port=22229 train_qwen_72B_shuffle.py --perturbation shuffle_nondeterministic --train_set 10M --batch_size 1 --epoch 2 --seed 0
# Run 3 (after run 2 has finished): reverse_control on GPU 2
CUDA_VISIBLE_DEVICES=2 torchrun --nproc_per_node 1 --master_port=22219 train_qwen_72B_reverse.py --perturbation reverse_control --train_set 10M --batch_size 1 --epoch 2 --seed 0
# Run 4 (after run 3 has finished): reverse_partial on GPU 3
CUDA_VISIBLE_DEVICES=3 torchrun --nproc_per_node 1 --master_port=22139 train_qwen_72B_reverse.py --perturbation reverse_partial --train_set 10M --batch_size 1 --epoch 2 --seed 0
# Run 5 (after run 4 has finished): hop_control on GPU 4
# (flag was previously misspelled as --nproc_perd_node, which torchrun does not define)
CUDA_VISIBLE_DEVICES=4 torchrun --nproc_per_node 1 --master_port=22339 train_qwen_72B_hop.py --perturbation hop_control --train_set 10M --batch_size 1 --epoch 2 --seed 0
# Run 6 (after run 5 has finished): hop_words4 on GPU 5
CUDA_VISIBLE_DEVICES=5 torchrun --nproc_per_node 1 --master_port=22439 train_qwen_72B_hop.py --perturbation hop_words4 --train_set 10M --batch_size 1 --epoch 2 --seed 0
# Background 4-process training runs using the train_qwen_14B_* scripts.
# Each job is wrapped in `nohup bash -c "..." ... &`, so the script does not
# wait for it; the job's stdout and stderr are written to a file under nohup/.
# NOTE(review): all five jobs are started immediately, and several of them
# list the same CUDA_VISIBLE_DEVICES (0,1,2,3 three times, 4,5,6,7 twice).
# Confirm they are really meant to run at the same time rather than being
# launched one at a time by hand.

# The output redirections below fail (and the job is not started) if the log
# directory does not exist yet.
mkdir -p nohup

# reverse
nohup bash -c "CUDA_VISIBLE_DEVICES=0,1,2,3 /home/czhang/anaconda3/envs/impossible_llm/bin/torchrun --nproc_per_node=4 --master_port=24235 ./train_qwen_14B_reverse.py --perturbation reverse_partial --train_set 10M --batch_size 2 --epoch 2 --seed 0" > nohup/Qwen_14B_reverse.txt 2>&1 &
# shuffle
nohup bash -c "CUDA_VISIBLE_DEVICES=4,5,6,7 /home/czhang/anaconda3/envs/impossible_llm/bin/torchrun --nproc_per_node=4 --master_port=24239 ./train_qwen_14B_shuffle.py --perturbation shuffle_control --train_set 10M --batch_size 2 --epoch 2 --seed 0" > nohup/Qwen_14B_shuffle_control.txt 2>&1 &
nohup bash -c "CUDA_VISIBLE_DEVICES=0,1,2,3 /home/czhang/anaconda3/envs/impossible_llm/bin/torchrun --nproc_per_node=4 --master_port=24237 ./train_qwen_14B_shuffle.py --perturbation shuffle_nondeterministic --train_set 10M --batch_size 2 --epoch 2 --seed 0" > nohup/shuffle_nondeterministic.txt 2>&1 &
# Uses port 24236 instead of 24237: the shuffle_nondeterministic job above is
# started concurrently on 24237, and two jobs cannot share a master port.
nohup bash -c "CUDA_VISIBLE_DEVICES=0,1,2,3 /home/czhang/anaconda3/envs/impossible_llm/bin/torchrun --nproc_per_node=4 --master_port=24236 ./train_qwen_14B_shuffle.py --perturbation shuffle_even_odd --train_set 10M --batch_size 2 --epoch 2 --seed 0" > nohup/shuffle_even_odd.txt 2>&1 &
# hop
nohup bash -c "CUDA_VISIBLE_DEVICES=4,5,6,7 /home/czhang/anaconda3/envs/impossible_llm/bin/torchrun --nproc_per_node=4 --master_port=24238 ./train_qwen_14B_hop.py --perturbation hop_words4 --train_set 10M --batch_size 2 --epoch 2 --seed 0" > nohup/hop_words4.txt 2>&1 &
# Start repo_upload2.py in the background under nohup, sending its stdout and
# stderr to a log file in the current directory.
# NOTE(review): presumably uploads results to a remote repo (judging by the
# script name only) — confirm it is safe to start before training finishes.
upload_log=impossible_llm.txt
nohup python repo_upload2.py >"$upload_log" 2>&1 &