xuan-luo committed on
Commit
01633c1
·
verified ·
1 Parent(s): 36e3d1b

Create evals.sh

Browse files
Files changed (1) hide show
  1. evals.sh +6 -0
evals.sh ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ accelerate launch --main_process_port 29501 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks mmlu --num_fewshot 5 --apply_chat_template --fewshot_as_multiturn --batch_size 1 > 1-mmlu.out 2>&1
2
+ accelerate launch --main_process_port 29501 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks hellaswag --num_fewshot 5 --apply_chat_template --fewshot_as_multiturn --batch_size 1 > 2-hellaswag.out 2>&1
3
+ accelerate launch --main_process_port 29501 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks commonsense_qa --num_fewshot 5 --apply_chat_template --fewshot_as_multiturn --batch_size 1 > 3-commonsenseqa.out 2>&1
4
+ accelerate launch --main_process_port 29501 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks gsm8k --num_fewshot 5 --apply_chat_template --fewshot_as_multiturn --batch_size 1 > 4-gsm8k.out 2>&1
5
+ accelerate launch --main_process_port 29501 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks mbpp --batch_size 1 --apply_chat_template --fewshot_as_multiturn --confirm_run_unsafe_code > 5-mbpp.out 2>&1
6
+ accelerate launch --main_process_port 29501 -m lm_eval --model hf --model_args pretrained=../,trust_remote_code=True --tasks longbench_multi_news --apply_chat_template --batch_size 1 > 6-multinews.out 2>&1