#!/usr/bin/env bash
#
# Runs main.py six times against one model checkpoint, once per
# (task, temperature, run name) combination listed at the bottom of this
# file. Each run gets its own --save_generations_path under OUTPUT_ROOT.
#
# Usage: invoke from the directory that contains main.py (the script is
# referenced by relative path).
#
# The runs execute sequentially and independently: a failing run does not
# stop the later ones from starting, and the script's exit status is that of
# the last run.

readonly MODEL_DIR='/home/aiscuser/fhw/model_weights/warriordeep448/'
readonly OUTPUT_ROOT='model_generations_raw'

#######################################
# Launch a single main.py run.
# Globals:   MODEL_DIR (read), OUTPUT_ROOT (read)
# Arguments: $1   - value passed to --tasks (e.g. output_prediction)
#            $2   - value passed to --temperature
#            $3   - run name, used as the prefix of the output directory
#            $4.. - optional extra flags (e.g. --cot); they are placed right
#                   after --save_generations_path, before --shuffle
# Outputs:   passes --save_generations_path
#            <OUTPUT_ROOT>/<run name>_temp<temperature>_<task without
#            "_prediction">/shard_0.json to main.py
# Returns:   exit status of the python process
#######################################
run_eval() {
  local task=$1
  local temperature=$2
  local run_name=$3
  shift 3

  # The directory suffix is the task name minus its "_prediction" ending,
  # e.g. output_prediction -> output.
  local out_dir="${OUTPUT_ROOT}/${run_name}_temp${temperature}_${task%_prediction}"

  python main.py \
    --model "${MODEL_DIR}" \
    --trust_remote_code \
    --tasks "${task}" \
    --batch_size 20 \
    --n_samples 10 \
    --max_length_generation 4096 \
    --precision fp16 \
    --temperature "${temperature}" \
    --save_generations \
    --save_generations_path "${out_dir}/shard_0.json" \
    "$@" \
    --shuffle \
    --tensor_parallel_size 8
}

# output_prediction without --cot
run_eval output_prediction 0.8 warriordeep448
run_eval output_prediction 0.2 warriordeep448

# output_prediction with --cot
run_eval output_prediction 0.8 warriordeep448+cot --cot
run_eval output_prediction 0.2 warriordeep448+cot --cot

# input_prediction with --cot
# NOTE(review): there is no input_prediction run without --cot — confirm
# that this is intentional.
run_eval input_prediction 0.8 warriordeep448+cot --cot
run_eval input_prediction 0.2 warriordeep448+cot --cot