clone / evaluation /valid.sh
chenyili818's picture
Add files using upload-large-folder tool
661c54a verified
#!/usr/bin/env bash
set -euo pipefail
# Make sure both prediction output directories exist before any run starts.
# One mkdir per directory, so a failure on the first aborts the script
# (set -e) before the second is attempted.
for out_dir in \
  /pfs/lichenyi/work/evaluation/predictions_in \
  /pfs/lichenyi/work/evaluation/predictions_ood; do
  mkdir -p "${out_dir}"
done
# For each listed checkpoint, run generation and then scoring on the
# in-domain validation set, followed by the same two steps on the OOD set.
# Any failing command aborts the whole sweep when `set -e` is in effect.
eval_dir="/pfs/lichenyi/work/evaluation"
# Generation flags shared by every simple_valid.py invocation.
gen_flags=(--dtype bf16 --use_system --temperature 0.0)

for step in 100 200 300 400 500 600 700 748; do
  echo "======= Running checkpoint-$step ======="
  ckpt_dir="/pfs/lichenyi/work/train_ddp/checkpoint-${step}"
  # Prediction file name read by the scoring step; presumably written by
  # simple_valid.py into its --out_path directory (verify against that script).
  pred_file="predictions_checkpoint-${step}.json"

  # ---- 1) in-domain validation ----
  torchrun --nproc_per_node 4 simple_valid.py \
    --model_path "${ckpt_dir}" \
    --out_path "${eval_dir}/predictions_in" \
    --data_path "${eval_dir}/valid_in.json" \
    "${gen_flags[@]}"
  python get_valid_score.py \
    --pred_path "${eval_dir}/predictions_in/${pred_file}" \
    --out_path "${eval_dir}/valid_score_in_${step}.json"

  # ---- 2) OOD validation ----
  torchrun --nproc_per_node 4 simple_valid.py \
    --model_path "${ckpt_dir}" \
    --data_path "${eval_dir}/valid_ood.json" \
    --out_path "${eval_dir}/predictions_ood" \
    "${gen_flags[@]}"
  python get_valid_score.py \
    --pred_path "${eval_dir}/predictions_ood/${pred_file}" \
    --out_path "${eval_dir}/valid_score_ood_${step}.json"
done