File size: 1,575 Bytes
661c54a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
#!/usr/bin/env bash
#
# Evaluate a series of training checkpoints on the in-domain ("in") and
# out-of-domain ("ood") validation sets.
#
# For every checkpoint step and each split this script:
#   1. runs simple_valid.py under torchrun, writing predictions into
#      ${EVAL_DIR}/predictions_<split>/
#   2. runs get_valid_score.py on predictions_checkpoint-<step>.json from that
#      directory, writing ${EVAL_DIR}/valid_score_<split>_<step>.json
#
# simple_valid.py and get_valid_score.py are referenced by relative path, so
# the script must be started from the directory that contains them.
#
# Usage: [EVAL_DIR=...] [CKPT_DIR=...] [NPROC_PER_NODE=...] <script> [step ...]
#   step ...        checkpoint steps to evaluate
#                   (default: 100 200 300 400 500 600 700 748)
#   EVAL_DIR        root of validation data, predictions and scores
#   CKPT_DIR        directory holding the checkpoint-<step> checkpoints
#   NPROC_PER_NODE  number of processes torchrun starts per node
# With no arguments and none of these variables set, the script uses the
# paths and settings that were previously hard-coded.
set -euo pipefail

readonly EVAL_DIR="${EVAL_DIR:-/pfs/lichenyi/work/evaluation}"
readonly CKPT_DIR="${CKPT_DIR:-/pfs/lichenyi/work/train_ddp}"
readonly NPROC_PER_NODE="${NPROC_PER_NODE:-4}"

# Print a message to stderr and abort the script.
die() {
    printf '%s\n' "$*" >&2
    exit 1
}

#######################################
# Generate predictions for one checkpoint on one split, then score them.
# Globals:   EVAL_DIR, NPROC_PER_NODE (read)
# Arguments: $1 - split tag ("in" or "ood"); selects valid_<tag>.json,
#                 predictions_<tag>/ and valid_score_<tag>_<step>.json
#            $2 - checkpoint step, used to build the prediction/score names
#            $3 - checkpoint path handed to simple_valid.py as --model_path
# Returns:   under set -e, a failure of either command aborts the script
#######################################
evaluate_split() {
    local split=$1
    local step=$2
    local model_path=$3
    local pred_dir="${EVAL_DIR}/predictions_${split}"

    torchrun --nproc_per_node "${NPROC_PER_NODE}" simple_valid.py \
        --model_path "${model_path}" \
        --out_path "${pred_dir}" \
        --data_path "${EVAL_DIR}/valid_${split}.json" \
        --dtype bf16 \
        --use_system \
        --temperature 0.0

    # NOTE(review): the prediction file name is presumably derived by
    # simple_valid.py from the checkpoint directory name - confirm there.
    python get_valid_score.py \
        --pred_path "${pred_dir}/predictions_checkpoint-${step}.json" \
        --out_path "${EVAL_DIR}/valid_score_${split}_${step}.json"
}

#######################################
# Evaluate every requested checkpoint on both validation splits.
# Globals:   EVAL_DIR, CKPT_DIR (read)
# Arguments: optional list of checkpoint steps; defaults to the built-in list
#######################################
main() {
    local -a steps=(100 200 300 400 500 600 700 748)
    if (( $# > 0 )); then
        steps=("$@")
    fi

    # Make sure the output directories exist.
    mkdir -p -- "${EVAL_DIR}/predictions_in" "${EVAL_DIR}/predictions_ood"

    local step model_path
    for step in "${steps[@]}"; do
        echo "======= Running checkpoint-${step} ======="

        model_path="${CKPT_DIR}/checkpoint-${step}"
        # Fail before starting torchrun rather than after it has launched.
        [[ -e "${model_path}" ]] || die "checkpoint not found: ${model_path}"

        # Call the helper as a plain statement (not in an `||`/`if` context)
        # so that set -e stays in effect inside it.
        evaluate_split in "${step}" "${model_path}"
        evaluate_split ood "${step}" "${model_path}"
    done
}

main "$@"