File size: 1,312 Bytes
a80200a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38

# ---------------------------------------------------------------------------
# Evaluation settings
# (section originally labelled "Qwen2.5-Math-Instruct Series",
#  e.g. Qwen2.5-Math-1.5B-Instruct)
# ---------------------------------------------------------------------------

# Prompt template for the run. Alternative seen in this script:
#   "qwen25-math-cot"
PROMPT_TYPE="deepseek3"

# Benchmark to evaluate. Alternatives seen in this script:
#   "amc23", "aime24", "math500"
DATA_NAME="olympiadbench"

# ---------------------------------------------------------------------------
# Environment exported to every child process
# ---------------------------------------------------------------------------
# CUDA_VISIBLE_DEVICES : GPUs visible to the run. Other layouts used before:
#                        "4,5", "6,7", "0,1,2,3", "0,1,2,3,4,5,6,7".
# remaining            : read by downstream code; "default" here
#                        (NOTE(review): exact meaning not visible in this file).
# CUDA_CACHE_DISABLE   : set to 1 for the whole run.
export CUDA_VISIBLE_DEVICES="4,5,6,7" \
  remaining=default \
  CUDA_CACHE_DISABLE=1

# Hand both position files to delete_file.sh before launching
# (presumably clears leftovers from an earlier run; confirm in delete_file.sh).
for position_file in ./start_positions.pt ./early_positions.pt; do
  bash delete_file.sh "$position_file"
done

# Directory holding the model checkpoint to evaluate.
# The value must not carry leading/trailing whitespace: it is quoted at every
# use below, so any stray space would become part of the path.
MODEL_NAME_OR_PATH='/mnt/lyc/wuxinrui/DS_Huggingface/Laser-D-L4096-7B/models'
# MODEL_NAME_OR_PATH='/mnt/lyc/wuxinrui/DS_Huggingface/Laser-L8192-1_5B/models/'

# The checkpoint path has the form <...>/<model-name>/models, so the model
# name is the last component of the checkpoint's parent directory.
PARENT_DIR=$(dirname -- "$MODEL_NAME_OR_PATH")  # parent directory of the checkpoint
MODEL_NAME=$(basename -- "$PARENT_DIR")         # last component of that parent
printf 'MODEL_NAME: %s\n' "$MODEL_NAME"

# Run tags exported for the child evaluation process.
# NOTE(review): how each tag is consumed is not visible in this file.
export PE_MODE=default
export position=ori
export tip=Laser
export stage=2
export mode="TIP-${tip}-STAGE-${stage}"
export model="MODEL-${MODEL_NAME}"
# DATA_NAME is set earlier in this script; it completes the run identifier.
export modelname="MODEL-${MODEL_NAME}-TIP-${tip}-STAGE-${stage}-DATA-${DATA_NAME}"

# Launch the evaluation. Arguments are quoted so each one reaches the child
# script as exactly one word, even if a path contains spaces or glob chars.
bash ./sh/remaining.sh "$PROMPT_TYPE" "$MODEL_NAME_OR_PATH" "$DATA_NAME"
# bash ./sh/remaining_sample_n.sh "$PROMPT_TYPE" "$MODEL_NAME_OR_PATH" "$DATA_NAME"
# bash ./sh/remaining_sample_64.sh "$PROMPT_TYPE" "$MODEL_NAME_OR_PATH" "$DATA_NAME"