# Launch a training run of main.py on the MATH dataset with the
# openPangu-Embedded-7B model.
#
# Environment (set for this one command only):
#   VLLM_USE_V1=1               - passed through to the process; presumably
#                                 selects the vLLM V1 engine (confirm against
#                                 the vLLM version in use).
#   ASCEND_RT_VISIBLE_DEVICES=0 - passed through to the process; presumably
#                                 restricts the run to Ascend NPU 0 (confirm).
#
# Each continuation backslash must be the LAST character on its line: a
# backslash followed by a space is an escaped space, which would glue a
# leading blank onto the next option (e.g. " --device") and break parsing.
VLLM_USE_V1=1 ASCEND_RT_VISIBLE_DEVICES=0 python main.py \
  --mode train \
  --device npu \
  --model_name "FreedomIntelligence/openPangu-Embedded-7B" \
  --train_data processed_data/MATH/train.jsonl \
  --val_data processed_data/MATH/val.jsonl \
  --num_epochs 5 \
  --batch_size 16 \
  --num_samples 4 \
  --token_budget 4096 \
  --checkpoint_dir checkpoints/MATH/pangu \
  --task_type math