#!/usr/bin/env bash
#
# Runs the three training stages one after another:
#   1. contrastive learning pre-training
#   2. supervised fine-tuning
#   3. GRPO training
#
# Each command must sit on its own line: a '#' starts a comment that runs to
# the end of the line, so a command sharing a line with a stage header is
# never executed.

# Abort on the first failing stage (and on unset variables / failed pipeline
# stages) so a later stage is not started after an earlier one has failed.
set -euo pipefail

# 1. Contrastive learning pre-training
python train_contrastive.py --use_wandb --freeze_protein_model --freeze_text_model

# 2. Supervised fine-tuning
python train_protein_qwen.py --model_type protein-llm --text_model_finetune True

# 3. GRPO training
# NOTE(review): presumably ./checkpoints/best_model is produced by stage 2 —
# confirm against train_protein_qwen.py's output path.
python protein_reason.py --sft_checkpoint ./checkpoints/best_model