#!/usr/bin/env bash
#
# Copyright 2025 PKU-Alignment Team. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
#
# Launches the `align_anything.trainers.janus.sft_gen` module with DeepSpeed.
#
# Usage: run this script from its own directory. The shared setup script is
# located through the working-directory-relative path `../setup.sh`.
#
# Edit the variables below to match your machine before running.

# Initialize variables

# GPUs made visible to the training processes.
export CUDA_VISIBLE_DEVICES=0,1,2

MODEL_NAME_OR_PATH="/data5/czh/pretrain_models/Janus-Pro-1B"
TRAIN_DATASETS="/home/czh/bxh/align-anything/projects/janus/example/supervised/text_to_image"
TRAIN_DATA_FILE="Reasoning_Spatial_2.pt"
#EVAL_DATASETS="/home/czh/bxh/align-anything/projects/janus/example/supervised/text_to_image"
#EVAL_DATA_FILE="train_unify.pt"
OUTPUT_DIR="/data5/czh/bxh/test_2"
JANUS_REPO_PATH="/home/czh/bxh/Align_Anything_Janus" # change to your own path to Align_Anything_Janus

# Append the Janus repo to PYTHONPATH. The `${VAR:+...}` form avoids a leading
# ':' when PYTHONPATH is unset or empty; an empty PYTHONPATH entry would
# otherwise be interpreted by Python as the current directory.
export PYTHONPATH="${PYTHONPATH:+${PYTHONPATH}:}${JANUS_REPO_PATH}"

# Weights & Biases logging is kept offline for this run.
# Credentials are intentionally NOT stored in this file: if you later sync the
# run, export WANDB_API_KEY in your own shell environment instead.
export WANDB_MODE=offline

# Source the setup script
# Fail fast when it is missing instead of silently launching training without
# the shared setup (typically caused by running from the wrong directory).
if [[ ! -r ../setup.sh ]]; then
  echo "error: ../setup.sh not found or not readable;" \
    "run this script from its own directory" >&2
  exit 1
fi
# shellcheck source=/dev/null
source ../setup.sh

# Execute deepspeed command
# All expansions are quoted so paths containing spaces or glob characters are
# passed through as single arguments.
deepspeed \
  --master_port 29000 \
  --module align_anything.trainers.janus.sft_gen \
  --model_name_or_path "${MODEL_NAME_OR_PATH}" \
  --train_datasets "${TRAIN_DATASETS}" \
  --train_data_files "${TRAIN_DATA_FILE}" \
  --train_split train \
  --learning_rate 5e-6 \
  --epochs 3 \
  --lr_scheduler_type cosine \
  --output_dir "${OUTPUT_DIR}"