Fahad-S committed on
Commit
c0042e5
·
verified ·
1 Parent(s): cb413e3

Upload /mix_all_train_unimvuv5_7B_alpha05_berzelius_job.sh with huggingface_hub

Browse files
mix_all_train_unimvuv5_7B_alpha05_berzelius_job.sh ADDED
@@ -0,0 +1,122 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
#!/bin/bash
#
# Slurm batch job: launches train_vlmm_alpha.py through the DeepSpeed launcher
# with LoRA enabled (model_type unimvuv5_stage2, base model
# lmms-lab/llava-onevision-qwen2-7b-ov) on a mix of video / audio-visual / 3D
# QA datasets with --mix_sampling_alpha 0.5, on one node with 8 A100-80GB GPUs.
#
# Usage: submit with sbatch from the directory that contains
# train_vlmm_alpha.py and scripts/zero2_flops_uni.json (both are referenced by
# relative path, and "./" is prepended to PYTHONPATH).
#
# NOTE(review): the log files below live under logs/ relative to the submit
# directory; that directory presumably has to exist before submission, since
# the scheduler opens the log before this script runs -- confirm.
#
#SBATCH --job-name=UniMVU
#SBATCH --nodes=1
#SBATCH --ntasks-per-node=1
#SBATCH --time=0-72:00:00
#SBATCH --output=logs/slurmm1.0-%j.out
#SBATCH --error=logs/slurmm1.0-%j.out
#SBATCH --account=berzelius-2025-198
#SBATCH --gres=gpu:A100-SXM4-80GB:8

module load buildenv-nvhpc/24.5-cuda12.4
# Quoted so a conda base path containing whitespace cannot be word-split.
# NOTE(review): conda.sh is sourced but no environment is activated here;
# confirm the intended Python environment is already active at submit time.
source "$(conda info --base)/etc/profile.d/conda.sh"
export PYTHONPATH="./:$PYTHONPATH"

# Shared path prefixes (lower-case, not exported: used only to build the
# arguments below).
readonly user_root=/proj/cvl/users/x_fahkh2
readonly cache_dir="${user_root}/caches"
readonly unimvu_root="${user_root}/UniMVU"
readonly data_dir="${unimvu_root}/UniMVUDatasets"
readonly llava_dir="${data_dir}/LLaVA_Video_178K"
readonly scannet_dir="${data_dir}/scannet"

# Point every cache / temp location at the same project-storage directory.
export HF_HOME="${cache_dir}"
export TORCH_HOME="${cache_dir}"
export PIP_CACHE_DIR="${cache_dir}"
export TMPDIR="${cache_dir}"
export TRITON_CACHE_DIR="${cache_dir}"

# NOTE(review): CUDA_HOME points at an NVHPC 23.3 tree while the modules loaded
# in this script are nvhpc/24.5-cuda12.4 and gcccuda/12.1.1 -- confirm this is
# the toolkit DeepSpeed is expected to build against.
export CUDA_HOME=/software/sse/manual/NVHPC/23.3-bdist/Linux_x86_64/23.3/compilers
module avail CUDA # diagnostic only: lists the available CUDA modules in the job log
module load buildenv-gcccuda/12.1.1-gcc12.3.0

# The five per-dataset path lists (--annotation_path, --fast_path_mapping_path,
# --slow_path_mapping_path, --data_root, --slow_path_data_root) each carry nine
# entries in the same order: four LLaVA-Video splits, avqa, music_avqa, avsd,
# scanqa, sqa3d. Presumably 'llava_video*4' in --datasets stands for the four
# LLaVA-Video splits -- verify against the dataset-argument parser.
#
# 'llava_video*4' is quoted so the shell passes it literally instead of
# attempting filename expansion against the submit directory.
#
# This must remain the last command so the job's exit status is the training
# run's exit status.
NCCL_P2P_DISABLE=1 \
deepspeed train_vlmm_alpha.py \
  --deepspeed ./scripts/zero2_flops_uni.json \
  --lora_enable True \
  --lora_alpha 128 \
  --data_class VideoFeatMixedDataArguments \
  --datasets 'llava_video*4' avqa music_avqa avsd scanqa sqa3d \
  --dataset_video_backbone_map avqa:tv \
  --annotation_path \
  "${llava_dir}/1_2_m_academic_oe_v0_1_qa_processed_2pv.json" \
  "${llava_dir}/1_2_m_youtube_oe_v0_1_qa_processed_2pv.json" \
  "${llava_dir}/2_3_m_academic_oe_v0_1_qa_processed_2pv.json" \
  "${llava_dir}/2_3_m_youtube_oe_v0_1_qa_processed_2pv.json" \
  "${data_dir}/avqa/train_qa_instruct.json" \
  "${data_dir}/music_avqa/music_avqa_train_instruct_duplicate_audio.json" \
  "${data_dir}/avsd/avsd_train_instruct.json" \
  "${scannet_dir}/scanqa_train_instruct.json" \
  "${scannet_dir}/sqa3q_ScanQA_format/SQA_train_instruct.json" \
  --fast_path_mapping_path \
  "${llava_dir}/1_2_m_academic_v0_1_feat_mapping.json" \
  "${llava_dir}/1_2_m_youtube_v0_1_feat_mapping.json" \
  "${llava_dir}/2_3_m_academic_v0_1_feat_mapping.json" \
  "${llava_dir}/2_3_m_youtube_v0_1_feat_mapping.json" \
  "${data_dir}/avqa/from_vid_to_feat_name.json" \
  "${data_dir}/music_avqa/music_avqa_all_imagebind_feature_mapping.json" \
  "${data_dir}/avsd/avsd_all_feats_mapping.json" \
  "${scannet_dir}/scannet_from_scan_id_to_video_feature.json" \
  "${scannet_dir}/scannet_from_scan_id_to_video_feature.json" \
  --slow_path_mapping_path \
  "${llava_dir}/1_2_m_academic_v0_1_videos_mapping_updated.json" \
  "${llava_dir}/1_2_m_youtube_v0_1_videos_mapping_updated.json" \
  "${llava_dir}/2_3_m_academic_v0_1_videos_mapping_updated.json" \
  "${llava_dir}/2_3_m_youtube_v0_1_videos_mapping_updated.json" \
  "${data_dir}/avqa/from_vid_to_video_name.json" \
  "${data_dir}/music_avqa/music_avqa_all_videos_mapping.json" \
  "${data_dir}/avsd/avsd_all_videos_mapping.json" \
  "${scannet_dir}/scannet_from_scan_id_to_video_folder.json" \
  "${scannet_dir}/scannet_from_scan_id_to_video_folder.json" \
  --data_root \
  "${llava_dir}/1_2_m_academic_v0_1/languagebind_feat" \
  "${llava_dir}/1_2_m_youtube_v0_1/languagebind_feat" \
  "${llava_dir}/2_3_m_academic_v0_1/languagebind_feat" \
  "${llava_dir}/2_3_m_youtube_v0_1/languagebind_feat" \
  "${data_dir}/avqa/avqa_subset_audio_imagebind_feat" \
  "${data_dir}/music_avqa" \
  "${data_dir}/avsd/Charades_v1_audio_imagebind_feat" \
  "${scannet_dir}/video_features_new" \
  "${scannet_dir}/video_features_new" \
  --slow_path_data_root \
  "${llava_dir}/1_2_m_academic_v0_1/academic_source_ds" \
  "${llava_dir}/1_2_m_youtube_v0_1/liwei_youtube_videos_ds" \
  "${llava_dir}/2_3_m_academic_v0_1/academic_source_ds" \
  "${llava_dir}/2_3_m_youtube_v0_1/liwei_youtube_videos_ds" \
  "${data_dir}/avqa/avqa_subset" \
  "${data_dir}/music_avqa" \
  "${data_dir}/avsd/Charades_v1_480" \
  "${scannet_dir}/posed_images_new" \
  "${scannet_dir}/posed_images_new" \
  --use_fast_feat True \
  --use_slow True \
  --shuffle True \
  --mix_sampling_alpha 0.5 \
  --video_loading_backbone decord \
  --model_type unimvuv5_stage2 \
  --model_name_or_path lmms-lab/llava-onevision-qwen2-7b-ov \
  --version conv_llava_ov_qwen \
  --model_class VideoFeatModelArgumentsUniMVUV5Stage2_7B \
  --output_dir "${unimvu_root}/checkpoints/unimvuv5_qwen2_lora_alpha_128_all_mix_alpha05_7B" \
  --extra_trainable_modules modality_aggregator modality_projectors modality_special_token_aggregator modality_tokens \
  --num_train_epochs 3 \
  --per_device_train_batch_size 1 \
  --per_device_eval_batch_size 1 \
  --gradient_accumulation_steps 8 \
  --evaluation_strategy no \
  --save_strategy steps \
  --save_steps 1000 \
  --learning_rate 2e-5 \
  --weight_decay 0. \
  --warmup_ratio 0.03 \
  --lr_scheduler_type cosine \
  --ddp_find_unused_parameters True \
  --group_by_modality_length True \
  --logging_steps 1 \
  --model_max_length 2048 \
  --gradient_checkpointing True \
  --dataloader_num_workers 4 \
  --lazy_preprocess True \
  --report_to wandb \
  --bf16 True \
  --tf32 False \
  --mm_newline_position grid \
  --mm_spatial_pool_mode bilinear \
  --feat_combine_method add \
  --num_cross_modality_hidden_layers 1 \
  --support_modalities video audio 3d_feature dense_video \
  --modality_input_dims video:1024,audio:1024,3d_feature:1024,dense_video:1024