Spatial-Omni / train_args.json
dieKarotte's picture
Add files using upload-large-folder tool
3f73500 verified
Raw
History Blame Contribute Delete
1.92 kB
{
  "attn_impl": "sdpa",
  "audio_feature_cache_manifest": "path_to_your_audio_cache/manifest.json",
  "audio_feature_cache_max_entries": 256,
  "batch_size": 2,
  "beats_checkpoint": "path_to_your_SO_encoder_checkpoint",
  "beats_lr": 1e-06,
  "beats_repo": "",
  "device": "cuda:0",
  "distributed": true,
  "dtype": "bfloat16",
  "encoder_token_rate": 10.0,
  "epochs": 3,
  "grad_accum_steps": 3,
  "gradient_checkpointing": false,
  "local_rank": 0,
  "log_every": 10,
  "lora_alpha": 32,
  "lora_dropout": 0.05,
  "lora_lr": 3e-05,
  "lora_r": 16,
  "lora_target_modules": ["q_proj", "k_proj", "v_proj", "o_proj"],
  "lora_target_prefixes": ["thinker.model"],
  "lr": 3e-05,
  "max_grad_norm": 1.0,
  "max_train_samples": null,
  "max_valid_samples": null,
  "model_id": "path_to_original_Qwen2.5-Omni-7B",
  "num_workers": 8,
  "optimizer_step_per_batch": false,
  "output_dir": "output",
  "persistent_workers": true,
  "prefetch_factor": 4,
  "projector_fp32": false,
  "projector_lr": 1e-06,
  "projector_shuffle_factor": 4,
  "projector_type": "pixel_shuffle",
  "projector_weight_decay": null,
  "qa_root": "path_to_SO_Dataset/qa",
  "qa_roots": ["path_to_SO_Dataset/qa"],
  "rank": 0,
  "resume_checkpoint_path": "path_to_SO_7b_pretrain_checkpoint",
  "resume_model_only": false,
  "resume_tag": null,
  "save_every_epoch": true,
  "save_every_n_optimizer_steps": 1000,
  "save_full_model": false,
  "seed": 1234,
  "so_repo": "",
  "step_valid_subset_ratio": 0.05,
  "train_mode": "beats_lora",
  "train_split": "train",
  "valid_do_sample": false,
  "valid_every_n_optimizer_steps": 1000,
  "valid_generate_batch_size": 1,
  "valid_generate_full": true,
  "valid_generate_max_samples": 32,
  "valid_max_new_tokens": 96,
  "valid_num_beams": 1,
  "valid_split": "valid",
  "valid_subset_ratio": 0.1,
  "warmup_ratio": 0.03,
  "weight_decay": 0.01,
  "world_size": 8
}