---
# LoRA fine-tuning configuration (language code `ne`, base model
# openbmb/VoxCPM2).
#
# NOTE(review): this file was restored to block style from a version whose
# newlines and indentation had been lost. All keys and values are unchanged;
# the nesting below was reconstructed from key order and meaning. Confirm
# section membership against the config loader where marked.

# Dataset location and audio format.
data:
  language: ne
  sample_rate: 16000
  # NOTE(review): assumed to belong to `data` (it sits between `sample_rate`
  # and the manifest paths in the original key order) - confirm.
  hf_dataset_id: Firoj112/voxcpm-nepali-data
  train_manifest: finetuning_data/manifests/train_manifest.jsonl
  val_manifest: finetuning_data/manifests/val_manifest.jsonl

# Description of the target machine.
hardware:
  gpu_count: 1
  load_in_4bit: false
  # Also set under `training`; both are currently `true`. Keep them in sync.
  gradient_checkpointing: true
  vram_gb_per_gpu: 24.0

# LoRA adapter settings.
lora:
  alpha: 96
  # The plain scalar `none` is the string "none", not a YAML null.
  bias: none
  dropout: 0.05
  enabled: true
  rank: 96
  target_modules:
    - q_proj
    - v_proj
    - k_proj
    - o_proj

# Descriptive tags for this config.
metadata:
  config_type: lora
  language: ne
  # Quoted so it stays a string rather than the integer 2.
  model_version: '2'

# Base model to fine-tune.
model:
  name_or_path: openbmb/VoxCPM2
  optimize: false
  # Quoted so it stays a string rather than the integer 2.
  version: '2'

# Optimisation loop settings.
training:
  amp: bf16
  bf16: true
  dataloader_num_workers: 0
  ddp_find_unused_parameters: false
  # NOTE(review): both `epochs` and `max_steps` are set; which one ends
  # training depends on the trainer - confirm the intended stop condition.
  epochs: 20
  eval_steps: 500
  fp16: false
  gradient_accumulation_steps: 32
  gradient_checkpointing: true
  # Kept in plain decimal form: exponent forms such as `5e-5` are read as
  # strings by some YAML parsers.
  learning_rate: 0.00005
  logging_steps: 50
  max_grad_norm: 1.0
  max_steps: 20000
  output_dir: ./checkpoints/lora_nepali_v2
  per_device_train_batch_size: 1
  report_to:
    - wandb
    - tensorboard
  save_steps: 500
  warmup_steps: 500
  lr_scheduler_type: cosine

# Weights & Biases logging options.
# NOTE(review): placed at top level because the section names
# (data, hardware, lora, metadata, model, training, wandb) are in
# alphabetical order; confirm the loader does not expect `training.wandb`.
wandb:
  log_model: checkpoint
  project: Vox-CPM-Nepali-Fine-Tune
  watch: gradients