{ "model_name": "meta-llama/Llama-3.2-1B", "output_dir": "models/scu_fixed_sigma_20250903_222442", "mode": "ce_kl_auto", "max_steps": 270, "max_epochs": 10, "num_epochs": null, "batch_size": 1, "gradient_accumulation_steps": 4, "learning_rate": 0.0005, "fp16": true, "data_path": "training_data/train_512k.txt", "sample_size": 2000000, "lora_r": 16, "lora_alpha": 32, "prior_sigma": 0.1, "target_S": 0.01, "lam_init": 1.0, "l2_weight": 0.1 }