{
    "output_dir": "/home/user_1/tts-dev/indrivoice/raya-tts/hi_en/hi/omnivoice/exp_distill_hi_8step",
    "data_config": "/home/user_1/tts-dev/indrivoice/raya-tts/hi_en/hi/omnivoice/data_config_hi_dev_small.json",
    "llm_name_or_path": "Qwen/Qwen3-0.6B",
    "audio_vocab_size": 1025,
    "audio_mask_id": 1024,
    "num_audio_codebook": 8,
    "audio_codebook_weights": [
        8,
        8,
        6,
        6,
        4,
        4,
        2,
        2
    ],
    "drop_cond_ratio": 0.1,
    "prompt_ratio_range": [
        0.0,
        0.3
    ],
    "mask_ratio_range": [
        0.0,
        1.0
    ],
    "language_ratio": 0.8,
    "use_pinyin_ratio": 0.0,
    "instruct_ratio": 0.0,
    "only_instruct_ratio": 0.0,
    "resume_from_checkpoint": null,
    "init_from_checkpoint": "k2-fsa/OmniVoice",
    "learning_rate": 1e-05,
    "weight_decay": 0.01,
    "max_grad_norm": 1.0,
    "steps": 8000,
    "seed": 42,
    "lr_scheduler_type": "cosine",
    "warmup_type": "ratio",
    "warmup_ratio": 0.01,
    "warmup_steps": 0,
    "batch_tokens": 4096,
    "gradient_accumulation_steps": 1,
    "num_workers": 2,
    "mixed_precision": "bf16",
    "allow_tf32": true,
    "use_deepspeed": false,
    "deepspeed_config": null,
    "attn_implementation": "sdpa",
    "max_sample_tokens": 2000,
    "min_sample_tokens": 50,
    "max_batch_size": 32,
    "logging_steps": 50,
    "eval_steps": 500,
    "save_steps": 500,
    "keep_last_n_checkpoints": 3,
    "teacher_checkpoint": "k2-fsa/OmniVoice",
    "teacher_num_step": 16,
    "student_num_step": 8,
    "teacher_guidance_scale": 2.0,
    "teacher_t_shift": 0.1,
    "teacher_layer_penalty_factor": 5.0,
    "teacher_position_temperature": 0.0,
    "teacher_class_temperature": 0.0,
    "block_size_frames": 12,
    "use_block_reveal": true,
    "kd_ratio": 0.5,
    "kd_alpha": 0.6,
    "kd_temperature": 2.0,
    "kd_loss_type": "reverse_kl",
    "sample_reveal_step": true,
    "teacher_dtype": "float16"
}