{ "base_model": "unsloth/DeepSeek-R1-Distill-Llama-8B", "training_dataset": "nvidia/OpenCodeReasoning", "training_method": "LoRA", "lora_rank": 16, "lora_alpha": 16, "difficulty_filter": [ "VERY_HARD", 10, 11 ], "max_seq_length": 2048, "training_date": "2025-07-12", "framework": "unsloth", "compatible_for_further_training": true }