{
  "base_model": "unsloth/DeepSeek-R1-Distill-Llama-8B",
  "training_dataset": "nvidia/OpenCodeReasoning",
  "training_method": "LoRA",
  "lora_rank": 16,
  "lora_alpha": 16,
  "difficulty_filter": [
    "VERY_HARD",
    10,
    11
  ],
  "max_seq_length": 2048,
  "training_date": "2025-07-12",
  "framework": "unsloth",
  "compatible_for_further_training": true
}