code-reasoning-deepseek-8b / training_metadata.json
Soumyajit-7's picture
Add training metadata
0d1f03d verified
raw
history blame contribute delete
366 Bytes
{
"base_model": "unsloth/DeepSeek-R1-Distill-Llama-8B",
"training_dataset": "nvidia/OpenCodeReasoning",
"training_method": "LoRA",
"lora_rank": 16,
"lora_alpha": 16,
"difficulty_filter": [
"VERY_HARD",
10,
11
],
"max_seq_length": 2048,
"training_date": "2025-07-12",
"framework": "unsloth",
"compatible_for_further_training": true
}