Math-MCQ-Generator-v1 / training_info.json
danxh's picture
Upload training_info.json with huggingface_hub
8332f1f verified
raw
history blame contribute delete
465 Bytes
{
  "model_name": "Math-MCQ-Generator-v1",
  "base_model": "deepseek-ai/deepseek-math-7b-instruct",
  "training_method": "QLoRA (4-bit quantization)",
  "upload_date": "2025-09-03T22:27:38.364105",
  "dataset_size": 1519,
  "epochs": 5,
  "final_loss": "~0.20",
  "date": "2025-09-03",
  "lora_config": {
    "r": 64,
    "lora_alpha": 128,
    "target_modules": [
      "q_proj",
      "v_proj",
      "k_proj",
      "o_proj"
    ],
    "lora_dropout": 0.05
  }
}