danxh
/

Math-MCQ-Generator-v1

Text Generation

Model card Files Files and versions

Math-MCQ-Generator-v1 / training_info.json

danxh's picture

Upload training_info.json with huggingface_hub

8332f1f verified 5 months ago

history blame contribute delete

465 Bytes

	{
	"model_name": "Math-MCQ-Generator-v1",
	"base_model": "deepseek-ai/deepseek-math-7b-instruct",
	"training_method": "QLoRA (4-bit quantization)",
	"upload_date": "2025-09-03T22:27:38.364105",
	"dataset_size": 1519,
	"epochs": 5,
	"final_loss": "~0.20",
	"date": "2025-09-03",
	"lora_config": {
	"r": 64,
	"lora_alpha": 128,
	"target_modules": [
	"q_proj",
	"v_proj",
	"k_proj",
	"o_proj"
	],
	"lora_dropout": 0.05
	}
	}