MachFund / model_card.json
firstsko's picture
Upload mach-fund-1 merged model (Qwen2.5-3B fine-tuned)
bf8ca78 verified
raw
history blame contribute delete
555 Bytes
{
"model_name": "mach-fund-1",
"base_model": "Qwen/Qwen2.5-3B-Instruct",
"training": {
"train_samples": 6976,
"eval_samples": 769,
"epochs": 2,
"lora_rank": 32,
"batch_size": 2,
"grad_accum": 8,
"max_seq_len": 6144,
"total_steps": 872,
"train_loss": 0.9269,
"train_time_min": 141.0,
"gpu": "NVIDIA A100 80GB PCIe",
"completed_at": "2026-03-21 06:58:25"
},
"merged_at": "2026-03-21 16:13:47",
"description": "Private equity fund analysis model, distilled from Gemini 2.5 Pro"
}