brick-complexity-2-max / training_metadata.json
massaindustries's picture
Initial LoRA adapter upload
d790e60 verified
{
  "config": {
    "base": "Qwen/Qwen3.5-0.8B",
    "train": "/data/dataset/train_llm_judged_122b.jsonl",
    "val": "/data/dataset/val_llm_judged_122b.jsonl",
    "test": "/data/dataset/test_llm_judged_122b.jsonl",
    "output": "/data/output/qwen35-judged-asym-lora",
    "epochs": 3,
    "batch_size": 16,
    "lr": 1e-4,
    "max_length": 768,
    "lora_r": 32,
    "lora_alpha": 32,
    "lora_dropout": 0.1,
    "over_lambda": 0.7,
    "label_smoothing": 0.08,
    "medium_boost": 1.0,
    "hard_boost": 1.0,
    "symmetric_smoothing": false,
    "eval_steps": 500
  },
  "training_time_s": 7645.5,
  "system_prompt": "PRODUCTION (for Brick drop-in compatibility)",
  "test": {
    "n": 4571,
    "accuracy": 0.7716035878363596,
    "over_rate": 0.06234959527455699,
    "under_rate": 0.16604681688908335,
    "macro_f1": 0.7707187288592569
  }
}