{
  "config": {
    "base": "Qwen/Qwen3.5-0.8B",
    "train": "/data/dataset/train_llm_judged_122b.jsonl",
    "val": "/data/dataset/val_llm_judged_122b.jsonl",
    "test": "/data/dataset/test_llm_judged_122b.jsonl",
    "output": "/data/output/qwen35-judged-asym-lora",
    "epochs": 3,
    "batch_size": 16,
    "lr": "1e-4",
    "max_length": 768,
    "lora_r": 32,
    "lora_alpha": 32,
    "lora_dropout": 0.1,
    "over_lambda": 0.7,
    "label_smoothing": 0.08,
    "medium_boost": 1.0,
    "hard_boost": 1.0,
    "symmetric_smoothing": false,
    "eval_steps": 500
  },
  "training_time_s": 7645.5,
  "system_prompt": "PRODUCTION (for Brick drop-in compatibility)",
  "test": {
    "n": 4571,
    "accuracy": 0.7716035878363596,
    "over_rate": 0.06234959527455699,
    "under_rate": 0.16604681688908335,
    "macro_f1": 0.7707187288592569
  }
}