{ "run_name": "docket-duration", "base_model": "answerdotai/ModernBERT-large", "push_to_hub": "nadahlberg/docket-duration", "run_args": { "max_length": 768, "labels": [ "DURATION", "IMPRISONMENT_DURATION", "SUPERVISED_RELEASE_DURATION" ], "return_offsets_mapping": true }, "training_args": { "num_train_epochs": 2, "per_device_train_batch_size": 4, "per_device_eval_batch_size": 4, "gradient_accumulation_steps": 4, "learning_rate": 5e-05, "warmup_ratio": 0.05, "weight_decay": 0.1, "max_grad_norm": 1, "save_total_limit": 2, "load_best_model_at_end": true, "eval_steps": 0.1, "save_steps": 0.1, "eval_strategy": "steps", "report_to": "tensorboard" }, "model_args": {}, "routine": "multi-task" }