{
  "model_name": "microsoft/deberta-v3-large",
  "dataset_name": "jainsatyam26/guardrail-215k-splits",
  "max_length": 512,
  "epochs": 4,
  "batch_size": 8,
  "grad_accum": 4,
  "learning_rate": 1e-05,
  "weight_decay": 0.01,
  "warmup_ratio": 0.1,
  "use_llrd": true,
  "llrd_alpha": 0.9,
  "use_multisample_dropout": true,
  "num_dropout_samples": 5,
  "dropout_rate": 0.3,
  "use_label_smoothing": true,
  "label_smoothing": 0.1,
  "use_focal_loss": true,
  "focal_alpha": 0.7,
  "focal_gamma": 2.0,
  "use_hard_negative": true,
  "hard_negative_ratio": 0.3,
  "num_folds": 3,
  "optimize_thresholds": true,
  "output_dir": "./guardrail_model",
  "checkpoint_steps": 500,
  "logging_steps": 50,
  "eval_steps": 500,
  "hf_repo_id": "jainsatyam26/bertclassfier",
  "hf_token": "***REDACTED***",
  "deploy_every_minutes": 30,
  "deploy_every_steps": 400,
  "auto_deploy": true,
  "private_repo": false,
  "auto_resume": true,
  "resume_from_hf": true,
  "use_wandb": true,
  "wandb_project": "safety-classifier",
  "fp16": false,
  "bf16": true,
  "dataloader_num_workers": 4,
  "seed": 42
}