{
  "model_name": "microsoft/deberta-v3-large",
  "dataset_name": "jainsatyam26/guardrail-215k-splits",
  "max_length": 512,
  "epochs": 4,
  "batch_size": 8,
  "grad_accum": 4,
  "learning_rate": 1e-05,
  "weight_decay": 0.01,
  "warmup_ratio": 0.1,
  "use_llrd": true,
  "llrd_alpha": 0.9,
  "use_multisample_dropout": true,
  "num_dropout_samples": 5,
  "dropout_rate": 0.3,
  "use_label_smoothing": true,
  "label_smoothing": 0.1,
  "use_focal_loss": true,
  "focal_alpha": 0.7,
  "focal_gamma": 2.0,
  "use_hard_negative": true,
  "hard_negative_ratio": 0.3,
  "num_folds": 3,
  "optimize_thresholds": true,
  "output_dir": "./guardrail_model",
  "checkpoint_steps": 500,
  "logging_steps": 50,
  "eval_steps": 500,
  "hf_repo_id": "jainsatyam26/bertclassfier",
  "hf_token": "***REDACTED***",
  "deploy_every_minutes": 30,
  "deploy_every_steps": 400,
  "auto_deploy": true,
  "private_repo": false,
  "auto_resume": true,
  "resume_from_hf": true,
  "use_wandb": true,
  "wandb_project": "safety-classifier",
  "fp16": false,
  "bf16": true,
  "dataloader_num_workers": 4,
  "seed": 42
}