bertclassfier / training_config.json
jainsatyam26's picture
Auto-deploy: Step 400 | F1: N/A
dfb99c0 verified
{
  "model_name": "microsoft/deberta-v3-large",
  "dataset_name": "jainsatyam26/guardrail-215k-splits",
  "max_length": 512,
  "epochs": 4,
  "batch_size": 8,
  "grad_accum": 4,
  "learning_rate": 1e-05,
  "weight_decay": 0.01,
  "warmup_ratio": 0.1,
  "use_llrd": true,
  "llrd_alpha": 0.9,
  "use_multisample_dropout": true,
  "num_dropout_samples": 5,
  "dropout_rate": 0.3,
  "use_label_smoothing": true,
  "label_smoothing": 0.1,
  "use_focal_loss": true,
  "focal_alpha": 0.7,
  "focal_gamma": 2.0,
  "use_hard_negative": true,
  "hard_negative_ratio": 0.3,
  "num_folds": 3,
  "optimize_thresholds": true,
  "output_dir": "./guardrail_model",
  "checkpoint_steps": 500,
  "logging_steps": 50,
  "eval_steps": 500,
  "hf_repo_id": "jainsatyam26/bertclassfier",
  "hf_token": null,
  "deploy_every_minutes": 30,
  "deploy_every_steps": 400,
  "auto_deploy": true,
  "private_repo": false,
  "auto_resume": true,
  "resume_from_hf": true,
  "use_wandb": true,
  "wandb_project": "safety-classifier",
  "fp16": false,
  "bf16": true,
  "dataloader_num_workers": 4,
  "seed": 42
}