{
  "release_dir": null,
  "preprocessed_dir": "data",
  "model_architecture": "MultiHeadGuardModel",
  "training_format": "multitask_structured",
  "num_categories": 13,
  "category_vocabulary": [
    "animal_cruelty",
    "fraud_and_social_engineering",
    "harassment_and_bullying",
    "hate_speech",
    "human_trafficking",
    "illegal_drugs",
    "non_consensual_sexual_content",
    "offensive_cyber",
    "property_crime_and_theft",
    "self_harm_and_suicide",
    "terrorism_and_extremism",
    "violence",
    "weapons_and_firearms"
  ],
  "hyperparameters": {
    "lambda_cat": 0.1,
    "epochs": 1,
    "batch_size": 512,
    "grad_accum": 1,
    "effective_batch": 512,
    "backbone_lr": 5e-05,
    "head_lr": 0.0005,
    "lr_scheduler": "cosine",
    "warmup_steps": null,
    "warmup_ratio": 0.05,
    "weight_decay": 0.01,
    "max_grad_norm": 1.0,
    "max_length": 512,
    "dropout": 0.1,
    "use_lora": false,
    "lora_rank": null,
    "lora_alpha": null,
    "lora_dropout": null,
    "gradient_checkpointing": true,
    "pack_sequences": true
  }
}