cortyx / meta_v2.json
QuantaSparkLabs's picture
Upload meta_v2.json with huggingface_hub
8b3b2e4 verified
{
"model": "cortyx_v2_final.pt",
"base": "microsoft/deberta-v3-small",
"version": "v2.0",
"epochs": 10,
"best_f1_macro": 0.6129,
"labels": [
"safe",
"mild_toxicity",
"severe_toxicity",
"harassment",
"hate_speech",
"threat",
"insult",
"profanity",
"sexual_content",
"violence",
"self_harm",
"extremism",
"illegal_instruction",
"jailbreak_attempt",
"prompt_injection",
"obfuscated_toxicity",
"misinformation_risk"
],
"thresholds": {
"safe": 0.5,
"mild_toxicity": 0.7,
"severe_toxicity": 0.4,
"harassment": 0.5,
"hate_speech": 0.45,
"threat": 0.4,
"insult": 0.55,
"profanity": 0.6,
"sexual_content": 0.45,
"violence": 0.4,
"self_harm": 0.35,
"extremism": 0.4,
"illegal_instruction": 0.45,
"jailbreak_attempt": 0.45,
"prompt_injection": 0.45,
"obfuscated_toxicity": 0.5,
"misinformation_risk": 0.5
},
"datasets": [
"QuantaSparkLabs/cortyx-safety-dataset",
"google/civil_comments",
"lmsys/toxic-chat",
"lmsys/lmsys-chat-1m",
"cardiffnlp/tweet_eval"
],
"training_samples": 1844,
"val_samples": 462
}