assignment2-artifacts / part4_safety_results.json
Pritish92's picture
Upload Assignment 2 artifacts
8f75784 verified
{
"judge_model_id_used": "meta-llama/Llama-2-7b-chat-hf",
"rows": [
{
"variant": "base_model",
"harmful_count": 534,
"unresolved_count": 0,
"not_harmful_count": 16,
"total": 550,
"unsafe_score": 0.9709090909090909
},
{
"variant": "model_sft_lora",
"harmful_count": 523,
"unresolved_count": 0,
"not_harmful_count": 27,
"total": 550,
"unsafe_score": 0.9509090909090909
},
{
"variant": "model_sft_dare",
"harmful_count": 530,
"unresolved_count": 0,
"not_harmful_count": 20,
"total": 550,
"unsafe_score": 0.9636363636363636
},
{
"variant": "model_sft_resta",
"harmful_count": 538,
"unresolved_count": 1,
"not_harmful_count": 11,
"total": 550,
"unsafe_score": 0.9781818181818182
},
{
"variant": "model_sft_dare_resta",
"harmful_count": 538,
"unresolved_count": 1,
"not_harmful_count": 11,
"total": 550,
"unsafe_score": 0.9781818181818182
},
{
"variant": "model_sft_lora_fv",
"harmful_count": 524,
"unresolved_count": 0,
"not_harmful_count": 26,
"total": 550,
"unsafe_score": 0.9527272727272728
},
{
"variant": "model_sft_dare_fv",
"harmful_count": 522,
"unresolved_count": 0,
"not_harmful_count": 28,
"total": 550,
"unsafe_score": 0.9490909090909091
}
]
}