File size: 2,841 Bytes
36cc3ec
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
{
  "hyperparameters": {
    "include_attention_output_dense": false,
    "learning_rate_sampled": 0.00044569416489470884,
    "weight_decay": 0.022491619139739856,
    "warmup_ratio": 0.0463266472104081,
    "lr_scheduler_num_cycles": 1,
    "per_device_train_batch_size": 8,
    "gradient_accumulation_steps": 4,
    "num_train_epochs": 2,
    "lora_r": 32,
    "lora_alpha": 128,
    "lora_dropout": 0.0,
    "lora_target_modules": [
      "query_proj",
      "key_proj",
      "value_proj"
    ],
    "learning_rate": 4.456941648947089e-05,
    "lr_scheduler_type": "cosine_with_restarts",
    "max_grad_norm": 0.5,
    "optim": "adamw_torch_fused"
  },
  "threshold_optimization": {
    "max_f1": {
      "threshold": 0.9032942056655884,
      "metrics": {
        "threshold": 0.9032942056655884,
        "auroc": 0.9969044529302581,
        "average_precision": 0.9965060417039346,
        "f1": 0.9734939759036144,
        "accuracy": 0.9762551119595773,
        "precision": 0.9854536098796707,
        "recall": 0.9618211495185389,
        "specificity": 0.9882255881198587,
        "precision_human": 0.9689546846776094,
        "recall_human": 0.9882255881198587,
        "precision_ai": 0.9854536098796707,
        "recall_ai": 0.9618211495185389,
        "confusion_matrix": {
          "true_negative": 123377,
          "false_positive": 1470,
          "false_negative": 3953,
          "true_positive": 99586
        }
      }
    },
    "precision_at_95recall": {
      "threshold": 5.1442217227304354e-05,
      "metrics": {
        "threshold": 5.1442217227304354e-05,
        "auroc": 0.9969044529302581,
        "average_precision": 0.9965060417039346,
        "f1": 0.6238698501167432,
        "accuracy": 0.45335090592242955,
        "precision": 0.45335090592242955,
        "recall": 1.0,
        "specificity": 0.0,
        "precision_human": 0.0,
        "recall_human": 0.0,
        "precision_ai": 0.45335090592242955,
        "recall_ai": 1.0,
        "confusion_matrix": {
          "true_negative": 0,
          "false_positive": 124847,
          "false_negative": 0,
          "true_positive": 103539
        }
      }
    }
  },
  "test_metrics": {
    "threshold": 0.9032942056655884,
    "auroc": 0.9970131530896283,
    "average_precision": 0.9966291954050931,
    "f1": 0.9739500109946493,
    "accuracy": 0.976658040956797,
    "precision": 0.9856685063200997,
    "recall": 0.9625068814649552,
    "specificity": 0.9883938869665513,
    "precision_human": 0.9695005538925684,
    "recall_human": 0.9883938869665513,
    "precision_ai": 0.9856685063200997,
    "recall_ai": 0.9625068814649552,
    "confusion_matrix": {
      "true_negative": 123399,
      "false_positive": 1449,
      "false_negative": 3882,
      "true_positive": 99657
    }
  },
  "timestamp": "20251113_111139",
  "seed": 42
}