tiny-router-checkpoint / metrics.json
Dexifried's picture
Tiny-router checkpoint (encoder=microsoft/MiniLM-L12-H384-uncased, epochs=10)
db34ed6 verified
{
"per_head": {
"relation_to_previous": {
"accuracy": 0.8768,
"macro_f1": 0.7893,
"per_label": {
"new": {
"precision": 1.0,
"recall": 1.0,
"f1": 1.0,
"support": 102
},
"follow_up": {
"precision": 0.8764,
"recall": 0.9176,
"f1": 0.8966,
"support": 85
},
"correction": {
"precision": 0.6786,
"recall": 0.6552,
"f1": 0.6667,
"support": 29
},
"confirmation": {
"precision": 0.8235,
"recall": 0.7,
"f1": 0.7568,
"support": 20
},
"cancellation": {
"precision": 0.7143,
"recall": 0.4762,
"f1": 0.5714,
"support": 21
},
"closure": {
"precision": 0.7308,
"recall": 1.0,
"f1": 0.8444,
"support": 19
}
},
"confusion_matrix": [
[
102,
0,
0,
0,
0,
0
],
[
0,
78,
3,
0,
2,
2
],
[
0,
5,
19,
2,
2,
1
],
[
0,
3,
0,
14,
0,
3
],
[
0,
3,
6,
1,
10,
1
],
[
0,
0,
0,
0,
0,
19
]
]
},
"actionability": {
"accuracy": 0.7101,
"macro_f1": 0.6834,
"per_label": {
"none": {
"precision": 0.6786,
"recall": 0.623,
"f1": 0.6496,
"support": 61
},
"review": {
"precision": 0.6571,
"recall": 0.5823,
"f1": 0.6174,
"support": 79
},
"act": {
"precision": 0.7467,
"recall": 0.8235,
"f1": 0.7832,
"support": 136
}
},
"confusion_matrix": [
[
38,
13,
10
],
[
5,
46,
28
],
[
13,
11,
112
]
]
},
"retention": {
"accuracy": 0.7029,
"macro_f1": 0.6849,
"per_label": {
"ephemeral": {
"precision": 0.6628,
"recall": 0.6404,
"f1": 0.6514,
"support": 89
},
"useful": {
"precision": 0.7025,
"recall": 0.7929,
"f1": 0.745,
"support": 140
},
"remember": {
"precision": 0.8125,
"recall": 0.5532,
"f1": 0.6582,
"support": 47
}
},
"confusion_matrix": [
[
57,
31,
1
],
[
24,
111,
5
],
[
5,
16,
26
]
]
},
"urgency": {
"accuracy": 0.6449,
"macro_f1": 0.5777,
"per_label": {
"low": {
"precision": 0.7536,
"recall": 0.7647,
"f1": 0.7591,
"support": 136
},
"medium": {
"precision": 0.5357,
"recall": 0.6316,
"f1": 0.5797,
"support": 95
},
"high": {
"precision": 0.5385,
"recall": 0.3111,
"f1": 0.3944,
"support": 45
}
},
"confusion_matrix": [
[
104,
28,
4
],
[
27,
60,
8
],
[
7,
24,
14
]
]
}
},
"overall": {
"exact_match": 0.3406,
"macro_average_f1": 0.6838,
"automation_safe_accuracy": 0.6222,
"automation_safe_coverage": 0.163,
"confidence_threshold": 0.8,
"confidence_calibration": {
"ece": 0.395419,
"bins": [
{
"range": [
0.5,
0.6
],
"count": 6,
"avg_confidence": 0.5757,
"accuracy": 0.3333
},
{
"range": [
0.6,
0.7
],
"count": 86,
"avg_confidence": 0.6646,
"accuracy": 0.2326
},
{
"range": [
0.7,
0.8
],
"count": 139,
"avg_confidence": 0.7484,
"accuracy": 0.3165
},
{
"range": [
0.8,
0.9
],
"count": 42,
"avg_confidence": 0.8384,
"accuracy": 0.5952
},
{
"range": [
0.9,
1.0
],
"count": 3,
"avg_confidence": 0.9038,
"accuracy": 1.0
}
]
}
},
"temperature_scaling": {
"method": "per_head_temperature_scaling",
"per_head": {
"relation_to_previous": 0.630957,
"actionability": 0.891251,
"retention": 0.944061,
"urgency": 0.891251
}
}
}