paper7-bert-layer-analysis / results /sst2_layer_analysis.json
leoncynn's picture
Upload folder using huggingface_hub
2c6b8f0 verified
{
"task": "sst2",
"orig_acc": 0.934,
"layers": {
"0": {
"sep": 89225.16024069591,
"delta": 89225.16024069591,
"acc": 0.53,
"role": "embedding"
},
"1": {
"sep": 129.12223518499397,
"delta": -89096.03800551091,
"acc": 0.544,
"role": "harmful (separability decrease)"
},
"2": {
"sep": 109.14816514194835,
"delta": -19.974070043045614,
"acc": 0.588,
"role": "harmful (separability decrease)"
},
"3": {
"sep": 119.95343254648107,
"delta": 10.805267404532714,
"acc": 0.598,
"role": "critical (separability boost)"
},
"4": {
"sep": 82.62206736035587,
"delta": -37.3313651861252,
"acc": 0.552,
"role": "harmful (separability decrease)"
},
"5": {
"sep": 64.85882702122912,
"delta": -17.763240339126753,
"acc": 0.684,
"role": "harmful (separability decrease)"
},
"6": {
"sep": 56.68732706293641,
"delta": -8.171499958292706,
"acc": 0.614,
"role": "harmful (separability decrease)"
},
"7": {
"sep": 57.44462349827881,
"delta": 0.757296435342397,
"acc": 0.74,
"role": "moderate"
},
"8": {
"sep": 67.34111023033665,
"delta": 9.896486732057845,
"acc": 0.622,
"role": "important"
},
"9": {
"sep": 95.00798469418417,
"delta": 27.66687446384752,
"acc": 0.88,
"role": "critical (separability boost)"
},
"10": {
"sep": 119.43788584435403,
"delta": 24.429901150169854,
"acc": 0.924,
"role": "critical (separability boost)"
},
"11": {
"sep": 133.79458581341888,
"delta": 14.356699969064849,
"acc": 0.932,
"role": "critical (separability boost)"
},
"12": {
"sep": 171.96615672879156,
"delta": 38.17157091537268,
"acc": 0.938,
"role": "critical (separability boost)"
}
},
"ffn": {
"0": {
"attn": 0.606,
"ffn": 0.544,
"delta": -0.061999999999999944,
"verdict": "harmful"
},
"1": {
"attn": 0.548,
"ffn": 0.588,
"delta": 0.039999999999999925,
"verdict": "beneficial"
},
"2": {
"attn": 0.538,
"ffn": 0.598,
"delta": 0.05999999999999994,
"verdict": "beneficial"
},
"3": {
"attn": 0.53,
"ffn": 0.552,
"delta": 0.02200000000000002,
"verdict": "beneficial"
},
"4": {
"attn": 0.614,
"ffn": 0.684,
"delta": 0.07000000000000006,
"verdict": "beneficial"
},
"5": {
"attn": 0.536,
"ffn": 0.614,
"delta": 0.07799999999999996,
"verdict": "beneficial"
},
"6": {
"attn": 0.674,
"ffn": 0.74,
"delta": 0.06599999999999995,
"verdict": "beneficial"
},
"7": {
"attn": 0.792,
"ffn": 0.622,
"delta": -0.17000000000000004,
"verdict": "harmful"
},
"8": {
"attn": 0.866,
"ffn": 0.88,
"delta": 0.014000000000000012,
"verdict": "beneficial"
},
"9": {
"attn": 0.914,
"ffn": 0.924,
"delta": 0.010000000000000009,
"verdict": "beneficial"
},
"10": {
"attn": 0.93,
"ffn": 0.932,
"delta": 0.0020000000000000018,
"verdict": "neutral"
},
"11": {
"attn": 0.932,
"ffn": 0.938,
"delta": 0.005999999999999894,
"verdict": "neutral"
}
},
"error_analysis": {
"total_wrong": 30,
"c0_to_c1": 7,
"c1_to_c0": 23,
"avg_margin": 0.3854449843858634
}
}