1-parameter-classifier / stage_4c /training_log.json
phanerozoic's picture
Stage 4C: direct classifier-score supervision, F1 0.729 (+0.006 over 4B)
faf011c verified
{
"student_params": 3267304,
"loss": "MSE_on_classifier_scalar",
"epochs": [
{
"epoch": 1,
"loss": 338.8909246066799,
"F1": 0.7214378118515015,
"precision": 0.5653923749923706,
"recall": 0.9964538812637329,
"threshold": 24.078125
},
{
"epoch": 2,
"loss": 328.9103960763321,
"F1": 0.7205128073692322,
"precision": 0.564257025718689,
"recall": 0.9964538812637329,
"threshold": 28.883697509765625
},
{
"epoch": 3,
"loss": 328.8529856922911,
"F1": 0.72258061170578,
"precision": 0.5679513216018677,
"recall": 0.9929078221321106,
"threshold": 28.009765625
},
{
"epoch": 4,
"loss": 326.7125272106021,
"F1": 0.7221510410308838,
"precision": 0.5651302337646484,
"recall": 1.0,
"threshold": 26.10400390625
},
{
"epoch": 5,
"loss": 325.2882255967271,
"F1": 0.7241829633712769,
"precision": 0.5734989643096924,
"recall": 0.9822695255279541,
"threshold": 26.7830810546875
},
{
"epoch": 6,
"loss": 326.14567763865386,
"F1": 0.7298701405525208,
"precision": 0.5758196711540222,
"recall": 0.9964538812637329,
"threshold": 26.697509765625
},
{
"epoch": 7,
"loss": 325.15346100816646,
"F1": 0.7221510410308838,
"precision": 0.5651302337646484,
"recall": 1.0,
"threshold": 24.860595703125
},
{
"epoch": 8,
"loss": 321.891113616252,
"F1": 0.7402032017707825,
"precision": 0.6265356540679932,
"recall": 0.9042553305625916,
"threshold": 25.110595703125
},
{
"epoch": 9,
"loss": 324.80503095718103,
"F1": 0.7258687615394592,
"precision": 0.5696969628334045,
"recall": 1.0,
"threshold": 24.62255859375
},
{
"epoch": 10,
"loss": 323.8681324547888,
"F1": 0.7338129878044128,
"precision": 0.6174334287643433,
"recall": 0.9042553305625916,
"threshold": 25.044189453125
},
{
"epoch": 11,
"loss": 322.2317366366947,
"F1": 0.7270233035087585,
"precision": 0.5928411483764648,
"recall": 0.9397163391113281,
"threshold": 25.876220703125
},
{
"epoch": 12,
"loss": 323.8775074345158,
"F1": 0.7272727489471436,
"precision": 0.5786163806915283,
"recall": 0.978723406791687,
"threshold": 26.55078125
},
{
"epoch": 13,
"loss": 322.46046450084134,
"F1": 0.729658842086792,
"precision": 0.5791666507720947,
"recall": 0.9858155846595764,
"threshold": 25.8525390625
},
{
"epoch": 14,
"loss": 321.4742774784218,
"F1": 0.7279894948005676,
"precision": 0.5782880783081055,
"recall": 0.9822695255279541,
"threshold": 25.83251953125
},
{
"epoch": 15,
"loss": 322.15041381942024,
"F1": 0.7289474010467529,
"precision": 0.5794979333877563,
"recall": 0.9822695255279541,
"threshold": 25.84033203125
}
]
}