shannon-control-unit / training_summary.json
hunterbown's picture
Update: Replace main adapter with validated 1B SCU model (6.2% BPT improvement)
71a6b60 verified
raw
history blame contribute delete
461 Bytes
{
"mode": "ce_kl_auto",
"model": "meta-llama/Llama-3.2-1B",
"steps": 270,
"N_tokens": 445718,
"target_S": 0.01,
"final_metrics": {
"data_bpt": 2.1664955498827014,
"param_bpt": 0.03528421491730657,
"total_bpt": 2.201779764800008,
"S_ratio": 0.016025315284206688,
"lambda": 0.46282422077910096
},
"avg_last_100": {
"data_bpt": 2.297084885769371,
"total_bpt": 2.3255800839060363,
"S_ratio": 0.01281555231171954
}
}