CognitiveMemoryLayer-models / forgetting_action_policy_epoch_stats.json
avinashm's picture
Upload all trained models
e65379c verified
{
"task": "forgetting_action_policy",
"epoch_stats": [
{
"epoch": 1,
"train_loss": 1.2100253536409593,
"eval_macro_f1": 0.8943120476934178,
"eval_accuracy": 0.8914
},
{
"epoch": 2,
"train_loss": 0.6452919559225608,
"eval_macro_f1": 0.9476649277600788,
"eval_accuracy": 0.9484
},
{
"epoch": 3,
"train_loss": 0.482522361606962,
"eval_macro_f1": 0.9696191896424656,
"eval_accuracy": 0.9696
},
{
"epoch": 4,
"train_loss": 0.3768140496231193,
"eval_macro_f1": 0.9718038787431208,
"eval_accuracy": 0.9718
},
{
"epoch": 5,
"train_loss": 0.2870782903271907,
"eval_macro_f1": 0.9796027083744441,
"eval_accuracy": 0.9796
},
{
"epoch": 6,
"train_loss": 0.20888356409232609,
"eval_macro_f1": 0.9825928670083165,
"eval_accuracy": 0.9826
},
{
"epoch": 7,
"train_loss": 0.15703109322336797,
"eval_macro_f1": 0.9839922007228425,
"eval_accuracy": 0.984
},
{
"epoch": 8,
"train_loss": 0.11633934278838558,
"eval_macro_f1": 0.9835931767915431,
"eval_accuracy": 0.9836
}
],
"training_summary": {
"actual_epochs": 8,
"best_epoch": 7,
"early_stopped": false,
"backbone_model_name": "microsoft/deberta-v3-base",
"tokenizer_name": "microsoft/deberta-v3-base",
"selection_metric": "macro_f1",
"selection_value": 0.9839922007228425
},
"calibration": {
"method": "temperature_grid_search",
"rows": 5000,
"temperature": 2.0,
"loss": 0.08134587520392533
},
"hf_model_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/forgetting_action_policy_hf"
}