| { |
| "task": "forgetting_action_policy", |
| "epoch_stats": [ |
| { |
| "epoch": 1, |
| "train_loss": 1.2100253536409593, |
| "eval_macro_f1": 0.8943120476934178, |
| "eval_accuracy": 0.8914 |
| }, |
| { |
| "epoch": 2, |
| "train_loss": 0.6452919559225608, |
| "eval_macro_f1": 0.9476649277600788, |
| "eval_accuracy": 0.9484 |
| }, |
| { |
| "epoch": 3, |
| "train_loss": 0.482522361606962, |
| "eval_macro_f1": 0.9696191896424656, |
| "eval_accuracy": 0.9696 |
| }, |
| { |
| "epoch": 4, |
| "train_loss": 0.3768140496231193, |
| "eval_macro_f1": 0.9718038787431208, |
| "eval_accuracy": 0.9718 |
| }, |
| { |
| "epoch": 5, |
| "train_loss": 0.2870782903271907, |
| "eval_macro_f1": 0.9796027083744441, |
| "eval_accuracy": 0.9796 |
| }, |
| { |
| "epoch": 6, |
| "train_loss": 0.20888356409232609, |
| "eval_macro_f1": 0.9825928670083165, |
| "eval_accuracy": 0.9826 |
| }, |
| { |
| "epoch": 7, |
| "train_loss": 0.15703109322336797, |
| "eval_macro_f1": 0.9839922007228425, |
| "eval_accuracy": 0.984 |
| }, |
| { |
| "epoch": 8, |
| "train_loss": 0.11633934278838558, |
| "eval_macro_f1": 0.9835931767915431, |
| "eval_accuracy": 0.9836 |
| } |
| ], |
| "training_summary": { |
| "actual_epochs": 8, |
| "best_epoch": 7, |
| "early_stopped": false, |
| "backbone_model_name": "microsoft/deberta-v3-base", |
| "tokenizer_name": "microsoft/deberta-v3-base", |
| "selection_metric": "macro_f1", |
| "selection_value": 0.9839922007228425 |
| }, |
| "calibration": { |
| "method": "temperature_grid_search", |
| "rows": 5000, |
| "temperature": 2.0, |
| "loss": 0.08134587520392533 |
| }, |
| "hf_model_dir": "/nvme/CognitiveMemoryLayer/packages/models/trained_models/forgetting_action_policy_hf" |
| } |