{ "history": [ { "epoch": 1, "train_sum_loss": 6.272962152862549, "train_class_loss": 1.0185239918708802, "train_class_acc": 0.4368, "val_sum_loss": 5.8008860549926755, "val_class_loss": 1.1023406219482421, "val_class_acc": 0.304, "val_rouge1": 0.17660690248954364, "val_rouge2": 0.018371370658335634, "val_rougeL": 0.15689190075772386 }, { "epoch": 2, "train_sum_loss": 5.219159950256348, "train_class_loss": 1.099994719696045, "train_class_acc": 0.3462, "val_sum_loss": 5.416218318939209, "val_class_loss": 1.0967657680511476, "val_class_acc": 0.386, "val_rouge1": 0.21779871449217764, "val_rouge2": 0.028536134623968267, "val_rougeL": 0.19329056631523484 }, { "epoch": 3, "train_sum_loss": 4.404316672515869, "train_class_loss": 1.0899620735168456, "train_class_acc": 0.361, "val_sum_loss": 5.30168932723999, "val_class_loss": 1.7727555074691772, "val_class_acc": 0.342, "val_rouge1": 0.22501668712961082, "val_rouge2": 0.03326989668183761, "val_rougeL": 0.20778061653444058 } ], "config": { "tokenizer": "t5-small", "max_input_len": 512, "max_target_len": 64, "hidden_dim": 512, "num_experts": 6, "top_k": 2, "batch_size": 8, "learning_rate": 0.0005, "num_epochs": 3, "seed": 42, "device": "cuda", "hf_repo": "Deepu1965/bonus2-multitask-moe" } }