debug_gpt2 / metrics.json
nbtpj's picture
Upload best model checkpoint
174b104 verified
{
"rl_info/A2G": -0.006648760288953781,
"rl_info/entropy": 3.1247427463531494,
"rl_info/total_token": 1710.0,
"rl_info/advantage_b4_norm": -524.6408081054688,
"rl_info/advantage_after_gnorm": 1.010803461074829,
"rl_info/kl_w_ref": 0.0,
"train/rl_loss": 0.6645635962486267,
"train/lm_loss": 6.4453349113464355,
"train/total_loss": 7.109898567199707,
"samsum/rouge1": 0.07018707411132723,
"samsum/rouge2": 0.015589278392518668,
"samsum/rougeL": 0.05694806401174433,
"samsum/rougeLsum": 0.05097452753746131,
"samsum/bertscore_precision": 0.6306706219911575,
"samsum/bertscore_recall": 0.7116748541593552,
"samsum/bertscore_f1": 0.6681777884562811,
"xsum/rouge1": 0.07577425197474222,
"xsum/rouge2": 0.015173697537833916,
"xsum/rougeL": 0.06791431460162027,
"xsum/rougeLsum": 0.06226845688932118,
"xsum/bertscore_precision": 0.685419961810112,
"xsum/bertscore_recall": 0.6998258779446284,
"xsum/bertscore_f1": 0.6894047458966573,
"gigaword/rouge1": 0.01673533809218624,
"gigaword/rouge2": 0.002688706117978111,
"gigaword/rougeL": 0.016448820149720444,
"gigaword/rougeLsum": 0.015425704010653109,
"gigaword/bertscore_precision": 0.5675247123837471,
"gigaword/bertscore_recall": 0.6473609921336174,
"gigaword/bertscore_f1": 0.6041367189586162,
"cnndm/rouge1": 0.12628644770575717,
"cnndm/rouge2": 0.04433825429137848,
"cnndm/rougeL": 0.09875398462560836,
"cnndm/rougeLsum": 0.10678645281701828,
"cnndm/bertscore_precision": 0.6603378802537918,
"cnndm/bertscore_recall": 0.7300801773866018,
"cnndm/bertscore_f1": 0.6927102555831274,
"eval_agg/avg_all_rougef": 0.052643335804179334,
"eval_agg/avg_all_bertf": 0.6636073772236705,
"eval_agg/avg_all": 0.3581253565139249,
"num_rl_rollout": 4,
"lm_epoch": 0,
"rl_epoch": 0,
"step": 400,
"total_data_token": 668982,
"total_rl_token": 849448,
"total_lm_token": 625452,
"total_token": 1474900,
"completed_steps": 400,
"tune_objective": 0.784820971275843
}