| { |
| "step": 450, |
| "metrics": { |
| "eval_rew_align/loss_libero_90": 0.13319981321692467, |
| "eval_rew_align/pearson_libero_90": 0.8769948951244139, |
| "eval_p_rank/kendall_last_libero_90": 0.7238356164383561, |
| "eval_p_rank/kendall_rewind_last_libero_90": 0.9726027397260274, |
| "eval_p_rank/avg_succ_fail_diff_last_libero_90": 0.19305384261661196, |
| "eval_p_rank/min_succ_fail_diff_last_libero_90": -0.07096144258975984, |
| "eval_p_rank/max_succ_fail_diff_last_libero_90": 0.5362282678484916, |
| "eval_p_rank/ranking_acc_last_libero_90": 0.8619178082191781, |
| "eval_p_rank/ranking_acc_all_pairs_last_libero_90": 0.8619178082191781, |
| "eval_p_rank/ranking_acc_failure_vs_successful_last_libero_90": 0.8619178082191781, |
| "eval_p_rank/kendall_avg_libero_90": 0.7238356164383561, |
| "eval_p_rank/kendall_rewind_avg_libero_90": 0.9726027397260274, |
| "eval_p_rank/avg_succ_fail_diff_avg_libero_90": 0.19305384261661196, |
| "eval_p_rank/min_succ_fail_diff_avg_libero_90": -0.07096144258975984, |
| "eval_p_rank/max_succ_fail_diff_avg_libero_90": 0.5362282678484916, |
| "eval_p_rank/ranking_acc_avg_libero_90": 0.8619178082191781, |
| "eval_p_rank/ranking_acc_all_pairs_avg_libero_90": 0.8619178082191781, |
| "eval_p_rank/ranking_acc_failure_vs_successful_avg_libero_90": 0.8619178082191781, |
| "eval_p_rank/kendall_sum_libero_90": 0.7238356164383561, |
| "eval_p_rank/kendall_rewind_sum_libero_90": 0.9726027397260274, |
| "eval_p_rank/avg_succ_fail_diff_sum_libero_90": 0.19305384261661196, |
| "eval_p_rank/min_succ_fail_diff_sum_libero_90": -0.07096144258975984, |
| "eval_p_rank/max_succ_fail_diff_sum_libero_90": 0.5362282678484916, |
| "eval_p_rank/ranking_acc_sum_libero_90": 0.8619178082191781, |
| "eval_p_rank/ranking_acc_all_pairs_sum_libero_90": 0.8619178082191781, |
| "eval_p_rank/ranking_acc_failure_vs_successful_sum_libero_90": 0.8619178082191781, |
| "eval_rew_align/loss_libero_10": 0.1326389029622078, |
| "eval_rew_align/pearson_libero_10": 0.9187725430307424, |
| "eval_p_rank/kendall_last_libero_10": 0.8960000000000001, |
| "eval_p_rank/kendall_rewind_last_libero_10": 1.0, |
| "eval_p_rank/avg_succ_fail_diff_last_libero_10": 0.20152622431516648, |
| "eval_p_rank/min_succ_fail_diff_last_libero_10": 0.014177948236465454, |
| "eval_p_rank/max_succ_fail_diff_last_libero_10": 0.29674754142761234, |
| "eval_p_rank/ranking_acc_last_libero_10": 0.948, |
| "eval_p_rank/ranking_acc_all_pairs_last_libero_10": 0.948, |
| "eval_p_rank/ranking_acc_failure_vs_successful_last_libero_10": 0.948, |
| "eval_p_rank/kendall_avg_libero_10": 0.8960000000000001, |
| "eval_p_rank/kendall_rewind_avg_libero_10": 1.0, |
| "eval_p_rank/avg_succ_fail_diff_avg_libero_10": 0.20152622431516648, |
| "eval_p_rank/min_succ_fail_diff_avg_libero_10": 0.014177948236465454, |
| "eval_p_rank/max_succ_fail_diff_avg_libero_10": 0.29674754142761234, |
| "eval_p_rank/ranking_acc_avg_libero_10": 0.948, |
| "eval_p_rank/ranking_acc_all_pairs_avg_libero_10": 0.948, |
| "eval_p_rank/ranking_acc_failure_vs_successful_avg_libero_10": 0.948, |
| "eval_p_rank/kendall_sum_libero_10": 0.8960000000000001, |
| "eval_p_rank/kendall_rewind_sum_libero_10": 1.0, |
| "eval_p_rank/avg_succ_fail_diff_sum_libero_10": 0.20152622431516648, |
| "eval_p_rank/min_succ_fail_diff_sum_libero_10": 0.014177948236465454, |
| "eval_p_rank/max_succ_fail_diff_sum_libero_10": 0.29674754142761234, |
| "eval_p_rank/ranking_acc_sum_libero_10": 0.948, |
| "eval_p_rank/ranking_acc_all_pairs_sum_libero_10": 0.948, |
| "eval_p_rank/ranking_acc_failure_vs_successful_sum_libero_10": 0.948, |
| "time/custom_evaluations": 51.121184929972515 |
| } |
| } |