File size: 5,600 Bytes
1cf6661
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
{
  "step": 1000,
  "metrics": {
    "eval_rew_align/success_auprc_amburger66_robotsmith_rbm_task08_robotsmith": 1.0,
    "eval_rew_align/positive_success_acc_amburger66_robotsmith_rbm_task08_robotsmith": 1.0,
    "eval_rew_align/negative_success_acc_amburger66_robotsmith_rbm_task08_robotsmith": 1.0,
    "eval_rew_align/loss_amburger66_robotsmith_rbm_task08_robotsmith": 3.805146312713623,
    "eval_rew_align/pearson_amburger66_robotsmith_rbm_task08_robotsmith": 0.9732821199050438,
    "eval_p_rank/kendall_last_amburger66_robotsmith_rbm_task08_robotsmith": 0.9733333333333333,
    "eval_p_rank/kendall_rewind_last_amburger66_robotsmith_rbm_task08_robotsmith": 1.0,
    "eval_p_rank/avg_succ_subopt_diff_last_amburger66_robotsmith_rbm_task08_robotsmith": 0.18584245443344116,
    "eval_p_rank/min_succ_subopt_diff_last_amburger66_robotsmith_rbm_task08_robotsmith": 0.18584245443344116,
    "eval_p_rank/max_succ_subopt_diff_last_amburger66_robotsmith_rbm_task08_robotsmith": 0.18584245443344116,
    "eval_p_rank/avg_subopt_fail_diff_last_amburger66_robotsmith_rbm_task08_robotsmith": 0.5381864190101623,
    "eval_p_rank/min_subopt_fail_diff_last_amburger66_robotsmith_rbm_task08_robotsmith": 0.5381864190101623,
    "eval_p_rank/max_subopt_fail_diff_last_amburger66_robotsmith_rbm_task08_robotsmith": 0.5381864190101623,
    "eval_p_rank/avg_succ_fail_diff_last_amburger66_robotsmith_rbm_task08_robotsmith": 0.7240288734436034,
    "eval_p_rank/min_succ_fail_diff_last_amburger66_robotsmith_rbm_task08_robotsmith": 0.7240288734436034,
    "eval_p_rank/max_succ_fail_diff_last_amburger66_robotsmith_rbm_task08_robotsmith": 0.7240288734436034,
    "eval_p_rank/ranking_acc_last_amburger66_robotsmith_rbm_task08_robotsmith": 0.9866666666666667,
    "eval_p_rank/ranking_acc_all_pairs_last_amburger66_robotsmith_rbm_task08_robotsmith": 0.9866666666666667,
    "eval_p_rank/ranking_acc_suboptimal_vs_successful_last_amburger66_robotsmith_rbm_task08_robotsmith": 0.96,
    "eval_p_rank/ranking_acc_failure_vs_successful_last_amburger66_robotsmith_rbm_task08_robotsmith": 1.0,
    "eval_p_rank/ranking_acc_failure_vs_suboptimal_last_amburger66_robotsmith_rbm_task08_robotsmith": 1.0,
    "eval_p_rank/kendall_avg_amburger66_robotsmith_rbm_task08_robotsmith": 0.9733333333333333,
    "eval_p_rank/kendall_rewind_avg_amburger66_robotsmith_rbm_task08_robotsmith": 1.0,
    "eval_p_rank/avg_succ_subopt_diff_avg_amburger66_robotsmith_rbm_task08_robotsmith": 0.18584245443344116,
    "eval_p_rank/min_succ_subopt_diff_avg_amburger66_robotsmith_rbm_task08_robotsmith": 0.18584245443344116,
    "eval_p_rank/max_succ_subopt_diff_avg_amburger66_robotsmith_rbm_task08_robotsmith": 0.18584245443344116,
    "eval_p_rank/avg_subopt_fail_diff_avg_amburger66_robotsmith_rbm_task08_robotsmith": 0.5381864190101623,
    "eval_p_rank/min_subopt_fail_diff_avg_amburger66_robotsmith_rbm_task08_robotsmith": 0.5381864190101623,
    "eval_p_rank/max_subopt_fail_diff_avg_amburger66_robotsmith_rbm_task08_robotsmith": 0.5381864190101623,
    "eval_p_rank/avg_succ_fail_diff_avg_amburger66_robotsmith_rbm_task08_robotsmith": 0.7240288734436034,
    "eval_p_rank/min_succ_fail_diff_avg_amburger66_robotsmith_rbm_task08_robotsmith": 0.7240288734436034,
    "eval_p_rank/max_succ_fail_diff_avg_amburger66_robotsmith_rbm_task08_robotsmith": 0.7240288734436034,
    "eval_p_rank/ranking_acc_avg_amburger66_robotsmith_rbm_task08_robotsmith": 0.9866666666666667,
    "eval_p_rank/ranking_acc_all_pairs_avg_amburger66_robotsmith_rbm_task08_robotsmith": 0.9866666666666667,
    "eval_p_rank/ranking_acc_suboptimal_vs_successful_avg_amburger66_robotsmith_rbm_task08_robotsmith": 0.96,
    "eval_p_rank/ranking_acc_failure_vs_successful_avg_amburger66_robotsmith_rbm_task08_robotsmith": 1.0,
    "eval_p_rank/ranking_acc_failure_vs_suboptimal_avg_amburger66_robotsmith_rbm_task08_robotsmith": 1.0,
    "eval_p_rank/kendall_sum_amburger66_robotsmith_rbm_task08_robotsmith": 0.9733333333333333,
    "eval_p_rank/kendall_rewind_sum_amburger66_robotsmith_rbm_task08_robotsmith": 1.0,
    "eval_p_rank/avg_succ_subopt_diff_sum_amburger66_robotsmith_rbm_task08_robotsmith": 0.18584245443344116,
    "eval_p_rank/min_succ_subopt_diff_sum_amburger66_robotsmith_rbm_task08_robotsmith": 0.18584245443344116,
    "eval_p_rank/max_succ_subopt_diff_sum_amburger66_robotsmith_rbm_task08_robotsmith": 0.18584245443344116,
    "eval_p_rank/avg_subopt_fail_diff_sum_amburger66_robotsmith_rbm_task08_robotsmith": 0.5381864190101623,
    "eval_p_rank/min_subopt_fail_diff_sum_amburger66_robotsmith_rbm_task08_robotsmith": 0.5381864190101623,
    "eval_p_rank/max_subopt_fail_diff_sum_amburger66_robotsmith_rbm_task08_robotsmith": 0.5381864190101623,
    "eval_p_rank/avg_succ_fail_diff_sum_amburger66_robotsmith_rbm_task08_robotsmith": 0.7240288734436034,
    "eval_p_rank/min_succ_fail_diff_sum_amburger66_robotsmith_rbm_task08_robotsmith": 0.7240288734436034,
    "eval_p_rank/max_succ_fail_diff_sum_amburger66_robotsmith_rbm_task08_robotsmith": 0.7240288734436034,
    "eval_p_rank/ranking_acc_sum_amburger66_robotsmith_rbm_task08_robotsmith": 0.9866666666666667,
    "eval_p_rank/ranking_acc_all_pairs_sum_amburger66_robotsmith_rbm_task08_robotsmith": 0.9866666666666667,
    "eval_p_rank/ranking_acc_suboptimal_vs_successful_sum_amburger66_robotsmith_rbm_task08_robotsmith": 0.96,
    "eval_p_rank/ranking_acc_failure_vs_successful_sum_amburger66_robotsmith_rbm_task08_robotsmith": 1.0,
    "eval_p_rank/ranking_acc_failure_vs_suboptimal_sum_amburger66_robotsmith_rbm_task08_robotsmith": 1.0,
    "time/custom_evaluations": 45.985100037418306
  }
}