lsnu commited on
Commit
9381b57
·
verified ·
1 Parent(s): f69c0bb

Add files using upload-large-folder tool

Browse files
Files changed (47) hide show
  1. artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode0/front_rgb/rgb_0000.png +0 -0
  2. artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode0/front_rgb/rgb_0001.png +0 -0
  3. artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode0/wrist_left_rgb/rgb_0000.png +0 -0
  4. artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode0/wrist_left_rgb/rgb_0001.png +0 -0
  5. artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode0/wrist_right_rgb/rgb_0000.png +0 -0
  6. artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode0/wrist_right_rgb/rgb_0001.png +0 -0
  7. artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode1/front_rgb/rgb_0000.png +0 -0
  8. artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode1/front_rgb/rgb_0001.png +0 -0
  9. artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode1/wrist_left_rgb/rgb_0000.png +0 -0
  10. artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode1/wrist_left_rgb/rgb_0001.png +0 -0
  11. artifacts/outputs/interaction/proxy_interaction_state/config_resolved.yaml +120 -0
  12. artifacts/outputs/interaction/proxy_interaction_state/diagnostics/proxy_diagnostics.json +7 -0
  13. artifacts/outputs/interaction/proxy_interaction_state/metrics.json +314 -0
  14. artifacts/outputs/interaction/proxy_interaction_state_smoke/config_resolved.yaml +120 -0
  15. artifacts/outputs/interaction/proxy_interaction_state_smoke/diagnostics/proxy_diagnostics.json +7 -0
  16. artifacts/outputs/interaction/proxy_interaction_state_smoke/metrics.json +88 -0
  17. artifacts/outputs/interaction/proxy_reveal_state_full_diagnostics/proxy_diagnostics.json +7 -0
  18. artifacts/outputs/interaction/proxy_reveal_state_smoke_diagnostics/proxy_diagnostics.json +7 -0
  19. artifacts/outputs/interaction/reveal_ablation_interaction_ep1/ablations.json +80 -0
  20. artifacts/outputs/interaction/reveal_ablation_interaction_ep1/ablations.md +49 -0
  21. artifacts/outputs/interaction/reveal_ablation_interaction_ep1/ablations.partial.json +135 -0
  22. artifacts/outputs/interaction/reveal_eval_interaction_ep2/reveal_benchmark.json +15 -0
  23. artifacts/outputs/interaction/reveal_eval_interaction_ep2/reveal_benchmark.md +13 -0
  24. artifacts/outputs/interaction/reveal_eval_interaction_full_ep2/reveal_benchmark.json +15 -0
  25. artifacts/outputs/interaction/reveal_eval_interaction_full_ep2/reveal_benchmark.md +13 -0
  26. artifacts/outputs/interaction/rlbench_env_smoke/import_and_train_command.txt +19 -0
  27. artifacts/outputs/interaction/rlbench_env_smoke/import_smoke.json +18 -0
  28. artifacts/outputs/interaction/rlbench_env_smoke/launch_reset_smoke.json +24 -0
  29. artifacts/outputs/interaction/rlbench_env_smoke/launch_smoke_cli.json +40 -0
  30. artifacts/outputs/interaction/rlbench_env_smoke/launch_step_smoke.json +10 -0
  31. artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/config_resolved.yaml +126 -0
  32. artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/metrics.json +27 -0
  33. artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/summary.json +50 -0
  34. artifacts/outputs/interaction/rlbench_open_drawer_rollout_eval/rollout_eval.json +23 -0
  35. artifacts/outputs/interaction/rlbench_open_drawer_rollout_eval/rollout_eval.md +11 -0
  36. artifacts/outputs/interaction/smoke_checks/smoke_checks.json +156 -0
  37. artifacts/outputs/interaction_rolefix/proxy_interaction_state_smoke/config_resolved.yaml +120 -0
  38. artifacts/outputs/interaction_rolefix/proxy_interaction_state_smoke/diagnostics/proxy_diagnostics.json +7 -0
  39. artifacts/outputs/interaction_rolefix/proxy_interaction_state_smoke/metrics.json +88 -0
  40. artifacts/outputs/interaction_rolefix/reveal_eval_interaction_smoke/reveal_benchmark.json +15 -0
  41. artifacts/outputs/interaction_rolefix/reveal_eval_interaction_smoke/reveal_benchmark.md +13 -0
  42. artifacts/outputs/interaction_rolefix/smoke_checks/smoke_checks.json +156 -0
  43. artifacts/outputs/interaction_rolefix_full/proxy_interaction_state/config_resolved.yaml +120 -0
  44. artifacts/outputs/interaction_rolefix_full/proxy_interaction_state/diagnostics/proxy_diagnostics.json +7 -0
  45. artifacts/outputs/interaction_rolefix_full/proxy_interaction_state/metrics.json +346 -0
  46. artifacts/outputs/interaction_rolefix_full/reveal_eval_interaction/reveal_benchmark.json +15 -0
  47. artifacts/outputs/interaction_rolefix_full/reveal_eval_interaction/reveal_benchmark.md +13 -0
artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode0/front_rgb/rgb_0000.png ADDED
artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode0/front_rgb/rgb_0001.png ADDED
artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode0/wrist_left_rgb/rgb_0000.png ADDED
artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode0/wrist_left_rgb/rgb_0001.png ADDED
artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode0/wrist_right_rgb/rgb_0000.png ADDED
artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode0/wrist_right_rgb/rgb_0001.png ADDED
artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode1/front_rgb/rgb_0000.png ADDED
artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode1/front_rgb/rgb_0001.png ADDED
artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode1/wrist_left_rgb/rgb_0000.png ADDED
artifacts/data/rlbench_smoke_open_drawer/open_drawer/all_variations/episodes/episode1/wrist_left_rgb/rgb_0001.png ADDED
artifacts/outputs/interaction/proxy_interaction_state/config_resolved.yaml ADDED
@@ -0,0 +1,120 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ experiment_name: proxy_interaction_state
2
+ output_dir: /workspace/VLAarchtests/artifacts/outputs/interaction
3
+ device: cuda
4
+ seed: 13
5
+ data:
6
+ proxies:
7
+ - foliage_proxy
8
+ - bag_proxy
9
+ - cloth_proxy
10
+ resolution: 96
11
+ train_episodes_per_proxy: 48
12
+ val_episodes_per_proxy: 16
13
+ train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_v4_noleak_counterfactual.pt
14
+ val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_v4_noleak_counterfactual.pt
15
+ rebuild_dataset: false
16
+ chunk_horizon: 8
17
+ rollout_horizon: 5
18
+ history_steps: 6
19
+ planner_candidates: 8
20
+ seed: 13
21
+ optim:
22
+ epochs: 8
23
+ batch_size: 16
24
+ num_workers: 0
25
+ lr: 0.001
26
+ weight_decay: 0.0001
27
+ trainer:
28
+ policy_type: interaction_state
29
+ use_bf16: true
30
+ grad_clip_norm: 1.0
31
+ freeze_backbone: true
32
+ gradient_checkpointing: false
33
+ plan_during_train: true
34
+ plan_during_eval: true
35
+ support_mode_conditioning: true
36
+ planner_mode: trainable
37
+ policy:
38
+ backbone:
39
+ model_name: openai/clip-vit-base-patch32
40
+ hidden_dim: 128
41
+ max_text_tokens: 32
42
+ freeze_backbone: true
43
+ gradient_checkpointing: false
44
+ use_dummy_backbone: true
45
+ fusion:
46
+ hidden_dim: 128
47
+ num_cameras: 3
48
+ num_layers: 2
49
+ num_heads: 4
50
+ ff_dim: 256
51
+ dropout: 0.1
52
+ proprio_dim: 32
53
+ proprio_tokens: 1
54
+ memory:
55
+ hidden_dim: 128
56
+ history_steps: 6
57
+ num_layers: 2
58
+ dropout: 0.1
59
+ memory_bank_size: 4
60
+ num_heads: 4
61
+ max_history_steps: 8
62
+ decoder:
63
+ hidden_dim: 128
64
+ num_heads: 4
65
+ num_layers: 2
66
+ ff_dim: 256
67
+ dropout: 0.1
68
+ chunk_size: 8
69
+ action_dim: 14
70
+ arm_action_dim: 7
71
+ num_candidates: 8
72
+ num_phases: 5
73
+ num_arm_roles: 4
74
+ reveal_head:
75
+ hidden_dim: 128
76
+ num_support_modes: 3
77
+ num_approach_templates: 32
78
+ rollout_horizon: 5
79
+ belief_map_size: 32
80
+ field_size: 16
81
+ num_heads: 4
82
+ predict_belief_map: true
83
+ num_phases: 5
84
+ num_arm_roles: 4
85
+ num_interaction_tokens: 8
86
+ world_model:
87
+ hidden_dim: 128
88
+ action_dim: 14
89
+ num_support_modes: 3
90
+ num_approach_templates: 32
91
+ rollout_horizon: 5
92
+ field_size: 16
93
+ num_heads: 4
94
+ num_phases: 5
95
+ num_arm_roles: 4
96
+ num_interaction_tokens: 8
97
+ planner:
98
+ hidden_dim: 128
99
+ num_candidates: 8
100
+ action_dim: 14
101
+ num_support_modes: 3
102
+ utility_margin: 0.1
103
+ num_heads: 4
104
+ num_layers: 2
105
+ num_phases: 5
106
+ num_arm_roles: 4
107
+ loss_weights:
108
+ action: 1.0
109
+ support_mode: 0.15
110
+ corridor: 0.2
111
+ persistence: 0.1
112
+ disturbance: 0.1
113
+ world_model: 0.25
114
+ belief: 0.05
115
+ planner_success: 0.2
116
+ planner_risk: 0.1
117
+ planner_ranking: 0.1
118
+ proposal_reconstruction: 0.2
119
+ proposal_success: 0.1
120
+ proposal_ranking: 0.1
artifacts/outputs/interaction/proxy_interaction_state/diagnostics/proxy_diagnostics.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "planner_top1_accuracy": 0.42857142857142855,
3
+ "planner_regret": 0.1302730292081833,
4
+ "risk_calibration_mse": 0.010318642482161522,
5
+ "role_collapse_rate": 1.0,
6
+ "num_samples": 126
7
+ }
artifacts/outputs/interaction/proxy_interaction_state/metrics.json ADDED
@@ -0,0 +1,314 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "epoch": 0,
4
+ "train": {
5
+ "action": 0.08913872321136296,
6
+ "belief": 0.2182194758206606,
7
+ "corridor": 0.3059119439373414,
8
+ "disturbance": 0.026565797566339217,
9
+ "persistence": 4.247902105251948,
10
+ "planner_ranking": 0.1385585286964973,
11
+ "planner_risk": 0.01735761243617162,
12
+ "planner_success": 0.6056295608480772,
13
+ "proposal_ranking": 0.17030407022684813,
14
+ "proposal_reconstruction": 0.1340707956502835,
15
+ "proposal_success": 0.6101961359381676,
16
+ "reocclusion": 0.6835535218318304,
17
+ "support_mode": 0.7136615564425787,
18
+ "total": 1.6980353395144145,
19
+ "uncertainty": 0.25639228243380785,
20
+ "world_model": 2.977962007125219
21
+ },
22
+ "val": {
23
+ "action": 0.026339974952861667,
24
+ "belief": 0.12528764735907316,
25
+ "corridor": 0.2495101224631071,
26
+ "disturbance": 0.0031769238121341914,
27
+ "persistence": 4.169311195611954,
28
+ "planner_ranking": 0.10334245767444372,
29
+ "planner_risk": 0.011477399850264192,
30
+ "planner_success": 0.5406695902347565,
31
+ "proposal_ranking": 0.12281709257513285,
32
+ "proposal_reconstruction": 0.05566257517784834,
33
+ "proposal_success": 0.6215158998966217,
34
+ "reocclusion": 0.66676115244627,
35
+ "support_mode": 0.6648052111268044,
36
+ "total": 1.4975968450307846,
37
+ "uncertainty": 0.11675945483148098,
38
+ "world_model": 2.713745206594467
39
+ }
40
+ },
41
+ {
42
+ "epoch": 1,
43
+ "train": {
44
+ "action": 0.026542372380693752,
45
+ "belief": 0.11461626676221688,
46
+ "corridor": 0.24775489792227745,
47
+ "disturbance": 0.0027499570617995537,
48
+ "persistence": 4.069600621859233,
49
+ "planner_ranking": 0.13798692263662815,
50
+ "planner_risk": 0.012379237974528223,
51
+ "planner_success": 0.5266842084626356,
52
+ "proposal_ranking": 0.10805700657268365,
53
+ "proposal_reconstruction": 0.05344949491942922,
54
+ "proposal_success": 0.6047845358649889,
55
+ "reocclusion": 0.6740957250197729,
56
+ "support_mode": 0.6921681016683578,
57
+ "total": 1.4517146944999695,
58
+ "uncertainty": 0.04957114780942599,
59
+ "world_model": 2.5700205266475677
60
+ },
61
+ "val": {
62
+ "action": 0.02145913220010698,
63
+ "belief": 0.10869172494858503,
64
+ "corridor": 0.23724456690251827,
65
+ "disturbance": 0.0021989822344039567,
66
+ "persistence": 3.844908654689789,
67
+ "planner_ranking": 0.12535850331187248,
68
+ "planner_risk": 0.01136385987047106,
69
+ "planner_success": 0.5217581205070019,
70
+ "proposal_ranking": 0.10524471942335367,
71
+ "proposal_reconstruction": 0.04592850711196661,
72
+ "proposal_success": 0.6284073293209076,
73
+ "reocclusion": 0.6619901061058044,
74
+ "support_mode": 0.7111924216151237,
75
+ "total": 1.4133924543857574,
76
+ "uncertainty": 0.025329279713332653,
77
+ "world_model": 2.534369081258774
78
+ }
79
+ },
80
+ {
81
+ "epoch": 2,
82
+ "train": {
83
+ "action": 0.024407408433035016,
84
+ "belief": 0.1138611612841487,
85
+ "corridor": 0.2458544857800007,
86
+ "disturbance": 0.004206997211440466,
87
+ "persistence": 3.9157366255919137,
88
+ "planner_ranking": 0.11510052252560854,
89
+ "planner_risk": 0.011586199165321887,
90
+ "planner_success": 0.5286323353648186,
91
+ "proposal_ranking": 0.10212837501118581,
92
+ "proposal_reconstruction": 0.04920657336091002,
93
+ "proposal_success": 0.6089240709940592,
94
+ "reocclusion": 0.6643339196840922,
95
+ "support_mode": 0.6847635904947916,
96
+ "total": 1.3605846464633942,
97
+ "uncertainty": 0.02807092812145129,
98
+ "world_model": 2.2947811782360077
99
+ },
100
+ "val": {
101
+ "action": 0.02334526553750038,
102
+ "belief": 0.15983260795474052,
103
+ "corridor": 0.28226315788924694,
104
+ "disturbance": 0.017097398158512078,
105
+ "persistence": 3.902952551841736,
106
+ "planner_ranking": 0.10127842240035534,
107
+ "planner_risk": 0.012675322766881436,
108
+ "planner_success": 0.5396927110850811,
109
+ "proposal_ranking": 0.10627106577157974,
110
+ "proposal_reconstruction": 0.04857080662623048,
111
+ "proposal_success": 0.6166459769010544,
112
+ "reocclusion": 0.6506054624915123,
113
+ "support_mode": 0.665102630853653,
114
+ "total": 1.2038391679525375,
115
+ "uncertainty": 0.08320197206921875,
116
+ "world_model": 1.6363814026117325
117
+ }
118
+ },
119
+ {
120
+ "epoch": 3,
121
+ "train": {
122
+ "action": 0.02514208061620593,
123
+ "belief": 0.11728278330216806,
124
+ "corridor": 0.24663691284755865,
125
+ "disturbance": 0.006238660357970123,
126
+ "persistence": 3.951133112112681,
127
+ "planner_ranking": 0.1094918263455232,
128
+ "planner_risk": 0.010860085254535079,
129
+ "planner_success": 0.4831004776060581,
130
+ "proposal_ranking": 0.09784856469680865,
131
+ "proposal_reconstruction": 0.04991315118968487,
132
+ "proposal_success": 0.6049580449859301,
133
+ "reocclusion": 0.6561904201904932,
134
+ "support_mode": 0.6671389614542326,
135
+ "total": 1.2903279686967533,
136
+ "uncertainty": 0.028790034314927954,
137
+ "world_model": 2.047424097855886
138
+ },
139
+ "val": {
140
+ "action": 0.026369616854935884,
141
+ "belief": 0.10613519884645939,
142
+ "corridor": 0.22941571101546288,
143
+ "disturbance": 0.003113830098300241,
144
+ "persistence": 3.742612451314926,
145
+ "planner_ranking": 0.09627582784742117,
146
+ "planner_risk": 0.01076946739340201,
147
+ "planner_success": 0.47833504155278206,
148
+ "proposal_ranking": 0.09593241196125746,
149
+ "proposal_reconstruction": 0.0534784197807312,
150
+ "proposal_success": 0.6306303292512894,
151
+ "reocclusion": 0.6404713988304138,
152
+ "support_mode": 0.6704101711511612,
153
+ "total": 1.1889225989580154,
154
+ "uncertainty": 0.02097803057404235,
155
+ "world_model": 1.7339447140693665
156
+ }
157
+ },
158
+ {
159
+ "epoch": 4,
160
+ "train": {
161
+ "action": 0.02463891791800658,
162
+ "belief": 0.10698648542165756,
163
+ "corridor": 0.23474377828339735,
164
+ "disturbance": 0.0030594476411351934,
165
+ "persistence": 3.8452726304531097,
166
+ "planner_ranking": 0.10481727588921785,
167
+ "planner_risk": 0.011097095673903823,
168
+ "planner_success": 0.44664503013094264,
169
+ "proposal_ranking": 0.09467410761862993,
170
+ "proposal_reconstruction": 0.04960497561842203,
171
+ "proposal_success": 0.6051262418429056,
172
+ "reocclusion": 0.6540075515707334,
173
+ "support_mode": 0.6753946940104166,
174
+ "total": 1.2287767976522446,
175
+ "uncertainty": 0.02127678649655233,
176
+ "world_model": 1.8863319009542465
177
+ },
178
+ "val": {
179
+ "action": 0.019384633051231503,
180
+ "belief": 0.10288739763200283,
181
+ "corridor": 0.22519288212060928,
182
+ "disturbance": 0.0021419554541353136,
183
+ "persistence": 3.7146196961402893,
184
+ "planner_ranking": 0.10946678463369608,
185
+ "planner_risk": 0.011642372934147716,
186
+ "planner_success": 0.47963740676641464,
187
+ "proposal_ranking": 0.08971122652292252,
188
+ "proposal_reconstruction": 0.04226163262501359,
189
+ "proposal_success": 0.6239738017320633,
190
+ "reocclusion": 0.6498126462101936,
191
+ "support_mode": 0.6662197485566139,
192
+ "total": 1.228643923997879,
193
+ "uncertainty": 0.010205027123447508,
194
+ "world_model": 1.946038767695427
195
+ }
196
+ },
197
+ {
198
+ "epoch": 5,
199
+ "train": {
200
+ "action": 0.023295348898197215,
201
+ "belief": 0.10408696439117193,
202
+ "corridor": 0.23216054091850916,
203
+ "disturbance": 0.002513651920404906,
204
+ "persistence": 3.805388251940409,
205
+ "planner_ranking": 0.09554585038373868,
206
+ "planner_risk": 0.010421493653363237,
207
+ "planner_success": 0.438693817704916,
208
+ "proposal_ranking": 0.09420504545172055,
209
+ "proposal_reconstruction": 0.04733991126219431,
210
+ "proposal_success": 0.6043872957428297,
211
+ "reocclusion": 0.6555871988336245,
212
+ "support_mode": 0.6715305869777998,
213
+ "total": 1.1565892845392227,
214
+ "uncertainty": 0.0161813710971425,
215
+ "world_model": 1.636805718143781
216
+ },
217
+ "val": {
218
+ "action": 0.020826205611228943,
219
+ "belief": 0.10143636167049408,
220
+ "corridor": 0.2232594806700945,
221
+ "disturbance": 0.001781191662303172,
222
+ "persistence": 3.6273659467697144,
223
+ "planner_ranking": 0.16842342726886272,
224
+ "planner_risk": 0.01012508076382801,
225
+ "planner_success": 0.5004390366375446,
226
+ "proposal_ranking": 0.08787750266492367,
227
+ "proposal_reconstruction": 0.04392921878024936,
228
+ "proposal_success": 0.624223992228508,
229
+ "reocclusion": 0.6372809633612633,
230
+ "support_mode": 0.664175495505333,
231
+ "total": 1.1100417152047157,
232
+ "uncertainty": 0.01541757385712117,
233
+ "world_model": 1.4644491225481033
234
+ }
235
+ },
236
+ {
237
+ "epoch": 6,
238
+ "train": {
239
+ "action": 0.02248762206484874,
240
+ "belief": 0.10121824126690626,
241
+ "corridor": 0.2321634783099095,
242
+ "disturbance": 0.0020452279277378693,
243
+ "persistence": 3.836012969414393,
244
+ "planner_ranking": 0.11302779614925385,
245
+ "planner_risk": 0.01022351956150184,
246
+ "planner_success": 0.4348009414970875,
247
+ "proposal_ranking": 0.09360451406488816,
248
+ "proposal_reconstruction": 0.0462404570231835,
249
+ "proposal_success": 0.6066909035046896,
250
+ "reocclusion": 0.6465126698215803,
251
+ "support_mode": 0.6658426920572916,
252
+ "total": 1.1116433491309483,
253
+ "uncertainty": 0.013347609317861497,
254
+ "world_model": 1.4494130065043767
255
+ },
256
+ "val": {
257
+ "action": 0.01996314455755055,
258
+ "belief": 0.10138983093202114,
259
+ "corridor": 0.22823662497103214,
260
+ "disturbance": 0.002091344154905528,
261
+ "persistence": 3.6982297003269196,
262
+ "planner_ranking": 0.09198376163840294,
263
+ "planner_risk": 0.010279824957251549,
264
+ "planner_success": 0.47799063101410866,
265
+ "proposal_ranking": 0.09706298727542162,
266
+ "proposal_reconstruction": 0.04272295255213976,
267
+ "proposal_success": 0.6218197643756866,
268
+ "reocclusion": 0.6380461752414703,
269
+ "support_mode": 0.6696624308824539,
270
+ "total": 1.0816360414028168,
271
+ "uncertainty": 0.007035618589725345,
272
+ "world_model": 1.3655437678098679
273
+ }
274
+ },
275
+ {
276
+ "epoch": 7,
277
+ "train": {
278
+ "action": 0.021682963396112125,
279
+ "belief": 0.10601237788796425,
280
+ "corridor": 0.23365325729052225,
281
+ "disturbance": 0.002228843019111082,
282
+ "persistence": 3.7541938523451486,
283
+ "planner_ranking": 0.0957260721673568,
284
+ "planner_risk": 0.01018386852229014,
285
+ "planner_success": 0.4461444852252801,
286
+ "proposal_ranking": 0.09633061879624923,
287
+ "proposal_reconstruction": 0.044885387644171715,
288
+ "proposal_success": 0.6029221788048744,
289
+ "reocclusion": 0.6449378555019697,
290
+ "support_mode": 0.6726728156208992,
291
+ "total": 1.0910143380363782,
292
+ "uncertainty": 0.01619089951661105,
293
+ "world_model": 1.3958957940340042
294
+ },
295
+ "val": {
296
+ "action": 0.01988930464722216,
297
+ "belief": 0.10534531436860561,
298
+ "corridor": 0.22113148868083954,
299
+ "disturbance": 0.001838716707425192,
300
+ "persistence": 3.629800319671631,
301
+ "planner_ranking": 0.12714975513517857,
302
+ "planner_risk": 0.008069174771662802,
303
+ "planner_success": 0.6245891973376274,
304
+ "proposal_ranking": 0.10471091698855162,
305
+ "proposal_reconstruction": 0.043083535972982645,
306
+ "proposal_success": 0.6201159805059433,
307
+ "reocclusion": 0.6348166316747665,
308
+ "support_mode": 0.6840479746460915,
309
+ "total": 1.1184726804494858,
310
+ "uncertainty": 0.022346424055285752,
311
+ "world_model": 1.4034390151500702
312
+ }
313
+ }
314
+ ]
artifacts/outputs/interaction/proxy_interaction_state_smoke/config_resolved.yaml ADDED
@@ -0,0 +1,120 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ experiment_name: proxy_interaction_state_smoke
2
+ output_dir: /workspace/VLAarchtests/artifacts/outputs/interaction
3
+ device: cuda
4
+ seed: 13
5
+ data:
6
+ proxies:
7
+ - foliage_proxy
8
+ - bag_proxy
9
+ - cloth_proxy
10
+ resolution: 64
11
+ train_episodes_per_proxy: 6
12
+ val_episodes_per_proxy: 2
13
+ train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_smoke_v4.pt
14
+ val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_smoke_v4.pt
15
+ rebuild_dataset: false
16
+ chunk_horizon: 4
17
+ rollout_horizon: 3
18
+ history_steps: 6
19
+ planner_candidates: 4
20
+ seed: 13
21
+ optim:
22
+ epochs: 2
23
+ batch_size: 8
24
+ num_workers: 0
25
+ lr: 0.001
26
+ weight_decay: 0.0001
27
+ trainer:
28
+ policy_type: interaction_state
29
+ use_bf16: true
30
+ grad_clip_norm: 1.0
31
+ freeze_backbone: true
32
+ gradient_checkpointing: false
33
+ plan_during_train: true
34
+ plan_during_eval: true
35
+ support_mode_conditioning: true
36
+ planner_mode: trainable
37
+ policy:
38
+ backbone:
39
+ model_name: openai/clip-vit-base-patch32
40
+ hidden_dim: 64
41
+ max_text_tokens: 32
42
+ freeze_backbone: true
43
+ gradient_checkpointing: false
44
+ use_dummy_backbone: true
45
+ fusion:
46
+ hidden_dim: 64
47
+ num_cameras: 3
48
+ num_layers: 2
49
+ num_heads: 4
50
+ ff_dim: 128
51
+ dropout: 0.1
52
+ proprio_dim: 32
53
+ proprio_tokens: 1
54
+ memory:
55
+ hidden_dim: 64
56
+ history_steps: 6
57
+ num_layers: 2
58
+ dropout: 0.1
59
+ memory_bank_size: 4
60
+ num_heads: 4
61
+ max_history_steps: 8
62
+ decoder:
63
+ hidden_dim: 64
64
+ num_heads: 4
65
+ num_layers: 2
66
+ ff_dim: 128
67
+ dropout: 0.1
68
+ chunk_size: 4
69
+ action_dim: 14
70
+ arm_action_dim: 7
71
+ num_candidates: 4
72
+ num_phases: 5
73
+ num_arm_roles: 4
74
+ reveal_head:
75
+ hidden_dim: 64
76
+ num_support_modes: 3
77
+ num_approach_templates: 32
78
+ rollout_horizon: 3
79
+ belief_map_size: 32
80
+ field_size: 16
81
+ num_heads: 4
82
+ predict_belief_map: true
83
+ num_phases: 5
84
+ num_arm_roles: 4
85
+ num_interaction_tokens: 8
86
+ world_model:
87
+ hidden_dim: 64
88
+ action_dim: 14
89
+ num_support_modes: 3
90
+ num_approach_templates: 32
91
+ rollout_horizon: 3
92
+ field_size: 16
93
+ num_heads: 4
94
+ num_phases: 5
95
+ num_arm_roles: 4
96
+ num_interaction_tokens: 8
97
+ planner:
98
+ hidden_dim: 64
99
+ num_candidates: 4
100
+ action_dim: 14
101
+ num_support_modes: 3
102
+ utility_margin: 0.1
103
+ num_heads: 4
104
+ num_layers: 2
105
+ num_phases: 5
106
+ num_arm_roles: 4
107
+ loss_weights:
108
+ action: 1.0
109
+ support_mode: 0.15
110
+ corridor: 0.2
111
+ persistence: 0.1
112
+ disturbance: 0.1
113
+ world_model: 0.25
114
+ belief: 0.05
115
+ planner_success: 0.2
116
+ planner_risk: 0.1
117
+ planner_ranking: 0.1
118
+ proposal_reconstruction: 0.2
119
+ proposal_success: 0.1
120
+ proposal_ranking: 0.1
artifacts/outputs/interaction/proxy_interaction_state_smoke/diagnostics/proxy_diagnostics.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "planner_top1_accuracy": 0.375,
3
+ "planner_regret": 0.4054882526397705,
4
+ "risk_calibration_mse": 0.01106204278767109,
5
+ "role_collapse_rate": 1.0,
6
+ "num_samples": 16
7
+ }
artifacts/outputs/interaction/proxy_interaction_state_smoke/metrics.json ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "epoch": 0,
4
+ "train": {
5
+ "action": 0.15396334496991976,
6
+ "arm_role": 1.0464913504464286,
7
+ "belief": 0.5699181130954197,
8
+ "corridor": 0.5832605191639492,
9
+ "disturbance": 0.10345468350819179,
10
+ "persistence": 1.7334490844181605,
11
+ "phase": 1.1630859375,
12
+ "planner_ranking": 0.1581665085894721,
13
+ "planner_risk": 0.02096142333799175,
14
+ "planner_success": 0.6495738455227443,
15
+ "proposal_ranking": 0.19803496769496373,
16
+ "proposal_reconstruction": 0.20699733815022878,
17
+ "proposal_success": 0.6321364641189575,
18
+ "reocclusion": 0.6904009750911168,
19
+ "support_mode": 0.8394252232142857,
20
+ "total": 1.6638009548187256,
21
+ "uncertainty": 0.6862367732184274,
22
+ "world_model": 2.6067678928375244
23
+ },
24
+ "val": {
25
+ "action": 0.06714679300785065,
26
+ "arm_role": 0.8156493306159973,
27
+ "belief": 0.4122387021780014,
28
+ "corridor": 0.43514861166477203,
29
+ "disturbance": 0.04421420395374298,
30
+ "persistence": 1.679144263267517,
31
+ "phase": 0.795434981584549,
32
+ "planner_ranking": 0.10125493630766869,
33
+ "planner_risk": 0.014165664557367563,
34
+ "planner_success": 0.7003250122070312,
35
+ "proposal_ranking": 0.19173914939165115,
36
+ "proposal_reconstruction": 0.10236449539661407,
37
+ "proposal_success": 0.6280835568904877,
38
+ "reocclusion": 0.6901499629020691,
39
+ "support_mode": 0.7109985053539276,
40
+ "total": 1.3141186237335205,
41
+ "uncertainty": 0.560584306716919,
42
+ "world_model": 2.025277078151703
43
+ }
44
+ },
45
+ {
46
+ "epoch": 1,
47
+ "train": {
48
+ "action": 0.06967730287994657,
49
+ "arm_role": 0.7705426897321429,
50
+ "belief": 0.3012138817991529,
51
+ "corridor": 0.35292174773556845,
52
+ "disturbance": 0.01887136205498661,
53
+ "persistence": 1.7558837277548653,
54
+ "phase": 0.8579799107142857,
55
+ "planner_ranking": 0.13363037151949747,
56
+ "planner_risk": 0.010756842027019178,
57
+ "planner_success": 0.6408852168491909,
58
+ "proposal_ranking": 0.12252488732337952,
59
+ "proposal_reconstruction": 0.10212650469371251,
60
+ "proposal_success": 0.619073646409171,
61
+ "reocclusion": 0.7055942841938564,
62
+ "support_mode": 0.7973284040178571,
63
+ "total": 1.2046506234577723,
64
+ "uncertainty": 0.47724126066480366,
65
+ "world_model": 1.6589686359677995
66
+ },
67
+ "val": {
68
+ "action": 0.05438657104969025,
69
+ "arm_role": 0.727223664522171,
70
+ "belief": 0.16894277185201645,
71
+ "corridor": 0.2628409117460251,
72
+ "disturbance": 0.0024247884866781533,
73
+ "persistence": 1.7001646757125854,
74
+ "phase": 0.7108556628227234,
75
+ "planner_ranking": 0.10945596918463707,
76
+ "planner_risk": 0.010194436646997929,
77
+ "planner_success": 0.6684828102588654,
78
+ "proposal_ranking": 0.09799150377511978,
79
+ "proposal_reconstruction": 0.09263791516423225,
80
+ "proposal_success": 0.6696180105209351,
81
+ "reocclusion": 0.7087761461734772,
82
+ "support_mode": 0.6864266693592072,
83
+ "total": 1.1171032786369324,
84
+ "uncertainty": 0.3682785928249359,
85
+ "world_model": 1.591063678264618
86
+ }
87
+ }
88
+ ]
artifacts/outputs/interaction/proxy_reveal_state_full_diagnostics/proxy_diagnostics.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "planner_top1_accuracy": 0.2698412698412698,
3
+ "planner_regret": 0.3642531931400299,
4
+ "risk_calibration_mse": 0.011263838969171047,
5
+ "role_collapse_rate": 0.0,
6
+ "num_samples": 126
7
+ }
artifacts/outputs/interaction/proxy_reveal_state_smoke_diagnostics/proxy_diagnostics.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "planner_top1_accuracy": 0.25,
3
+ "planner_regret": 0.2715669870376587,
4
+ "risk_calibration_mse": 0.0521860271692276,
5
+ "role_collapse_rate": 0.0,
6
+ "num_samples": 16
7
+ }
artifacts/outputs/interaction/reveal_ablation_interaction_ep1/ablations.json ADDED
@@ -0,0 +1,80 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "full_model": {
3
+ "per_task_success": {
4
+ "foliage_proxy": 0.0,
5
+ "bag_proxy": 0.0,
6
+ "cloth_proxy": 0.0
7
+ },
8
+ "mean_success": 0.0,
9
+ "visibility_integral": 67.46570078531902,
10
+ "corridor_availability": 0.9835391044616699,
11
+ "reocclusion_rate": 0.0,
12
+ "persistence_horizon_mae": 2.9001280729969343,
13
+ "disturbance_cost": 0.7520796457926432
14
+ },
15
+ "no_interaction_head": {
16
+ "per_task_success": {
17
+ "foliage_proxy": 0.0,
18
+ "bag_proxy": 0.0,
19
+ "cloth_proxy": 0.0
20
+ },
21
+ "mean_success": 0.0,
22
+ "visibility_integral": 63.56013615926107,
23
+ "corridor_availability": 0.9876543283462524,
24
+ "reocclusion_rate": 0.0,
25
+ "persistence_horizon_mae": null,
26
+ "disturbance_cost": 0.8973869283994039
27
+ },
28
+ "no_world_model": {
29
+ "per_task_success": {
30
+ "foliage_proxy": 0.0,
31
+ "bag_proxy": 0.0,
32
+ "cloth_proxy": 0.0
33
+ },
34
+ "mean_success": 0.0,
35
+ "visibility_integral": 63.46492385864258,
36
+ "corridor_availability": 0.9876543283462524,
37
+ "reocclusion_rate": 0.0,
38
+ "persistence_horizon_mae": 2.8303335145115853,
39
+ "disturbance_cost": 0.900044322013855
40
+ },
41
+ "no_planner": {
42
+ "per_task_success": {
43
+ "foliage_proxy": 0.0,
44
+ "bag_proxy": 0.0,
45
+ "cloth_proxy": 0.0
46
+ },
47
+ "mean_success": 0.0,
48
+ "visibility_integral": 63.54209772745768,
49
+ "corridor_availability": 0.9876543283462524,
50
+ "reocclusion_rate": 0.0,
51
+ "persistence_horizon_mae": 2.8313964143395425,
52
+ "disturbance_cost": 0.8962932030359904
53
+ },
54
+ "no_role_tokens": {
55
+ "per_task_success": {
56
+ "foliage_proxy": 0.0,
57
+ "bag_proxy": 0.0,
58
+ "cloth_proxy": 0.0
59
+ },
60
+ "mean_success": 0.0,
61
+ "visibility_integral": 67.39010111490886,
62
+ "corridor_availability": 0.9835391044616699,
63
+ "reocclusion_rate": 0.0,
64
+ "persistence_horizon_mae": 2.8990648205081624,
65
+ "disturbance_cost": 0.7544853488604227
66
+ },
67
+ "short_history": {
68
+ "per_task_success": {
69
+ "foliage_proxy": 0.0,
70
+ "bag_proxy": 0.0,
71
+ "cloth_proxy": 0.0
72
+ },
73
+ "mean_success": 0.0,
74
+ "visibility_integral": 67.46627298990886,
75
+ "corridor_availability": 0.9835391044616699,
76
+ "reocclusion_rate": 0.0,
77
+ "persistence_horizon_mae": 2.900133213897546,
78
+ "disturbance_cost": 0.7520630160967509
79
+ }
80
+ }
artifacts/outputs/interaction/reveal_ablation_interaction_ep1/ablations.md ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Reveal Ablations
2
+
3
+ ## full_model
4
+ - mean_success: 0.000
5
+ - visibility_integral: 67.466
6
+ - corridor_availability: 0.984
7
+ - reocclusion_rate: 0.000
8
+ - persistence_horizon_mae: 2.900
9
+ - disturbance_cost: 0.752
10
+
11
+ ## no_interaction_head
12
+ - mean_success: 0.000
13
+ - visibility_integral: 63.560
14
+ - corridor_availability: 0.988
15
+ - reocclusion_rate: 0.000
16
+ - persistence_horizon_mae: 0.000
17
+ - disturbance_cost: 0.897
18
+
19
+ ## no_world_model
20
+ - mean_success: 0.000
21
+ - visibility_integral: 63.465
22
+ - corridor_availability: 0.988
23
+ - reocclusion_rate: 0.000
24
+ - persistence_horizon_mae: 2.830
25
+ - disturbance_cost: 0.900
26
+
27
+ ## no_planner
28
+ - mean_success: 0.000
29
+ - visibility_integral: 63.542
30
+ - corridor_availability: 0.988
31
+ - reocclusion_rate: 0.000
32
+ - persistence_horizon_mae: 2.831
33
+ - disturbance_cost: 0.896
34
+
35
+ ## no_role_tokens
36
+ - mean_success: 0.000
37
+ - visibility_integral: 67.390
38
+ - corridor_availability: 0.984
39
+ - reocclusion_rate: 0.000
40
+ - persistence_horizon_mae: 2.899
41
+ - disturbance_cost: 0.754
42
+
43
+ ## short_history
44
+ - mean_success: 0.000
45
+ - visibility_integral: 67.466
46
+ - corridor_availability: 0.984
47
+ - reocclusion_rate: 0.000
48
+ - persistence_horizon_mae: 2.900
49
+ - disturbance_cost: 0.752
artifacts/outputs/interaction/reveal_ablation_interaction_ep1/ablations.partial.json ADDED
@@ -0,0 +1,135 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "checkpoint": "/workspace/VLAarchtests/artifacts/outputs/interaction/proxy_interaction_state_smoke/checkpoint_best.pt",
3
+ "episodes": 1,
4
+ "sections": {
5
+ "full_model": {
6
+ "mean_success": 0.0,
7
+ "visibility_integral": 67.46570078531902,
8
+ "corridor_availability": 0.9835391044616699,
9
+ "reocclusion_rate": 0.0,
10
+ "persistence_horizon_mae": 2.9001280729969343,
11
+ "disturbance_cost": 0.7520796457926432
12
+ },
13
+ "no_interaction_head": {
14
+ "mean_success": 0.0,
15
+ "visibility_integral": 63.56013615926107,
16
+ "corridor_availability": 0.9876543283462524,
17
+ "reocclusion_rate": 0.0,
18
+ "persistence_horizon_mae": 0.0,
19
+ "disturbance_cost": 0.8973869283994039
20
+ },
21
+ "no_world_model": {
22
+ "mean_success": 0.0,
23
+ "visibility_integral": 63.46492385864258,
24
+ "corridor_availability": 0.9876543283462524,
25
+ "reocclusion_rate": 0.0,
26
+ "persistence_horizon_mae": 2.8303335145115853,
27
+ "disturbance_cost": 0.900044322013855
28
+ },
29
+ "no_planner": {
30
+ "mean_success": 0.0,
31
+ "visibility_integral": 63.54209772745768,
32
+ "corridor_availability": 0.9876543283462524,
33
+ "reocclusion_rate": 0.0,
34
+ "persistence_horizon_mae": 2.8313964143395425,
35
+ "disturbance_cost": 0.8962932030359904
36
+ },
37
+ "no_role_tokens": {
38
+ "mean_success": 0.0,
39
+ "visibility_integral": 67.39010111490886,
40
+ "corridor_availability": 0.9835391044616699,
41
+ "reocclusion_rate": 0.0,
42
+ "persistence_horizon_mae": 2.8990648205081624,
43
+ "disturbance_cost": 0.7544853488604227
44
+ },
45
+ "short_history": {
46
+ "mean_success": 0.0,
47
+ "visibility_integral": 67.46627298990886,
48
+ "corridor_availability": 0.9835391044616699,
49
+ "reocclusion_rate": 0.0,
50
+ "persistence_horizon_mae": 2.900133213897546,
51
+ "disturbance_cost": 0.7520630160967509
52
+ }
53
+ },
54
+ "raw": {
55
+ "full_model": {
56
+ "per_task_success": {
57
+ "foliage_proxy": 0.0,
58
+ "bag_proxy": 0.0,
59
+ "cloth_proxy": 0.0
60
+ },
61
+ "mean_success": 0.0,
62
+ "visibility_integral": 67.46570078531902,
63
+ "corridor_availability": 0.9835391044616699,
64
+ "reocclusion_rate": 0.0,
65
+ "persistence_horizon_mae": 2.9001280729969343,
66
+ "disturbance_cost": 0.7520796457926432
67
+ },
68
+ "no_interaction_head": {
69
+ "per_task_success": {
70
+ "foliage_proxy": 0.0,
71
+ "bag_proxy": 0.0,
72
+ "cloth_proxy": 0.0
73
+ },
74
+ "mean_success": 0.0,
75
+ "visibility_integral": 63.56013615926107,
76
+ "corridor_availability": 0.9876543283462524,
77
+ "reocclusion_rate": 0.0,
78
+ "persistence_horizon_mae": null,
79
+ "disturbance_cost": 0.8973869283994039
80
+ },
81
+ "no_world_model": {
82
+ "per_task_success": {
83
+ "foliage_proxy": 0.0,
84
+ "bag_proxy": 0.0,
85
+ "cloth_proxy": 0.0
86
+ },
87
+ "mean_success": 0.0,
88
+ "visibility_integral": 63.46492385864258,
89
+ "corridor_availability": 0.9876543283462524,
90
+ "reocclusion_rate": 0.0,
91
+ "persistence_horizon_mae": 2.8303335145115853,
92
+ "disturbance_cost": 0.900044322013855
93
+ },
94
+ "no_planner": {
95
+ "per_task_success": {
96
+ "foliage_proxy": 0.0,
97
+ "bag_proxy": 0.0,
98
+ "cloth_proxy": 0.0
99
+ },
100
+ "mean_success": 0.0,
101
+ "visibility_integral": 63.54209772745768,
102
+ "corridor_availability": 0.9876543283462524,
103
+ "reocclusion_rate": 0.0,
104
+ "persistence_horizon_mae": 2.8313964143395425,
105
+ "disturbance_cost": 0.8962932030359904
106
+ },
107
+ "no_role_tokens": {
108
+ "per_task_success": {
109
+ "foliage_proxy": 0.0,
110
+ "bag_proxy": 0.0,
111
+ "cloth_proxy": 0.0
112
+ },
113
+ "mean_success": 0.0,
114
+ "visibility_integral": 67.39010111490886,
115
+ "corridor_availability": 0.9835391044616699,
116
+ "reocclusion_rate": 0.0,
117
+ "persistence_horizon_mae": 2.8990648205081624,
118
+ "disturbance_cost": 0.7544853488604227
119
+ },
120
+ "short_history": {
121
+ "per_task_success": {
122
+ "foliage_proxy": 0.0,
123
+ "bag_proxy": 0.0,
124
+ "cloth_proxy": 0.0
125
+ },
126
+ "mean_success": 0.0,
127
+ "visibility_integral": 67.46627298990886,
128
+ "corridor_availability": 0.9835391044616699,
129
+ "reocclusion_rate": 0.0,
130
+ "persistence_horizon_mae": 2.900133213897546,
131
+ "disturbance_cost": 0.7520630160967509
132
+ }
133
+ },
134
+ "elapsed_seconds": 56.18267846107483
135
+ }
artifacts/outputs/interaction/reveal_eval_interaction_ep2/reveal_benchmark.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "interaction": {
3
+ "per_task_success": {
4
+ "foliage_proxy": 0.0,
5
+ "bag_proxy": 0.0,
6
+ "cloth_proxy": 0.0
7
+ },
8
+ "mean_success": 0.0,
9
+ "visibility_integral": 62.47385279337565,
10
+ "corridor_availability": 0.9876543283462524,
11
+ "reocclusion_rate": 0.0,
12
+ "persistence_horizon_mae": 2.8290874414145946,
13
+ "disturbance_cost": 0.9037613173325857
14
+ }
15
+ }
artifacts/outputs/interaction/reveal_eval_interaction_ep2/reveal_benchmark.md ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Reveal Proxy Benchmark
2
+
3
+ ## interaction
4
+ - checkpoint: /workspace/VLAarchtests/artifacts/outputs/interaction/proxy_interaction_state_smoke/checkpoint_best.pt
5
+ - mean_success: 0.000
6
+ - visibility_integral: 62.474
7
+ - corridor_availability: 0.988
8
+ - reocclusion_rate: 0.000
9
+ - persistence_horizon_mae: 2.829
10
+ - disturbance_cost: 0.904
11
+ - foliage_proxy_success: 0.000
12
+ - bag_proxy_success: 0.000
13
+ - cloth_proxy_success: 0.000
artifacts/outputs/interaction/reveal_eval_interaction_full_ep2/reveal_benchmark.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "interaction": {
3
+ "per_task_success": {
4
+ "foliage_proxy": 0.0,
5
+ "bag_proxy": 0.0,
6
+ "cloth_proxy": 0.0
7
+ },
8
+ "mean_success": 0.0,
9
+ "visibility_integral": 62.6574592590332,
10
+ "corridor_availability": 0.9876543283462524,
11
+ "reocclusion_rate": 0.0,
12
+ "persistence_horizon_mae": 2.1672919432322186,
13
+ "disturbance_cost": 0.8980477948983511
14
+ }
15
+ }
artifacts/outputs/interaction/reveal_eval_interaction_full_ep2/reveal_benchmark.md ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Reveal Proxy Benchmark
2
+
3
+ ## interaction
4
+ - checkpoint: /workspace/VLAarchtests/artifacts/outputs/interaction/proxy_interaction_state/checkpoint_best.pt
5
+ - mean_success: 0.000
6
+ - visibility_integral: 62.657
7
+ - corridor_availability: 0.988
8
+ - reocclusion_rate: 0.000
9
+ - persistence_horizon_mae: 2.167
10
+ - disturbance_cost: 0.898
11
+ - foliage_proxy_success: 0.000
12
+ - bag_proxy_success: 0.000
13
+ - cloth_proxy_success: 0.000
artifacts/outputs/interaction/rlbench_env_smoke/import_and_train_command.txt ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "camera_names": [
3
+ "front",
4
+ "wrist_left",
5
+ "wrist_right"
6
+ ],
7
+ "resolution": [
8
+ 224,
9
+ 224
10
+ ],
11
+ "global_camera": "front",
12
+ "resolved_upstream_root": "/workspace/third_party/peract_bimanual/peract",
13
+ "imports": {
14
+ "rlbench": "ok",
15
+ "pyrep": "ok",
16
+ "yarr": "ok"
17
+ }
18
+ }
19
+ xvfb-run -a -s '-screen 0 1280x1024x24' /workspace/envs/rlbench/bin/python train.py method=PERACT_BC rlbench.task_name=multi_3cam 'rlbench.tasks=[bimanual_push_box,bimanual_lift_ball,bimanual_dual_push_buttons,bimanual_pick_plate,bimanual_put_item_in_drawer,bimanual_put_bottle_in_fridge,bimanual_handover_item,bimanual_pick_laptop,bimanual_straighten_rope,bimanual_sweep_to_dustpan,bimanual_lift_tray,bimanual_handover_item_easy,bimanual_take_tray_out_of_oven]' rlbench.demos=100 rlbench.demo_path=/workspace/data/rlbench2 replay.path=/workspace/replays/rlbench2 framework.logdir=/workspace/logs/rlbench2 framework.training_iterations=40000 framework.gpu=0 framework.env_gpu=0 framework.start_seed=0 ddp.num_devices=1 'rlbench.cameras=[front,wrist2,wrist]' 'rlbench.camera_resolution=[224,224]'
artifacts/outputs/interaction/rlbench_env_smoke/import_smoke.json ADDED
@@ -0,0 +1,18 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "camera_names": [
3
+ "front",
4
+ "wrist_left",
5
+ "wrist_right"
6
+ ],
7
+ "resolution": [
8
+ 224,
9
+ 224
10
+ ],
11
+ "global_camera": "front",
12
+ "resolved_upstream_root": "/workspace/third_party/peract_bimanual/peract",
13
+ "imports": {
14
+ "rlbench": "ok",
15
+ "pyrep": "ok",
16
+ "yarr": "ok"
17
+ }
18
+ }
artifacts/outputs/interaction/rlbench_env_smoke/launch_reset_smoke.json ADDED
@@ -0,0 +1,24 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "description": "hold the drawer with left hand and open the bottom drawer with right hand",
3
+ "front_rgb_shape": [
4
+ 128,
5
+ 128,
6
+ 3
7
+ ],
8
+ "wrist_rgb_shape": [
9
+ 128,
10
+ 128,
11
+ 3
12
+ ],
13
+ "wrist2_rgb_shape": [
14
+ 128,
15
+ 128,
16
+ 3
17
+ ],
18
+ "right_pose_shape": [
19
+ 7
20
+ ],
21
+ "left_pose_shape": [
22
+ 7
23
+ ]
24
+ }
artifacts/outputs/interaction/rlbench_env_smoke/launch_smoke_cli.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Launching task_design_open_drawer.ttt
2
+ dominant hand in open_drawer init_episode:
3
+ base_rotation_bounds:
4
+ {
5
+ "display": ":103",
6
+ "headless": true,
7
+ "task": "OpenDrawer",
8
+ "description": "hold the drawer with left hand and open the bottom drawer with right hand",
9
+ "front_rgb_shape": [
10
+ 128,
11
+ 128,
12
+ 3
13
+ ],
14
+ "wrist_rgb_shape": [
15
+ 128,
16
+ 128,
17
+ 3
18
+ ],
19
+ "wrist2_rgb_shape": [
20
+ 128,
21
+ 128,
22
+ 3
23
+ ],
24
+ "right_pose_shape": [
25
+ 7
26
+ ],
27
+ "left_pose_shape": [
28
+ 7
29
+ ],
30
+ "stepped_arm": "right",
31
+ "reward": 0.0,
32
+ "done": false,
33
+ "front_rgb_shape_after_step": [
34
+ 128,
35
+ 128,
36
+ 3
37
+ ]
38
+ }
39
+ Environment2Robots is shutting down
40
+ [CoppeliaSim:loadinfo] done.
artifacts/outputs/interaction/rlbench_env_smoke/launch_step_smoke.json ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "description": "hold the drawer with left hand and open the bottom drawer with right hand",
3
+ "reward": 0.0,
4
+ "done": false,
5
+ "front_rgb_shape_after_step": [
6
+ 128,
7
+ 128,
8
+ 3
9
+ ]
10
+ }
artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/config_resolved.yaml ADDED
@@ -0,0 +1,126 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ experiment_name: rlbench_open_drawer_interaction_smoke
2
+ output_dir: /workspace/VLAarchtests/artifacts/outputs/interaction
3
+ device: cuda
4
+ seed: 13
5
+ init_checkpoint: /workspace/VLAarchtests/artifacts/outputs/interaction/proxy_interaction_state_smoke/checkpoint_best.pt
6
+ init_strict: false
7
+ data:
8
+ dataset_root: /workspace/VLAarchtests/artifacts/data/rlbench_smoke_open_drawer
9
+ tasks:
10
+ - open_drawer
11
+ train_episodes:
12
+ - 0
13
+ val_episodes:
14
+ - 1
15
+ resolution: 128
16
+ chunk_horizon: 4
17
+ proprio_dim: 32
18
+ history_steps: 6
19
+ max_train_samples: 8
20
+ max_val_samples: 4
21
+ optim:
22
+ epochs: 1
23
+ batch_size: 2
24
+ num_workers: 0
25
+ lr: 0.0005
26
+ weight_decay: 0.0001
27
+ trainer:
28
+ policy_type: interaction_state
29
+ use_bf16: true
30
+ grad_clip_norm: 1.0
31
+ freeze_backbone: true
32
+ gradient_checkpointing: false
33
+ plan_during_train: false
34
+ plan_during_eval: true
35
+ support_mode_conditioning: true
36
+ planner_mode: proxy_pretrained
37
+ policy:
38
+ backbone:
39
+ model_name: openai/clip-vit-base-patch32
40
+ hidden_dim: 64
41
+ max_text_tokens: 32
42
+ freeze_backbone: true
43
+ gradient_checkpointing: false
44
+ use_dummy_backbone: true
45
+ fusion:
46
+ hidden_dim: 64
47
+ num_cameras: 3
48
+ num_layers: 2
49
+ num_heads: 4
50
+ ff_dim: 128
51
+ dropout: 0.1
52
+ proprio_dim: 32
53
+ proprio_tokens: 1
54
+ memory:
55
+ hidden_dim: 64
56
+ history_steps: 6
57
+ num_layers: 2
58
+ dropout: 0.1
59
+ memory_bank_size: 4
60
+ num_heads: 4
61
+ max_history_steps: 8
62
+ decoder:
63
+ hidden_dim: 64
64
+ num_heads: 4
65
+ num_layers: 2
66
+ ff_dim: 128
67
+ dropout: 0.1
68
+ chunk_size: 4
69
+ action_dim: 14
70
+ arm_action_dim: 7
71
+ num_candidates: 4
72
+ num_phases: 5
73
+ num_arm_roles: 4
74
+ reveal_head:
75
+ hidden_dim: 64
76
+ num_support_modes: 3
77
+ num_approach_templates: 32
78
+ rollout_horizon: 3
79
+ belief_map_size: 32
80
+ field_size: 16
81
+ num_heads: 4
82
+ predict_belief_map: true
83
+ num_phases: 5
84
+ num_arm_roles: 4
85
+ num_interaction_tokens: 8
86
+ world_model:
87
+ hidden_dim: 64
88
+ action_dim: 14
89
+ num_support_modes: 3
90
+ num_approach_templates: 32
91
+ rollout_horizon: 3
92
+ field_size: 16
93
+ num_heads: 4
94
+ num_phases: 5
95
+ num_arm_roles: 4
96
+ num_interaction_tokens: 8
97
+ belief_map_size: 32
98
+ predict_belief_map: true
99
+ planner:
100
+ hidden_dim: 64
101
+ num_candidates: 4
102
+ action_dim: 14
103
+ num_support_modes: 3
104
+ utility_margin: 0.1
105
+ corridor_weight: 1.0
106
+ persistence_weight: 0.5
107
+ proposal_weight: 0.5
108
+ task_progress_weight: 0.75
109
+ disturbance_weight: 0.75
110
+ reocclusion_weight: 0.5
111
+ visibility_weight: 0.25
112
+ num_heads: 4
113
+ num_layers: 2
114
+ num_phases: 5
115
+ num_arm_roles: 4
116
+ loss_weights:
117
+ action: 1.0
118
+ support_mode: 0.0
119
+ corridor: 0.0
120
+ persistence: 0.0
121
+ disturbance: 0.0
122
+ world_model: 0.0
123
+ belief: 0.0
124
+ planner_success: 0.0
125
+ planner_risk: 0.0
126
+ planner_ranking: 0.0
artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/metrics.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "epoch": 0,
4
+ "train": {
5
+ "action": 0.1628243774175644,
6
+ "planner_ranking": 0.0,
7
+ "planner_risk": 0.0,
8
+ "planner_success": 0.0,
9
+ "proposal_ranking": 0.0,
10
+ "proposal_reconstruction": 0.0,
11
+ "proposal_success": 0.0,
12
+ "total": 0.1628243774175644,
13
+ "world_model": 0.0
14
+ },
15
+ "val": {
16
+ "action": 0.05217807739973068,
17
+ "planner_ranking": 0.0,
18
+ "planner_risk": 0.0,
19
+ "planner_success": 0.0,
20
+ "proposal_ranking": 0.0,
21
+ "proposal_reconstruction": 0.0,
22
+ "proposal_success": 0.0,
23
+ "total": 0.05217807739973068,
24
+ "world_model": 0.0
25
+ }
26
+ }
27
+ ]
artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/summary.json ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "experiment_name": "rlbench_open_drawer_interaction_smoke",
3
+ "device": "cuda",
4
+ "best_checkpoint": "/workspace/VLAarchtests/artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/checkpoint_best.pt",
5
+ "final_train_total": 0.1628243774175644,
6
+ "final_val_total": 0.05217807739973068,
7
+ "train_dataset": {
8
+ "dataset_root": "/workspace/VLAarchtests/artifacts/data/rlbench_smoke_open_drawer",
9
+ "tasks": [
10
+ "open_drawer"
11
+ ],
12
+ "episode_indices": [
13
+ 0
14
+ ],
15
+ "num_episodes": 1,
16
+ "num_samples": 1,
17
+ "resolution": 128,
18
+ "chunk_size": 4,
19
+ "proprio_dim": 32,
20
+ "history_steps": 6
21
+ },
22
+ "val_dataset": {
23
+ "dataset_root": "/workspace/VLAarchtests/artifacts/data/rlbench_smoke_open_drawer",
24
+ "tasks": [
25
+ "open_drawer"
26
+ ],
27
+ "episode_indices": [
28
+ 1
29
+ ],
30
+ "num_episodes": 1,
31
+ "num_samples": 1,
32
+ "resolution": 128,
33
+ "chunk_size": 4,
34
+ "proprio_dim": 32,
35
+ "history_steps": 6
36
+ },
37
+ "init_info": {
38
+ "path": "/workspace/VLAarchtests/artifacts/outputs/interaction/proxy_interaction_state_smoke/checkpoint_best.pt",
39
+ "missing_keys": [],
40
+ "unexpected_keys": []
41
+ },
42
+ "planner_mode": "proxy_pretrained",
43
+ "plan_enabled_for_train": false,
44
+ "plan_enabled_for_eval": true,
45
+ "frozen_modules": [
46
+ "interaction_head",
47
+ "world_model",
48
+ "planner"
49
+ ]
50
+ }
artifacts/outputs/interaction/rlbench_open_drawer_rollout_eval/rollout_eval.json ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "checkpoint": "/workspace/VLAarchtests/artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/checkpoint_best.pt",
3
+ "plan_requested": true,
4
+ "plan_applied": true,
5
+ "planner_mode": "proxy_pretrained",
6
+ "support_mode_conditioning": true,
7
+ "episodes_per_task": 1,
8
+ "episode_length": 2,
9
+ "resolution": 128,
10
+ "cameras": [
11
+ "front",
12
+ "wrist_left",
13
+ "wrist_right"
14
+ ],
15
+ "tasks": {
16
+ "open_drawer": {
17
+ "error": "A path could not be found because the target is outside of workspace.",
18
+ "mean_success": 0.0,
19
+ "mean_return": 0.0
20
+ }
21
+ },
22
+ "mean_success": 0.0
23
+ }
artifacts/outputs/interaction/rlbench_open_drawer_rollout_eval/rollout_eval.md ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # RLBench Rollout Eval
2
+
3
+ - Checkpoint: `/workspace/VLAarchtests/artifacts/outputs/interaction/rlbench_open_drawer_interaction_smoke/checkpoint_best.pt`
4
+ - Plan requested: `True`
5
+ - Plan applied: `True`
6
+ - Support-mode conditioning: `True`
7
+ - Mean success: `0.000`
8
+
9
+ ## Per-task
10
+
11
+ - `open_drawer`: error=A path could not be found because the target is outside of workspace.
artifacts/outputs/interaction/smoke_checks/smoke_checks.json ADDED
@@ -0,0 +1,156 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "proxy": {
3
+ "losses": {
4
+ "action": 0.2892940640449524,
5
+ "phase": 1.4684441089630127,
6
+ "arm_role": 1.4457536935806274,
7
+ "support_mode": 1.0726321935653687,
8
+ "corridor": 0.7346047163009644,
9
+ "persistence": 1.7679060697555542,
10
+ "disturbance": 0.1656816601753235,
11
+ "belief": 0.6104393005371094,
12
+ "reocclusion": 0.6754688024520874,
13
+ "uncertainty": 0.733498752117157,
14
+ "world_model": 3.4413514137268066,
15
+ "planner_success": 0.5609128475189209,
16
+ "planner_risk": 0.09320252388715744,
17
+ "planner_ranking": 0.06516511738300323,
18
+ "proposal_reconstruction": 0.36118850111961365,
19
+ "proposal_success": 0.7169663906097412,
20
+ "proposal_ranking": 0.1487310826778412,
21
+ "total": 1.251321792602539
22
+ },
23
+ "grad_norm": 1.7515980005264282,
24
+ "candidate_shape": [
25
+ 2,
26
+ 4,
27
+ 4,
28
+ 14
29
+ ],
30
+ "rollout_phase_shape": [
31
+ 2,
32
+ 4,
33
+ 4,
34
+ 5
35
+ ]
36
+ },
37
+ "rlbench": {
38
+ "losses": {
39
+ "action": 0.4834498167037964,
40
+ "world_model": 0.0,
41
+ "planner_success": 0.0,
42
+ "planner_risk": 0.0,
43
+ "planner_ranking": 0.0,
44
+ "proposal_reconstruction": 0.0,
45
+ "proposal_success": 0.0,
46
+ "proposal_ranking": 0.0,
47
+ "total": 0.4834498167037964
48
+ },
49
+ "grad_norm": 2.1583147048950195,
50
+ "candidate_shape": [
51
+ 2,
52
+ 4,
53
+ 4,
54
+ 14
55
+ ],
56
+ "rollout_phase_shape": [
57
+ 2,
58
+ 4,
59
+ 4,
60
+ 5
61
+ ],
62
+ "planner_enabled_for_eval": true,
63
+ "frozen_modules": [
64
+ "interaction_head",
65
+ "world_model",
66
+ "planner"
67
+ ]
68
+ },
69
+ "policy_config": {
70
+ "backbone": {
71
+ "model_name": "openai/clip-vit-base-patch32",
72
+ "hidden_dim": 64,
73
+ "max_text_tokens": 32,
74
+ "freeze_backbone": true,
75
+ "gradient_checkpointing": false,
76
+ "use_dummy_backbone": true
77
+ },
78
+ "fusion": {
79
+ "hidden_dim": 64,
80
+ "num_cameras": 3,
81
+ "num_layers": 2,
82
+ "num_heads": 4,
83
+ "ff_dim": 128,
84
+ "dropout": 0.1,
85
+ "proprio_dim": 32,
86
+ "proprio_tokens": 1
87
+ },
88
+ "memory": {
89
+ "hidden_dim": 64,
90
+ "history_steps": 6,
91
+ "num_layers": 2,
92
+ "dropout": 0.1,
93
+ "memory_bank_size": 4,
94
+ "num_heads": 4,
95
+ "max_history_steps": 8
96
+ },
97
+ "decoder": {
98
+ "hidden_dim": 64,
99
+ "num_heads": 4,
100
+ "num_layers": 2,
101
+ "ff_dim": 128,
102
+ "dropout": 0.1,
103
+ "chunk_size": 4,
104
+ "action_dim": 14,
105
+ "arm_action_dim": 7,
106
+ "num_candidates": 4,
107
+ "num_phases": 5,
108
+ "num_arm_roles": 4
109
+ },
110
+ "reveal_head": {
111
+ "hidden_dim": 64,
112
+ "num_support_modes": 3,
113
+ "num_approach_templates": 32,
114
+ "rollout_horizon": 3,
115
+ "belief_map_size": 32,
116
+ "field_size": 16,
117
+ "num_heads": 4,
118
+ "predict_belief_map": true,
119
+ "num_phases": 5,
120
+ "num_arm_roles": 4,
121
+ "num_interaction_tokens": 8
122
+ },
123
+ "world_model": {
124
+ "hidden_dim": 64,
125
+ "action_dim": 14,
126
+ "num_support_modes": 3,
127
+ "num_approach_templates": 32,
128
+ "rollout_horizon": 3,
129
+ "field_size": 16,
130
+ "num_heads": 4,
131
+ "num_phases": 5,
132
+ "num_arm_roles": 4,
133
+ "num_interaction_tokens": 8,
134
+ "belief_map_size": 32,
135
+ "predict_belief_map": true
136
+ },
137
+ "planner": {
138
+ "hidden_dim": 64,
139
+ "num_candidates": 4,
140
+ "action_dim": 14,
141
+ "num_support_modes": 3,
142
+ "utility_margin": 0.1,
143
+ "corridor_weight": 1.0,
144
+ "persistence_weight": 0.5,
145
+ "proposal_weight": 0.5,
146
+ "task_progress_weight": 0.75,
147
+ "disturbance_weight": 0.75,
148
+ "reocclusion_weight": 0.5,
149
+ "visibility_weight": 0.25,
150
+ "num_heads": 4,
151
+ "num_layers": 2,
152
+ "num_phases": 5,
153
+ "num_arm_roles": 4
154
+ }
155
+ }
156
+ }
artifacts/outputs/interaction_rolefix/proxy_interaction_state_smoke/config_resolved.yaml ADDED
@@ -0,0 +1,120 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ experiment_name: proxy_interaction_state_smoke
2
+ output_dir: /workspace/VLAarchtests/artifacts/outputs/interaction
3
+ device: cuda
4
+ seed: 13
5
+ data:
6
+ proxies:
7
+ - foliage_proxy
8
+ - bag_proxy
9
+ - cloth_proxy
10
+ resolution: 64
11
+ train_episodes_per_proxy: 6
12
+ val_episodes_per_proxy: 2
13
+ train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_smoke_v4.pt
14
+ val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_smoke_v4.pt
15
+ rebuild_dataset: false
16
+ chunk_horizon: 4
17
+ rollout_horizon: 3
18
+ history_steps: 6
19
+ planner_candidates: 4
20
+ seed: 13
21
+ optim:
22
+ epochs: 2
23
+ batch_size: 8
24
+ num_workers: 0
25
+ lr: 0.001
26
+ weight_decay: 0.0001
27
+ trainer:
28
+ policy_type: interaction_state
29
+ use_bf16: true
30
+ grad_clip_norm: 1.0
31
+ freeze_backbone: true
32
+ gradient_checkpointing: false
33
+ plan_during_train: true
34
+ plan_during_eval: true
35
+ support_mode_conditioning: true
36
+ planner_mode: trainable
37
+ policy:
38
+ backbone:
39
+ model_name: openai/clip-vit-base-patch32
40
+ hidden_dim: 64
41
+ max_text_tokens: 32
42
+ freeze_backbone: true
43
+ gradient_checkpointing: false
44
+ use_dummy_backbone: true
45
+ fusion:
46
+ hidden_dim: 64
47
+ num_cameras: 3
48
+ num_layers: 2
49
+ num_heads: 4
50
+ ff_dim: 128
51
+ dropout: 0.1
52
+ proprio_dim: 32
53
+ proprio_tokens: 1
54
+ memory:
55
+ hidden_dim: 64
56
+ history_steps: 6
57
+ num_layers: 2
58
+ dropout: 0.1
59
+ memory_bank_size: 4
60
+ num_heads: 4
61
+ max_history_steps: 8
62
+ decoder:
63
+ hidden_dim: 64
64
+ num_heads: 4
65
+ num_layers: 2
66
+ ff_dim: 128
67
+ dropout: 0.1
68
+ chunk_size: 4
69
+ action_dim: 14
70
+ arm_action_dim: 7
71
+ num_candidates: 4
72
+ num_phases: 5
73
+ num_arm_roles: 4
74
+ reveal_head:
75
+ hidden_dim: 64
76
+ num_support_modes: 3
77
+ num_approach_templates: 32
78
+ rollout_horizon: 3
79
+ belief_map_size: 32
80
+ field_size: 16
81
+ num_heads: 4
82
+ predict_belief_map: true
83
+ num_phases: 5
84
+ num_arm_roles: 4
85
+ num_interaction_tokens: 8
86
+ world_model:
87
+ hidden_dim: 64
88
+ action_dim: 14
89
+ num_support_modes: 3
90
+ num_approach_templates: 32
91
+ rollout_horizon: 3
92
+ field_size: 16
93
+ num_heads: 4
94
+ num_phases: 5
95
+ num_arm_roles: 4
96
+ num_interaction_tokens: 8
97
+ planner:
98
+ hidden_dim: 64
99
+ num_candidates: 4
100
+ action_dim: 14
101
+ num_support_modes: 3
102
+ utility_margin: 0.1
103
+ num_heads: 4
104
+ num_layers: 2
105
+ num_phases: 5
106
+ num_arm_roles: 4
107
+ loss_weights:
108
+ action: 1.0
109
+ support_mode: 0.15
110
+ corridor: 0.2
111
+ persistence: 0.1
112
+ disturbance: 0.1
113
+ world_model: 0.25
114
+ belief: 0.05
115
+ planner_success: 0.2
116
+ planner_risk: 0.1
117
+ planner_ranking: 0.1
118
+ proposal_reconstruction: 0.2
119
+ proposal_success: 0.1
120
+ proposal_ranking: 0.1
artifacts/outputs/interaction_rolefix/proxy_interaction_state_smoke/diagnostics/proxy_diagnostics.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "planner_top1_accuracy": 0.5,
3
+ "planner_regret": 0.28291308879852295,
4
+ "risk_calibration_mse": 0.011351427994668484,
5
+ "role_collapse_rate": 0.0,
6
+ "num_samples": 16
7
+ }
artifacts/outputs/interaction_rolefix/proxy_interaction_state_smoke/metrics.json ADDED
@@ -0,0 +1,88 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "epoch": 0,
4
+ "train": {
5
+ "action": 0.19658433113779342,
6
+ "arm_role": 1.238295819078173,
7
+ "belief": 0.5369629051004138,
8
+ "corridor": 0.5293313392571041,
9
+ "disturbance": 0.09085389758859362,
10
+ "persistence": 1.7996907574789864,
11
+ "phase": 1.0361328125,
12
+ "planner_ranking": 0.1484200656414032,
13
+ "planner_risk": 0.03149750775524548,
14
+ "planner_success": 0.6290038738931928,
15
+ "proposal_ranking": 0.12105858219521386,
16
+ "proposal_reconstruction": 0.26322201426540104,
17
+ "proposal_success": 0.5991358501570565,
18
+ "reocclusion": 0.65535911491939,
19
+ "support_mode": 0.8046875,
20
+ "total": 1.8467402798788888,
21
+ "uncertainty": 0.5706954428127834,
22
+ "world_model": 2.483790295464652
23
+ },
24
+ "val": {
25
+ "action": 0.07703214511275291,
26
+ "arm_role": 0.7396750450134277,
27
+ "belief": 0.391730472445488,
28
+ "corridor": 0.39731982350349426,
29
+ "disturbance": 0.0602701585739851,
30
+ "persistence": 1.7171077132225037,
31
+ "phase": 0.8182927072048187,
32
+ "planner_ranking": 0.10551176220178604,
33
+ "planner_risk": 0.010366585105657578,
34
+ "planner_success": 0.6895906329154968,
35
+ "proposal_ranking": 0.10800172761082649,
36
+ "proposal_reconstruction": 0.11226572096347809,
37
+ "proposal_success": 0.6531190276145935,
38
+ "reocclusion": 0.7202109694480896,
39
+ "support_mode": 0.8539398014545441,
40
+ "total": 1.366153061389923,
41
+ "uncertainty": 0.47223055362701416,
42
+ "world_model": 1.7127767205238342
43
+ }
44
+ },
45
+ {
46
+ "epoch": 1,
47
+ "train": {
48
+ "action": 0.0750974959560803,
49
+ "arm_role": 0.5170274334294456,
50
+ "belief": 0.26841118931770325,
51
+ "corridor": 0.31833365133830477,
52
+ "disturbance": 0.03495508113077709,
53
+ "persistence": 1.7808540718896049,
54
+ "phase": 0.825927734375,
55
+ "planner_ranking": 0.1236130531345095,
56
+ "planner_risk": 0.008478787228731173,
57
+ "planner_success": 0.6077252456120082,
58
+ "proposal_ranking": 0.08608398373637881,
59
+ "proposal_reconstruction": 0.111362986266613,
60
+ "proposal_success": 0.5995349713734218,
61
+ "reocclusion": 0.705062244619642,
62
+ "support_mode": 0.7960728236607143,
63
+ "total": 1.205997347831726,
64
+ "uncertainty": 0.387926242181233,
65
+ "world_model": 1.4581984792436873
66
+ },
67
+ "val": {
68
+ "action": 0.057233477011322975,
69
+ "arm_role": 0.269483357667923,
70
+ "belief": 0.14032869786024094,
71
+ "corridor": 0.2390739619731903,
72
+ "disturbance": 0.007302357582375407,
73
+ "persistence": 1.7315670251846313,
74
+ "phase": 0.692381888628006,
75
+ "planner_ranking": 0.10375471040606499,
76
+ "planner_risk": 0.011348946020007133,
77
+ "planner_success": 0.651288777589798,
78
+ "proposal_ranking": 0.1232626661658287,
79
+ "proposal_reconstruction": 0.1019212193787098,
80
+ "proposal_success": 0.6862722337245941,
81
+ "reocclusion": 0.7099874913692474,
82
+ "support_mode": 0.7302495241165161,
83
+ "total": 1.130429446697235,
84
+ "uncertainty": 0.2572660893201828,
85
+ "world_model": 1.5461857914924622
86
+ }
87
+ }
88
+ ]
artifacts/outputs/interaction_rolefix/reveal_eval_interaction_smoke/reveal_benchmark.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "interaction": {
3
+ "per_task_success": {
4
+ "foliage_proxy": 0.0,
5
+ "bag_proxy": 0.0,
6
+ "cloth_proxy": 0.0
7
+ },
8
+ "mean_success": 0.0,
9
+ "visibility_integral": 62.513198375701904,
10
+ "corridor_availability": 0.9871399253606796,
11
+ "reocclusion_rate": 0.0,
12
+ "persistence_horizon_mae": 2.8390470795333385,
13
+ "disturbance_cost": 0.9011474947134653
14
+ }
15
+ }
artifacts/outputs/interaction_rolefix/reveal_eval_interaction_smoke/reveal_benchmark.md ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Reveal Proxy Benchmark
2
+
3
+ ## interaction
4
+ - checkpoint: /workspace/VLAarchtests/artifacts/outputs/interaction_rolefix/proxy_interaction_state_smoke/checkpoint_best.pt
5
+ - mean_success: 0.000
6
+ - visibility_integral: 62.513
7
+ - corridor_availability: 0.987
8
+ - reocclusion_rate: 0.000
9
+ - persistence_horizon_mae: 2.839
10
+ - disturbance_cost: 0.901
11
+ - foliage_proxy_success: 0.000
12
+ - bag_proxy_success: 0.000
13
+ - cloth_proxy_success: 0.000
artifacts/outputs/interaction_rolefix/smoke_checks/smoke_checks.json ADDED
@@ -0,0 +1,156 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "proxy": {
3
+ "losses": {
4
+ "action": 0.6122138500213623,
5
+ "phase": 1.8211359977722168,
6
+ "arm_role": 1.5296992063522339,
7
+ "support_mode": 1.1458361148834229,
8
+ "corridor": 0.7023701071739197,
9
+ "persistence": 2.00616717338562,
10
+ "disturbance": 0.16314803063869476,
11
+ "belief": 0.789874792098999,
12
+ "reocclusion": 0.6530417203903198,
13
+ "uncertainty": 0.7662769556045532,
14
+ "world_model": 3.8060429096221924,
15
+ "planner_success": 0.8667193651199341,
16
+ "planner_risk": 0.040573738515377045,
17
+ "planner_ranking": 0.26484477519989014,
18
+ "proposal_reconstruction": 0.7444740533828735,
19
+ "proposal_success": 0.8012435436248779,
20
+ "proposal_ranking": 0.07552901655435562,
21
+ "total": 1.9635474681854248
22
+ },
23
+ "grad_norm": 3.2980921268463135,
24
+ "candidate_shape": [
25
+ 2,
26
+ 4,
27
+ 4,
28
+ 14
29
+ ],
30
+ "rollout_phase_shape": [
31
+ 2,
32
+ 4,
33
+ 4,
34
+ 5
35
+ ]
36
+ },
37
+ "rlbench": {
38
+ "losses": {
39
+ "action": 0.44427579641342163,
40
+ "world_model": 0.0,
41
+ "planner_success": 0.0,
42
+ "planner_risk": 0.0,
43
+ "planner_ranking": 0.0,
44
+ "proposal_reconstruction": 0.0,
45
+ "proposal_success": 0.0,
46
+ "proposal_ranking": 0.0,
47
+ "total": 0.44427579641342163
48
+ },
49
+ "grad_norm": 2.2887489795684814,
50
+ "candidate_shape": [
51
+ 2,
52
+ 4,
53
+ 4,
54
+ 14
55
+ ],
56
+ "rollout_phase_shape": [
57
+ 2,
58
+ 4,
59
+ 4,
60
+ 5
61
+ ],
62
+ "planner_enabled_for_eval": true,
63
+ "frozen_modules": [
64
+ "interaction_head",
65
+ "world_model",
66
+ "planner"
67
+ ]
68
+ },
69
+ "policy_config": {
70
+ "backbone": {
71
+ "model_name": "openai/clip-vit-base-patch32",
72
+ "hidden_dim": 64,
73
+ "max_text_tokens": 32,
74
+ "freeze_backbone": true,
75
+ "gradient_checkpointing": false,
76
+ "use_dummy_backbone": true
77
+ },
78
+ "fusion": {
79
+ "hidden_dim": 64,
80
+ "num_cameras": 3,
81
+ "num_layers": 2,
82
+ "num_heads": 4,
83
+ "ff_dim": 128,
84
+ "dropout": 0.1,
85
+ "proprio_dim": 32,
86
+ "proprio_tokens": 1
87
+ },
88
+ "memory": {
89
+ "hidden_dim": 64,
90
+ "history_steps": 6,
91
+ "num_layers": 2,
92
+ "dropout": 0.1,
93
+ "memory_bank_size": 4,
94
+ "num_heads": 4,
95
+ "max_history_steps": 8
96
+ },
97
+ "decoder": {
98
+ "hidden_dim": 64,
99
+ "num_heads": 4,
100
+ "num_layers": 2,
101
+ "ff_dim": 128,
102
+ "dropout": 0.1,
103
+ "chunk_size": 4,
104
+ "action_dim": 14,
105
+ "arm_action_dim": 7,
106
+ "num_candidates": 4,
107
+ "num_phases": 5,
108
+ "num_arm_roles": 4
109
+ },
110
+ "reveal_head": {
111
+ "hidden_dim": 64,
112
+ "num_support_modes": 3,
113
+ "num_approach_templates": 32,
114
+ "rollout_horizon": 3,
115
+ "belief_map_size": 32,
116
+ "field_size": 16,
117
+ "num_heads": 4,
118
+ "predict_belief_map": true,
119
+ "num_phases": 5,
120
+ "num_arm_roles": 4,
121
+ "num_interaction_tokens": 8
122
+ },
123
+ "world_model": {
124
+ "hidden_dim": 64,
125
+ "action_dim": 14,
126
+ "num_support_modes": 3,
127
+ "num_approach_templates": 32,
128
+ "rollout_horizon": 3,
129
+ "field_size": 16,
130
+ "num_heads": 4,
131
+ "num_phases": 5,
132
+ "num_arm_roles": 4,
133
+ "num_interaction_tokens": 8,
134
+ "belief_map_size": 32,
135
+ "predict_belief_map": true
136
+ },
137
+ "planner": {
138
+ "hidden_dim": 64,
139
+ "num_candidates": 4,
140
+ "action_dim": 14,
141
+ "num_support_modes": 3,
142
+ "utility_margin": 0.1,
143
+ "corridor_weight": 1.0,
144
+ "persistence_weight": 0.5,
145
+ "proposal_weight": 0.5,
146
+ "task_progress_weight": 0.75,
147
+ "disturbance_weight": 0.75,
148
+ "reocclusion_weight": 0.5,
149
+ "visibility_weight": 0.25,
150
+ "num_heads": 4,
151
+ "num_layers": 2,
152
+ "num_phases": 5,
153
+ "num_arm_roles": 4
154
+ }
155
+ }
156
+ }
artifacts/outputs/interaction_rolefix_full/proxy_interaction_state/config_resolved.yaml ADDED
@@ -0,0 +1,120 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ experiment_name: proxy_interaction_state
2
+ output_dir: /workspace/VLAarchtests/artifacts/outputs/interaction
3
+ device: cuda
4
+ seed: 13
5
+ data:
6
+ proxies:
7
+ - foliage_proxy
8
+ - bag_proxy
9
+ - cloth_proxy
10
+ resolution: 96
11
+ train_episodes_per_proxy: 48
12
+ val_episodes_per_proxy: 16
13
+ train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_v4_noleak_counterfactual.pt
14
+ val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_v4_noleak_counterfactual.pt
15
+ rebuild_dataset: false
16
+ chunk_horizon: 8
17
+ rollout_horizon: 5
18
+ history_steps: 6
19
+ planner_candidates: 8
20
+ seed: 13
21
+ optim:
22
+ epochs: 8
23
+ batch_size: 16
24
+ num_workers: 0
25
+ lr: 0.001
26
+ weight_decay: 0.0001
27
+ trainer:
28
+ policy_type: interaction_state
29
+ use_bf16: true
30
+ grad_clip_norm: 1.0
31
+ freeze_backbone: true
32
+ gradient_checkpointing: false
33
+ plan_during_train: true
34
+ plan_during_eval: true
35
+ support_mode_conditioning: true
36
+ planner_mode: trainable
37
+ policy:
38
+ backbone:
39
+ model_name: openai/clip-vit-base-patch32
40
+ hidden_dim: 128
41
+ max_text_tokens: 32
42
+ freeze_backbone: true
43
+ gradient_checkpointing: false
44
+ use_dummy_backbone: true
45
+ fusion:
46
+ hidden_dim: 128
47
+ num_cameras: 3
48
+ num_layers: 2
49
+ num_heads: 4
50
+ ff_dim: 256
51
+ dropout: 0.1
52
+ proprio_dim: 32
53
+ proprio_tokens: 1
54
+ memory:
55
+ hidden_dim: 128
56
+ history_steps: 6
57
+ num_layers: 2
58
+ dropout: 0.1
59
+ memory_bank_size: 4
60
+ num_heads: 4
61
+ max_history_steps: 8
62
+ decoder:
63
+ hidden_dim: 128
64
+ num_heads: 4
65
+ num_layers: 2
66
+ ff_dim: 256
67
+ dropout: 0.1
68
+ chunk_size: 8
69
+ action_dim: 14
70
+ arm_action_dim: 7
71
+ num_candidates: 8
72
+ num_phases: 5
73
+ num_arm_roles: 4
74
+ reveal_head:
75
+ hidden_dim: 128
76
+ num_support_modes: 3
77
+ num_approach_templates: 32
78
+ rollout_horizon: 5
79
+ belief_map_size: 32
80
+ field_size: 16
81
+ num_heads: 4
82
+ predict_belief_map: true
83
+ num_phases: 5
84
+ num_arm_roles: 4
85
+ num_interaction_tokens: 8
86
+ world_model:
87
+ hidden_dim: 128
88
+ action_dim: 14
89
+ num_support_modes: 3
90
+ num_approach_templates: 32
91
+ rollout_horizon: 5
92
+ field_size: 16
93
+ num_heads: 4
94
+ num_phases: 5
95
+ num_arm_roles: 4
96
+ num_interaction_tokens: 8
97
+ planner:
98
+ hidden_dim: 128
99
+ num_candidates: 8
100
+ action_dim: 14
101
+ num_support_modes: 3
102
+ utility_margin: 0.1
103
+ num_heads: 4
104
+ num_layers: 2
105
+ num_phases: 5
106
+ num_arm_roles: 4
107
+ loss_weights:
108
+ action: 1.0
109
+ support_mode: 0.15
110
+ corridor: 0.2
111
+ persistence: 0.1
112
+ disturbance: 0.1
113
+ world_model: 0.25
114
+ belief: 0.05
115
+ planner_success: 0.2
116
+ planner_risk: 0.1
117
+ planner_ranking: 0.1
118
+ proposal_reconstruction: 0.2
119
+ proposal_success: 0.1
120
+ proposal_ranking: 0.1
artifacts/outputs/interaction_rolefix_full/proxy_interaction_state/diagnostics/proxy_diagnostics.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "planner_top1_accuracy": 0.29365079365079366,
3
+ "planner_regret": 0.08918909728527069,
4
+ "risk_calibration_mse": 0.009334742091596127,
5
+ "role_collapse_rate": 0.0,
6
+ "num_samples": 126
7
+ }
artifacts/outputs/interaction_rolefix_full/proxy_interaction_state/metrics.json ADDED
@@ -0,0 +1,346 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ [
2
+ {
3
+ "epoch": 0,
4
+ "train": {
5
+ "action": 0.10215476644225419,
6
+ "arm_role": 0.15410413238290252,
7
+ "belief": 0.2275839550420642,
8
+ "corridor": 0.31619268904129666,
9
+ "disturbance": 0.03557364640194768,
10
+ "persistence": 4.14529608686765,
11
+ "phase": 0.853579930961132,
12
+ "planner_ranking": 0.1402236126984159,
13
+ "planner_risk": 0.014521602657623589,
14
+ "planner_success": 0.6516827717423439,
15
+ "proposal_ranking": 0.12396896040687959,
16
+ "proposal_reconstruction": 0.15117586574827632,
17
+ "proposal_success": 0.6129913156231245,
18
+ "reocclusion": 0.6800185019771258,
19
+ "support_mode": 0.750041052699089,
20
+ "total": 1.7794813563426335,
21
+ "uncertainty": 0.2749920679877202,
22
+ "world_model": 2.930093298355738
23
+ },
24
+ "val": {
25
+ "action": 0.024464906891807914,
26
+ "arm_role": 0.00021468327213369776,
27
+ "belief": 0.11063466407358646,
28
+ "corridor": 0.24291332066059113,
29
+ "disturbance": 0.0021771492902189493,
30
+ "persistence": 4.035085469484329,
31
+ "phase": 0.7842688634991646,
32
+ "planner_ranking": 0.09380591381341219,
33
+ "planner_risk": 0.010528087033890188,
34
+ "planner_success": 0.6487544104456902,
35
+ "proposal_ranking": 0.09357322473078966,
36
+ "proposal_reconstruction": 0.05812322115525603,
37
+ "proposal_success": 0.6223367899656296,
38
+ "reocclusion": 0.6689130887389183,
39
+ "support_mode": 0.6824429258704185,
40
+ "total": 1.57107612490654,
41
+ "uncertainty": 0.04649291839450598,
42
+ "world_model": 2.8396184891462326
43
+ }
44
+ },
45
+ {
46
+ "epoch": 1,
47
+ "train": {
48
+ "action": 0.026911177905276418,
49
+ "arm_role": 9.164462486902873e-05,
50
+ "belief": 0.1127748250340422,
51
+ "corridor": 0.2482043243944645,
52
+ "disturbance": 0.0027894085894028344,
53
+ "persistence": 4.123300572236379,
54
+ "phase": 0.6966945106784502,
55
+ "planner_ranking": 0.1299859213953217,
56
+ "planner_risk": 0.011287257443958273,
57
+ "planner_success": 0.5469006697336832,
58
+ "proposal_ranking": 0.09497337446858485,
59
+ "proposal_reconstruction": 0.0546847361450394,
60
+ "proposal_success": 0.6040425598621368,
61
+ "reocclusion": 0.6738451148072878,
62
+ "support_mode": 0.6803697869181633,
63
+ "total": 1.4895438154538472,
64
+ "uncertainty": 0.04838159323359529,
65
+ "world_model": 2.5581150303284326
66
+ },
67
+ "val": {
68
+ "action": 0.0219610589556396,
69
+ "arm_role": 4.7797779643588e-05,
70
+ "belief": 0.11248616222292185,
71
+ "corridor": 0.24107512645423412,
72
+ "disturbance": 0.00229803760885261,
73
+ "persistence": 3.881433367729187,
74
+ "phase": 0.6858366876840591,
75
+ "planner_ranking": 0.10271583311259747,
76
+ "planner_risk": 0.010726989770773798,
77
+ "planner_success": 0.5016077607870102,
78
+ "proposal_ranking": 0.10926759615540504,
79
+ "proposal_reconstruction": 0.04846362583339214,
80
+ "proposal_success": 0.6263654828071594,
81
+ "reocclusion": 0.6623825207352638,
82
+ "support_mode": 0.6905809789896011,
83
+ "total": 1.4332728832960129,
84
+ "uncertainty": 0.03836950287222862,
85
+ "world_model": 2.490630403161049
86
+ }
87
+ },
88
+ {
89
+ "epoch": 2,
90
+ "train": {
91
+ "action": 0.028564381878823042,
92
+ "arm_role": 4.20472629230062e-05,
93
+ "belief": 0.11768585878113906,
94
+ "corridor": 0.2521046095838149,
95
+ "disturbance": 0.004006393282907084,
96
+ "persistence": 4.002537985642751,
97
+ "phase": 0.6817111050089201,
98
+ "planner_ranking": 0.14222958280394474,
99
+ "planner_risk": 0.010941210687936595,
100
+ "planner_success": 0.51358712464571,
101
+ "proposal_ranking": 0.10021264447520177,
102
+ "proposal_reconstruction": 0.05586679264282187,
103
+ "proposal_success": 0.6042261434098085,
104
+ "reocclusion": 0.6711050619681677,
105
+ "support_mode": 0.6735592807332674,
106
+ "total": 1.4198974122603734,
107
+ "uncertainty": 0.04468160099349916,
108
+ "world_model": 2.342899337410927
109
+ },
110
+ "val": {
111
+ "action": 0.03662527119740844,
112
+ "arm_role": 3.9326611840806436e-05,
113
+ "belief": 0.11038805078715086,
114
+ "corridor": 0.23578420095145702,
115
+ "disturbance": 0.0031197248463286087,
116
+ "persistence": 3.7882876694202423,
117
+ "phase": 0.677653007209301,
118
+ "planner_ranking": 0.12569222133606672,
119
+ "planner_risk": 0.010821192641742527,
120
+ "planner_success": 0.5561830475926399,
121
+ "proposal_ranking": 0.09295124560594559,
122
+ "proposal_reconstruction": 0.06929249316453934,
123
+ "proposal_success": 0.6254506856203079,
124
+ "reocclusion": 0.6604316681623459,
125
+ "support_mode": 0.6677745059132576,
126
+ "total": 1.2636573165655136,
127
+ "uncertainty": 0.02768313675187528,
128
+ "world_model": 1.7483449429273605
129
+ }
130
+ },
131
+ {
132
+ "epoch": 3,
133
+ "train": {
134
+ "action": 0.030749366773913305,
135
+ "arm_role": 4.2617077118241774e-05,
136
+ "belief": 0.11198224344601233,
137
+ "corridor": 0.24353070246676603,
138
+ "disturbance": 0.004747987113660201,
139
+ "persistence": 3.7688617209593454,
140
+ "phase": 0.6659654900431633,
141
+ "planner_ranking": 0.12002094245205323,
142
+ "planner_risk": 0.010106622396657864,
143
+ "planner_success": 0.472127099831899,
144
+ "proposal_ranking": 0.09478530536095302,
145
+ "proposal_reconstruction": 0.059262806084007025,
146
+ "proposal_success": 0.6104264035820961,
147
+ "reocclusion": 0.6585924625396729,
148
+ "support_mode": 0.6661049971977869,
149
+ "total": 1.3116108278433483,
150
+ "uncertainty": 0.02409021647569413,
151
+ "world_model": 2.0509919623533883
152
+ },
153
+ "val": {
154
+ "action": 0.020845535211265087,
155
+ "arm_role": 4.311565771786263e-05,
156
+ "belief": 0.105616076849401,
157
+ "corridor": 0.23376570269465446,
158
+ "disturbance": 0.002147116305422969,
159
+ "persistence": 3.7260473370552063,
160
+ "phase": 0.6661699637770653,
161
+ "planner_ranking": 0.10419025458395481,
162
+ "planner_risk": 0.010339341242797673,
163
+ "planner_success": 0.46252304688096046,
164
+ "proposal_ranking": 0.09330006875097752,
165
+ "proposal_reconstruction": 0.04469671146944165,
166
+ "proposal_success": 0.6214711964130402,
167
+ "reocclusion": 0.6415831819176674,
168
+ "support_mode": 0.6682936698198318,
169
+ "total": 1.2371356934309006,
170
+ "uncertainty": 0.021665064617991447,
171
+ "world_model": 1.8418128192424774
172
+ }
173
+ },
174
+ {
175
+ "epoch": 4,
176
+ "train": {
177
+ "action": 0.023547588226695854,
178
+ "arm_role": 4.4845532405209575e-05,
179
+ "belief": 0.10733066033571959,
180
+ "corridor": 0.2384033997853597,
181
+ "disturbance": 0.0032167407577314102,
182
+ "persistence": 3.8173932135105133,
183
+ "phase": 0.6745133176445961,
184
+ "planner_ranking": 0.10369156207889318,
185
+ "planner_risk": 0.01009264924020196,
186
+ "planner_success": 0.4860173078874747,
187
+ "proposal_ranking": 0.09702414429436128,
188
+ "proposal_reconstruction": 0.0478425626643002,
189
+ "proposal_success": 0.6053199768066406,
190
+ "reocclusion": 0.6491402039925257,
191
+ "support_mode": 0.6703156977891922,
192
+ "total": 1.2156481097141902,
193
+ "uncertainty": 0.024805960594676435,
194
+ "world_model": 1.684378559390704
195
+ },
196
+ "val": {
197
+ "action": 0.02007221127860248,
198
+ "arm_role": 6.0773097175115254e-05,
199
+ "belief": 0.10199161060154438,
200
+ "corridor": 0.22850653901696205,
201
+ "disturbance": 0.0017478264489909634,
202
+ "persistence": 3.6291932463645935,
203
+ "phase": 0.6642125844955444,
204
+ "planner_ranking": 0.09935609716922045,
205
+ "planner_risk": 0.009536529192700982,
206
+ "planner_success": 0.45760077610611916,
207
+ "proposal_ranking": 0.09855884779244661,
208
+ "proposal_reconstruction": 0.04397509805858135,
209
+ "proposal_success": 0.6215623244643211,
210
+ "reocclusion": 0.6404022425413132,
211
+ "support_mode": 0.6641640961170197,
212
+ "total": 1.153723917901516,
213
+ "uncertainty": 0.02464893041178584,
214
+ "world_model": 1.56255304813385
215
+ }
216
+ },
217
+ {
218
+ "epoch": 5,
219
+ "train": {
220
+ "action": 0.022455799548576277,
221
+ "arm_role": 5.3321499156785045e-05,
222
+ "belief": 0.10393211245536804,
223
+ "corridor": 0.23205090935031572,
224
+ "disturbance": 0.0021382822984984764,
225
+ "persistence": 3.760234226783117,
226
+ "phase": 0.6825721388061842,
227
+ "planner_ranking": 0.11921679352720578,
228
+ "planner_risk": 0.010239185998216271,
229
+ "planner_success": 0.467387559513251,
230
+ "proposal_ranking": 0.09636436806370814,
231
+ "proposal_reconstruction": 0.0463158117296795,
232
+ "proposal_success": 0.604705015818278,
233
+ "reocclusion": 0.6451127852002779,
234
+ "support_mode": 0.6723414833347002,
235
+ "total": 1.1677857091029484,
236
+ "uncertainty": 0.017458321526646614,
237
+ "world_model": 1.5345012545585632
238
+ },
239
+ "val": {
240
+ "action": 0.020456953439861536,
241
+ "arm_role": 5.5397130381606985e-05,
242
+ "belief": 0.100255505181849,
243
+ "corridor": 0.22343307547271252,
244
+ "disturbance": 0.0018057649213005789,
245
+ "persistence": 3.819442391395569,
246
+ "phase": 0.6870930641889572,
247
+ "planner_ranking": 0.12271129060536623,
248
+ "planner_risk": 0.009507962386123836,
249
+ "planner_success": 0.47849390283226967,
250
+ "proposal_ranking": 0.09397839661687613,
251
+ "proposal_reconstruction": 0.04395680082961917,
252
+ "proposal_success": 0.6256562769412994,
253
+ "reocclusion": 0.6624282449483871,
254
+ "support_mode": 0.6657112762331963,
255
+ "total": 1.3062576353549957,
256
+ "uncertainty": 0.007776510377880186,
257
+ "world_model": 2.0670085549354553
258
+ }
259
+ },
260
+ {
261
+ "epoch": 6,
262
+ "train": {
263
+ "action": 0.022894175878415506,
264
+ "arm_role": 5.4112812904349994e-05,
265
+ "belief": 0.10060124254475038,
266
+ "corridor": 0.23040568207701048,
267
+ "disturbance": 0.0020979453014054648,
268
+ "persistence": 3.749631315469742,
269
+ "phase": 0.6835000167290369,
270
+ "planner_ranking": 0.10540719423443079,
271
+ "planner_risk": 0.011304946111825606,
272
+ "planner_success": 0.43665214255452156,
273
+ "proposal_ranking": 0.09107906681795915,
274
+ "proposal_reconstruction": 0.04669830979158481,
275
+ "proposal_success": 0.6054539605975151,
276
+ "reocclusion": 0.6455749049782753,
277
+ "support_mode": 0.6700228725870451,
278
+ "total": 1.1786824663480122,
279
+ "uncertainty": 0.014146532688755542,
280
+ "world_model": 1.6150691360235214
281
+ },
282
+ "val": {
283
+ "action": 0.02070643357001245,
284
+ "arm_role": 4.2248018871759996e-05,
285
+ "belief": 0.10063061211258173,
286
+ "corridor": 0.22452155128121376,
287
+ "disturbance": 0.0018244763487018645,
288
+ "persistence": 3.6125852465629578,
289
+ "phase": 0.6734225451946259,
290
+ "planner_ranking": 0.0999936256557703,
291
+ "planner_risk": 0.010059075022581965,
292
+ "planner_success": 0.45402833819389343,
293
+ "proposal_ranking": 0.0882191276177764,
294
+ "proposal_reconstruction": 0.04391673672944307,
295
+ "proposal_success": 0.624024972319603,
296
+ "reocclusion": 0.6362400725483894,
297
+ "support_mode": 0.664807952940464,
298
+ "total": 1.134026937186718,
299
+ "uncertainty": 0.009506796195637435,
300
+ "world_model": 1.4956171810626984
301
+ }
302
+ },
303
+ {
304
+ "epoch": 7,
305
+ "train": {
306
+ "action": 0.02265403970765571,
307
+ "arm_role": 4.537651936213175e-05,
308
+ "belief": 0.10131731970856588,
309
+ "corridor": 0.22949850497146448,
310
+ "disturbance": 0.0021897068994197375,
311
+ "persistence": 3.6896196703116098,
312
+ "phase": 0.6795123865207037,
313
+ "planner_ranking": 0.09418578383823235,
314
+ "planner_risk": 0.00923546745131413,
315
+ "planner_success": 0.42756689339876175,
316
+ "proposal_ranking": 0.09173912275582552,
317
+ "proposal_reconstruction": 0.04657370550557971,
318
+ "proposal_success": 0.6038760592540106,
319
+ "reocclusion": 0.6364429369568825,
320
+ "support_mode": 0.6676999057332674,
321
+ "total": 1.1160989701747894,
322
+ "uncertainty": 0.01297911632961283,
323
+ "world_model": 1.4062732805808384
324
+ },
325
+ "val": {
326
+ "action": 0.023696284973993897,
327
+ "arm_role": 3.5256778573966585e-05,
328
+ "belief": 0.09744055476039648,
329
+ "corridor": 0.22240561619400978,
330
+ "disturbance": 0.0017758552203304134,
331
+ "persistence": 3.608371615409851,
332
+ "phase": 0.6682962626218796,
333
+ "planner_ranking": 0.10720822960138321,
334
+ "planner_risk": 0.009278025652747601,
335
+ "planner_success": 0.4377236105501652,
336
+ "proposal_ranking": 0.09098756965249777,
337
+ "proposal_reconstruction": 0.04804757330566645,
338
+ "proposal_success": 0.6270129010081291,
339
+ "reocclusion": 0.6341496035456657,
340
+ "support_mode": 0.6644193530082703,
341
+ "total": 1.0928071364760399,
342
+ "uncertainty": 0.015584498294629157,
343
+ "world_model": 1.3288657069206238
344
+ }
345
+ }
346
+ ]
artifacts/outputs/interaction_rolefix_full/reveal_eval_interaction/reveal_benchmark.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "interaction": {
3
+ "per_task_success": {
4
+ "foliage_proxy": 0.0,
5
+ "bag_proxy": 0.0,
6
+ "cloth_proxy": 0.0
7
+ },
8
+ "mean_success": 0.0,
9
+ "visibility_integral": 64.04203844070435,
10
+ "corridor_availability": 0.9837105721235275,
11
+ "reocclusion_rate": 0.0,
12
+ "persistence_horizon_mae": 1.7914747282500483,
13
+ "disturbance_cost": 0.8335009200705422
14
+ }
15
+ }
artifacts/outputs/interaction_rolefix_full/reveal_eval_interaction/reveal_benchmark.md ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Reveal Proxy Benchmark
2
+
3
+ ## interaction
4
+ - checkpoint: /workspace/VLAarchtests/artifacts/outputs/interaction_rolefix_full/proxy_interaction_state/checkpoint_best.pt
5
+ - mean_success: 0.000
6
+ - visibility_integral: 64.042
7
+ - corridor_availability: 0.984
8
+ - reocclusion_rate: 0.000
9
+ - persistence_horizon_mae: 1.791
10
+ - disturbance_cost: 0.834
11
+ - foliage_proxy_success: 0.000
12
+ - bag_proxy_success: 0.000
13
+ - cloth_proxy_success: 0.000