lsnu committed 6 days ago

Commit

430a41a

verified ·

1 Parent(s): 8c435a3

Add files using upload-large-folder tool

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/benchmark_full/reveal_benchmark.json +15 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/benchmark_full/reveal_benchmark.md +13 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/config_resolved.yaml +149 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/diagnostics_full/proxy_diagnostics.json +16 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/metrics.json +230 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/summary.json +557 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/benchmark_full/reveal_benchmark.json +15 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/benchmark_full/reveal_benchmark.md +13 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/config_resolved.yaml +149 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/diagnostics_full/proxy_diagnostics.json +16 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/metrics.json +230 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/summary.json +557 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/benchmark_full/reveal_benchmark.json +15 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/benchmark_full/reveal_benchmark.md +13 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/config_resolved.yaml +149 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/diagnostics_full/proxy_diagnostics.json +16 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/metrics.json +230 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/summary.json +557 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/benchmark_full/reveal_benchmark.json +15 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/benchmark_full/reveal_benchmark.md +13 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/benchmark_no_planner/reveal_benchmark.json +15 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/benchmark_no_planner/reveal_benchmark.md +13 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/benchmark_no_role_symmetry/reveal_benchmark.json +15 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/benchmark_no_role_symmetry/reveal_benchmark.md +13 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/config_resolved.yaml +147 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/diagnostics_full/proxy_diagnostics.json +16 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/metrics.json +230 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/summary.json +14 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/benchmark_full/reveal_benchmark.json +15 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/benchmark_full/reveal_benchmark.md +13 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/benchmark_no_planner/reveal_benchmark.json +15 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/benchmark_no_planner/reveal_benchmark.md +13 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/benchmark_no_role_symmetry/reveal_benchmark.json +15 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/benchmark_no_role_symmetry/reveal_benchmark.md +13 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/config_resolved.yaml +147 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/diagnostics_full/proxy_diagnostics.json +16 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/metrics.json +230 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/summary.json +14 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/benchmark_full/reveal_benchmark.json +15 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/benchmark_full/reveal_benchmark.md +13 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/benchmark_no_planner/reveal_benchmark.json +15 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/benchmark_no_planner/reveal_benchmark.md +13 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/benchmark_no_role_symmetry/reveal_benchmark.json +15 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/benchmark_no_role_symmetry/reveal_benchmark.md +13 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/config_resolved.yaml +147 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/diagnostics_full/proxy_diagnostics.json +16 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/metrics.json +230 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/summary.json +14 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage2_clip_seed11/benchmark_full/reveal_benchmark.json +15 -0
artifacts/outputs/r3d/proxy_interaction_r3d_stage2_clip_seed11/benchmark_full/reveal_benchmark.md +13 -0

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/benchmark_full/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "full": {
+    "per_task_success": {
+      "foliage_proxy": 0.375,
+      "bag_proxy": 0.4583333333333333,
+      "cloth_proxy": 0.5833333333333334
+    },
+    "mean_success": 0.47222222222222215,
+    "visibility_integral": 37.36026926173104,
+    "corridor_availability": 0.8730104863643646,
+    "reocclusion_rate": 0.04405864197530864,
+    "persistence_horizon_mae": 1.033145775666108,
+    "disturbance_cost": 0.3228136783000082
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/benchmark_full/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## full
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/checkpoint_best.pt
+- mean_success: 0.472
+- visibility_integral: 37.360
+- corridor_availability: 0.873
+- reocclusion_rate: 0.044
+- persistence_horizon_mae: 1.033
+- disturbance_cost: 0.323
+- foliage_proxy_success: 0.375
+- bag_proxy_success: 0.458
+- cloth_proxy_success: 0.583

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/config_resolved.yaml ADDED Viewed

	@@ -0,0 +1,149 @@

+experiment_name: proxy_interaction_r3d_stage1_clip_seed7
+output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
+device: cuda
+seed: 7
+init_checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt
+init_strict: false
+data:
+  proxies:
+  - foliage_proxy
+  - bag_proxy
+  - cloth_proxy
+  resolution: 224
+  dataset_version: reveal_proxy_v6_rgbd_elastic_state
+  train_episodes_per_proxy: 48
+  val_episodes_per_proxy: 16
+  train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_clip224_v6_rgbd_stage1_seed7.pt
+  val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_clip224_v6_rgbd_stage1_seed7.pt
+  rebuild_dataset: false
+  chunk_horizon: 8
+  rollout_horizon: 5
+  history_steps: 6
+  planner_candidates: 8
+  seed: 7
+optim:
+  epochs: 4
+  batch_size: 2
+  num_workers: 4
+  lr: 0.0003
+  weight_decay: 0.0001
+trainer:
+  policy_type: elastic_reveal
+  use_bf16: true
+  grad_clip_norm: 1.0
+  freeze_backbone: true
+  gradient_checkpointing: false
+  plan_during_train: true
+  plan_during_eval: true
+  support_mode_conditioning: true
+  planner_mode: trainable
+  use_depth: false
+  use_world_model: true
+  use_role_tokens: true
+  compute_equivariance_probe: true
+policy:
+  backbone:
+    model_name: openai/clip-vit-base-patch32
+    hidden_dim: 512
+    max_text_tokens: 32
+    freeze_backbone: true
+    gradient_checkpointing: false
+    use_dummy_backbone: false
+  fusion:
+    hidden_dim: 512
+    num_cameras: 3
+    num_layers: 4
+    num_heads: 8
+    ff_dim: 2048
+    dropout: 0.1
+    proprio_dim: 32
+    proprio_tokens: 1
+  memory:
+    hidden_dim: 512
+    action_dim: 14
+    history_steps: 6
+    scene_history_steps: 3
+    belief_history_steps: 8
+    num_layers: 2
+    dropout: 0.1
+    memory_bank_size: 4
+    scene_bank_size: 2
+    belief_bank_size: 2
+    num_heads: 8
+    max_history_steps: 8
+  decoder:
+    hidden_dim: 512
+    num_heads: 8
+    num_layers: 4
+    ff_dim: 2048
+    dropout: 0.1
+    chunk_size: 8
+    action_dim: 14
+    arm_action_dim: 7
+    num_candidates: 8
+    num_phases: 5
+    num_arm_roles: 4
+    num_proposal_modes: 6
+    planner_top_k: 4
+  reveal_head:
+    hidden_dim: 512
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    belief_map_size: 32
+    field_size: 16
+    num_heads: 8
+    predict_belief_map: true
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+  world_model:
+    hidden_dim: 512
+    action_dim: 14
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    field_size: 16
+    num_heads: 8
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+    belief_map_size: 32
+    predict_belief_map: true
+    scene_bank_size: 2
+    belief_bank_size: 2
+  planner:
+    hidden_dim: 512
+    num_candidates: 8
+    action_dim: 14
+    num_support_modes: 3
+    utility_margin: 0.1
+    num_heads: 8
+    num_layers: 2
+    num_phases: 5
+    num_arm_roles: 4
+    top_k: 4
+loss_weights:
+  action: 1.0
+  phase: 0.1
+  arm_role: 0.15
+  support_mode: 0.1
+  corridor: 0.15
+  persistence: 0.05
+  disturbance: 0.05
+  world_model: 0.2
+  belief: 0.05
+  visibility: 0.05
+  clearance: 0.05
+  support_stability: 0.05
+  reocclusion: 0.05
+  occluder_contact: 0.05
+  grasp_affordance: 0.05
+  planner_success: 0.25
+  planner_risk: 0.1
+  planner_ranking: 0.2
+  proposal_reconstruction: 0.1
+  proposal_success: 0.15
+  proposal_ranking: 0.2
+  proposal_diversity: 0.05
+  role_swap_consistency: 0.05

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/diagnostics_full/proxy_diagnostics.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "planner_top1_accuracy": 0.25396825396825395,
+  "planner_regret": 0.024764427915215492,
+  "planner_score_utility_spearman": 0.1904761791229248,
+  "risk_calibration_mse": 0.010364258661866188,
+  "role_collapse_rate": 0.0,
+  "proposal_diversity": 0.022177213802933693,
+  "left_right_equivariance_error": 0.0002942846322184778,
+  "belief_calibration_brier": 0.003581121563911438,
+  "reocclusion_calibration_brier": 0.23373088240623474,
+  "support_stability_mae": 0.022998232394456863,
+  "clearance_auc": 0.8989269585276155,
+  "memory_write_rate": 0.0,
+  "memory_saturation": 0.41934600472450256,
+  "num_samples": 126
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/metrics.json ADDED Viewed

	@@ -0,0 +1,230 @@

+[
+  {
+    "epoch": 0,
+    "train": {
+      "action": 0.025519870977400175,
+      "arm_role": 0.03451829462151253,
+      "belief": 0.11532339149432656,
+      "clearance": 0.09198410963122758,
+      "corridor": 0.27232400180664673,
+      "disturbance": 0.005858588227789626,
+      "grasp_affordance": 0.018751464233153464,
+      "occluder_contact": 0.21359099159065967,
+      "persistence": 5.231568055785678,
+      "phase": 0.7372311896678665,
+      "planner_ranking": 0.1646315749647481,
+      "planner_risk": 0.014348083711473067,
+      "planner_success": 0.6091769787029446,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.253575401780493,
+      "proposal_reconstruction": 0.067724266230904,
+      "proposal_success": 0.6851897648491785,
+      "reocclusion": 0.7031442959895309,
+      "role_swap_consistency": 0.00044027801038677857,
+      "support_mode": 0.7282283443430956,
+      "support_stability": 0.15459337279551627,
+      "total": 1.6319934494832424,
+      "uncertainty": 0.013496716971069097,
+      "visibility": 0.11563199924314833,
+      "world_model": 2.671503098223222
+    },
+    "val": {
+      "action": 0.020692157455616526,
+      "arm_role": 9.546122843554865e-05,
+      "belief": 0.09874132736807778,
+      "clearance": 0.08244451738539196,
+      "corridor": 0.2306106292775699,
+      "disturbance": 0.006118982125097694,
+      "grasp_affordance": 0.009981726739732992,
+      "occluder_contact": 0.19720953915800368,
+      "persistence": 3.8672617465730696,
+      "phase": 0.668701058815396,
+      "planner_ranking": 0.03794538755975072,
+      "planner_risk": 0.009814016923349026,
+      "planner_success": 0.5628143776030767,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1249213124078417,
+      "proposal_reconstruction": 0.06329423224642164,
+      "proposal_success": 0.6747160203873165,
+      "reocclusion": 0.692203164100647,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.6680677216204386,
+      "support_stability": 0.1511912994411966,
+      "total": 1.358805573175824,
+      "uncertainty": 0.003482046378185115,
+      "visibility": 0.10417925601913816,
+      "world_model": 2.1376701915074907
+    }
+  },
+  {
+    "epoch": 1,
+    "train": {
+      "action": 0.02150821143575988,
+      "arm_role": 1.9482293054071397e-05,
+      "belief": 0.09863162136280725,
+      "clearance": 0.08064276829400924,
+      "corridor": 0.24359133383210416,
+      "disturbance": 0.002735878452234476,
+      "grasp_affordance": 0.009349104797184779,
+      "occluder_contact": 0.1937003313558888,
+      "persistence": 4.076787073262699,
+      "phase": 0.6966290698625655,
+      "planner_ranking": 0.04271617977273956,
+      "planner_risk": 0.010049402082938681,
+      "planner_success": 0.5399472568359674,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1569982820156357,
+      "proposal_reconstruction": 0.06389496966962414,
+      "proposal_success": 0.6711133328407847,
+      "reocclusion": 0.6940537130957498,
+      "role_swap_consistency": 0.00022550253765151655,
+      "support_mode": 0.6837139029777487,
+      "support_stability": 0.14029162690160474,
+      "total": 1.3837347957476271,
+      "uncertainty": 0.0016494125736687157,
+      "visibility": 0.09400421737922424,
+      "world_model": 2.175609592991974
+    },
+    "val": {
+      "action": 0.020051477757829523,
+      "arm_role": 2.626385377793451e-06,
+      "belief": 0.09183884199176516,
+      "clearance": 0.07657587877105153,
+      "corridor": 0.22728621321065084,
+      "disturbance": 0.0016498260886850951,
+      "grasp_affordance": 0.009590831518705403,
+      "occluder_contact": 0.1917984854607355,
+      "persistence": 3.699212070495363,
+      "phase": 0.6689459842348856,
+      "planner_ranking": 0.03331218510795715,
+      "planner_risk": 0.010092773325076061,
+      "planner_success": 0.5014436940352122,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1606994933552213,
+      "proposal_reconstruction": 0.062439400820978104,
+      "proposal_success": 0.675733851061927,
+      "reocclusion": 0.6921006942552234,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.6564426545112853,
+      "support_stability": 0.14099458102432508,
+      "total": 1.313369631767273,
+      "uncertainty": 0.0024020517326240973,
+      "visibility": 0.08723713226971172,
+      "world_model": 2.0216772158940635
+    }
+  },
+  {
+    "epoch": 2,
+    "train": {
+      "action": 0.018980447901412845,
+      "arm_role": 2.3090714559505124e-05,
+      "belief": 0.1100015923263827,
+      "clearance": 0.0791148773262872,
+      "corridor": 0.23030528037001852,
+      "disturbance": 0.002447301701405857,
+      "grasp_affordance": 0.009001106255400087,
+      "occluder_contact": 0.21010415864552504,
+      "persistence": 2.0494745795430753,
+      "phase": 0.459073231482381,
+      "planner_ranking": 0.036845811475892686,
+      "planner_risk": 0.011261017404920885,
+      "planner_success": 0.5133467099741491,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1499755538570944,
+      "proposal_reconstruction": 0.062038555780318395,
+      "proposal_success": 0.6672172468370168,
+      "reocclusion": 0.41151915600825667,
+      "role_swap_consistency": 0.0007739521978125561,
+      "support_mode": 0.38595684411013936,
+      "support_stability": 0.1425538511912665,
+      "total": 1.1811942648513154,
+      "uncertainty": 0.000767841034371724,
+      "visibility": 0.10209987125315591,
+      "world_model": 2.070929214904446
+    },
+    "val": {
+      "action": 0.0138629823627453,
+      "arm_role": 0.002011558223822855,
+      "belief": 0.10340341582657799,
+      "clearance": 0.0855481999497565,
+      "corridor": 0.2235906974427284,
+      "disturbance": 0.0011637268657111797,
+      "grasp_affordance": 0.010592727485807642,
+      "occluder_contact": 0.20843842601965343,
+      "persistence": 1.1762515253254346,
+      "phase": 0.3442955078771486,
+      "planner_ranking": 0.03461442932137519,
+      "planner_risk": 0.01165175854065825,
+      "planner_success": 0.45808544967855724,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.3026971003365895,
+      "proposal_reconstruction": 0.05888378312663427,
+      "proposal_success": 0.7430036550476438,
+      "reocclusion": 0.2871374910076459,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.22473623181900215,
+      "support_stability": 0.1320991822414928,
+      "total": 1.1099917330439129,
+      "uncertainty": 0.0005805234163528352,
+      "visibility": 0.09557991185122067,
+      "world_model": 1.9994045325687952
+    }
+  },
+  {
+    "epoch": 3,
+    "train": {
+      "action": 0.014569098466314883,
+      "arm_role": 4.4951576212937916e-05,
+      "belief": 0.09620984569582015,
+      "clearance": 0.07538617284315106,
+      "corridor": 0.21248489566188775,
+      "disturbance": 0.0016758848629270635,
+      "grasp_affordance": 0.008272631588777167,
+      "occluder_contact": 0.19746327033529731,
+      "persistence": 1.1089699098374644,
+      "phase": 0.3716845961765469,
+      "planner_ranking": 0.03254403228879829,
+      "planner_risk": 0.010248634800575772,
+      "planner_success": 0.47941413580279074,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.153262345578658,
+      "proposal_reconstruction": 0.05860933205064055,
+      "proposal_success": 0.6466394141706496,
+      "reocclusion": 0.2566672772173989,
+      "role_swap_consistency": 0.0010398222479868085,
+      "support_mode": 0.21815690070546734,
+      "support_stability": 0.13650912478449145,
+      "total": 1.0633102330861914,
+      "uncertainty": 0.0002461711761398012,
+      "visibility": 0.09588275449984361,
+      "world_model": 1.9903733518111144
+    },
+    "val": {
+      "action": 0.01619998768474611,
+      "arm_role": 3.844006559777174e-06,
+      "belief": 0.09427393618084136,
+      "clearance": 0.07296533326780985,
+      "corridor": 0.2100035525148823,
+      "disturbance": 0.0013519242122204862,
+      "grasp_affordance": 0.007646961093303703,
+      "occluder_contact": 0.1950870676646157,
+      "persistence": 1.3894045449024628,
+      "phase": 0.6804814789192899,
+      "planner_ranking": 0.027768202883649677,
+      "planner_risk": 0.010219628483081044,
+      "planner_success": 0.4819766197885786,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1241777983922807,
+      "proposal_reconstruction": 0.060782825840370994,
+      "proposal_success": 0.6369421221907177,
+      "reocclusion": 0.27461627113913734,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.08716485598531093,
+      "support_stability": 0.13245442648610425,
+      "total": 1.0629130696493483,
+      "uncertainty": 8.45672577761145e-05,
+      "visibility": 0.1013997554306,
+      "world_model": 1.8573077273747278
+    }
+  }
+]

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/summary.json ADDED Viewed

	@@ -0,0 +1,557 @@

+{
+  "experiment_name": "proxy_interaction_r3d_stage1_clip_seed7",
+  "device": "cuda",
+  "best_checkpoint": "/workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed7/checkpoint_best.pt",
+  "final_train_total": 1.0633102330861914,
+  "final_val_total": 1.0629130696493483,
+  "train_time_sec": 174.85308933258057,
+  "peak_gpu_memory_mb": 1919.8251953125,
+  "num_train_samples": 382,
+  "num_val_samples": 126,
+  "planner_mode": "trainable",
+  "frozen_modules": [],
+  "init_info": {
+    "path": "/workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt",
+    "loaded_keys": 461,
+    "skipped_shape_mismatch_keys": [
+      "memory.gru.weight_ih_l0",
+      "memory.gru.weight_hh_l0",
+      "memory.gru.bias_ih_l0",
+      "memory.gru.bias_hh_l0",
+      "memory.token_proj.0.weight",
+      "memory.token_proj.0.bias",
+      "memory.token_proj.1.weight",
+      "memory.token_proj.1.bias",
+      "decoder.actor_role_bias",
+      "decoder.revealer_decoder.layers.0.self_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.0.self_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.0.self_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.0.self_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.0.multihead_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.0.multihead_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.0.multihead_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.0.multihead_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.0.linear1.weight",
+      "decoder.revealer_decoder.layers.0.linear1.bias",
+      "decoder.revealer_decoder.layers.0.linear2.weight",
+      "decoder.revealer_decoder.layers.0.linear2.bias",
+      "decoder.revealer_decoder.layers.0.norm1.weight",
+      "decoder.revealer_decoder.layers.0.norm1.bias",
+      "decoder.revealer_decoder.layers.0.norm2.weight",
+      "decoder.revealer_decoder.layers.0.norm2.bias",
+      "decoder.revealer_decoder.layers.0.norm3.weight",
+      "decoder.revealer_decoder.layers.0.norm3.bias",
+      "decoder.revealer_decoder.layers.1.self_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.1.self_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.1.self_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.1.self_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.1.multihead_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.1.multihead_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.1.multihead_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.1.multihead_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.1.linear1.weight",
+      "decoder.revealer_decoder.layers.1.linear1.bias",
+      "decoder.revealer_decoder.layers.1.linear2.weight",
+      "decoder.revealer_decoder.layers.1.linear2.bias",
+      "decoder.revealer_decoder.layers.1.norm1.weight",
+      "decoder.revealer_decoder.layers.1.norm1.bias",
+      "decoder.revealer_decoder.layers.1.norm2.weight",
+      "decoder.revealer_decoder.layers.1.norm2.bias",
+      "decoder.revealer_decoder.layers.1.norm3.weight",
+      "decoder.revealer_decoder.layers.1.norm3.bias",
+      "decoder.revealer_decoder.layers.2.self_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.2.self_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.2.self_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.2.self_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.2.multihead_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.2.multihead_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.2.multihead_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.2.multihead_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.2.linear1.weight",
+      "decoder.revealer_decoder.layers.2.linear1.bias",
+      "decoder.revealer_decoder.layers.2.linear2.weight",
+      "decoder.revealer_decoder.layers.2.linear2.bias",
+      "decoder.revealer_decoder.layers.2.norm1.weight",
+      "decoder.revealer_decoder.layers.2.norm1.bias",
+      "decoder.revealer_decoder.layers.2.norm2.weight",
+      "decoder.revealer_decoder.layers.2.norm2.bias",
+      "decoder.revealer_decoder.layers.2.norm3.weight",
+      "decoder.revealer_decoder.layers.2.norm3.bias",
+      "decoder.revealer_decoder.layers.3.self_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.3.self_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.3.self_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.3.self_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.3.multihead_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.3.multihead_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.3.multihead_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.3.multihead_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.3.linear1.weight",
+      "decoder.revealer_decoder.layers.3.linear1.bias",
+      "decoder.revealer_decoder.layers.3.linear2.weight",
+      "decoder.revealer_decoder.layers.3.linear2.bias",
+      "decoder.revealer_decoder.layers.3.norm1.weight",
+      "decoder.revealer_decoder.layers.3.norm1.bias",
+      "decoder.revealer_decoder.layers.3.norm2.weight",
+      "decoder.revealer_decoder.layers.3.norm2.bias",
+      "decoder.revealer_decoder.layers.3.norm3.weight",
+      "decoder.revealer_decoder.layers.3.norm3.bias",
+      "decoder.actor_decoder.layers.0.self_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.0.self_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.0.self_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.0.self_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.0.multihead_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.0.multihead_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.0.multihead_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.0.multihead_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.0.linear1.weight",
+      "decoder.actor_decoder.layers.0.linear1.bias",
+      "decoder.actor_decoder.layers.0.linear2.weight",
+      "decoder.actor_decoder.layers.0.linear2.bias",
+      "decoder.actor_decoder.layers.0.norm1.weight",
+      "decoder.actor_decoder.layers.0.norm1.bias",
+      "decoder.actor_decoder.layers.0.norm2.weight",
+      "decoder.actor_decoder.layers.0.norm2.bias",
+      "decoder.actor_decoder.layers.0.norm3.weight",
+      "decoder.actor_decoder.layers.0.norm3.bias",
+      "decoder.actor_decoder.layers.1.self_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.1.self_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.1.self_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.1.self_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.1.multihead_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.1.multihead_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.1.multihead_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.1.multihead_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.1.linear1.weight",
+      "decoder.actor_decoder.layers.1.linear1.bias",
+      "decoder.actor_decoder.layers.1.linear2.weight",
+      "decoder.actor_decoder.layers.1.linear2.bias",
+      "decoder.actor_decoder.layers.1.norm1.weight",
+      "decoder.actor_decoder.layers.1.norm1.bias",
+      "decoder.actor_decoder.layers.1.norm2.weight",
+      "decoder.actor_decoder.layers.1.norm2.bias",
+      "decoder.actor_decoder.layers.1.norm3.weight",
+      "decoder.actor_decoder.layers.1.norm3.bias",
+      "decoder.actor_decoder.layers.2.self_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.2.self_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.2.self_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.2.self_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.2.multihead_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.2.multihead_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.2.multihead_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.2.multihead_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.2.linear1.weight",
+      "decoder.actor_decoder.layers.2.linear1.bias",
+      "decoder.actor_decoder.layers.2.linear2.weight",
+      "decoder.actor_decoder.layers.2.linear2.bias",
+      "decoder.actor_decoder.layers.2.norm1.weight",
+      "decoder.actor_decoder.layers.2.norm1.bias",
+      "decoder.actor_decoder.layers.2.norm2.weight",
+      "decoder.actor_decoder.layers.2.norm2.bias",
+      "decoder.actor_decoder.layers.2.norm3.weight",
+      "decoder.actor_decoder.layers.2.norm3.bias",
+      "decoder.actor_decoder.layers.3.self_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.3.self_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.3.self_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.3.self_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.3.multihead_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.3.multihead_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.3.multihead_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.3.multihead_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.3.linear1.weight",
+      "decoder.actor_decoder.layers.3.linear1.bias",
+      "decoder.actor_decoder.layers.3.linear2.weight",
+      "decoder.actor_decoder.layers.3.linear2.bias",
+      "decoder.actor_decoder.layers.3.norm1.weight",
+      "decoder.actor_decoder.layers.3.norm1.bias",
+      "decoder.actor_decoder.layers.3.norm2.weight",
+      "decoder.actor_decoder.layers.3.norm2.bias",
+      "decoder.actor_decoder.layers.3.norm3.weight",
+      "decoder.actor_decoder.layers.3.norm3.bias",
+      "decoder.revealer_mean.weight",
+      "decoder.revealer_mean.bias",
+      "decoder.revealer_log_std.weight",
+      "decoder.revealer_log_std.bias",
+      "decoder.actor_mean.weight",
+      "decoder.actor_mean.bias",
+      "decoder.actor_log_std.weight",
+      "decoder.actor_log_std.bias",
+      "decoder.proposal_score.0.weight",
+      "decoder.proposal_score.0.bias",
+      "decoder.proposal_score.1.weight",
+      "decoder.proposal_score.1.bias"
+    ],
+    "missing_keys": [
+      "backbone.depth_adapter.depth_proj.0.weight",
+      "backbone.depth_adapter.depth_proj.0.bias",
+      "backbone.depth_adapter.depth_proj.1.weight",
+      "backbone.depth_adapter.depth_proj.1.bias",
+      "backbone.depth_adapter.depth_proj.3.weight",
+      "backbone.depth_adapter.depth_proj.3.bias",
+      "backbone.depth_adapter.geometry_proj.0.weight",
+      "backbone.depth_adapter.geometry_proj.0.bias",
+      "backbone.depth_adapter.geometry_proj.1.weight",
+      "backbone.depth_adapter.geometry_proj.1.bias",
+      "backbone.depth_adapter.camera_proj.0.weight",
+      "backbone.depth_adapter.camera_proj.0.bias",
+      "backbone.depth_adapter.camera_proj.1.weight",
+      "backbone.depth_adapter.camera_proj.1.bias",
+      "fusion.geometry_fusion.attn.in_proj_weight",
+      "fusion.geometry_fusion.attn.in_proj_bias",
+      "fusion.geometry_fusion.attn.out_proj.weight",
+      "fusion.geometry_fusion.attn.out_proj.bias",
+      "fusion.geometry_fusion.gate.0.weight",
+      "fusion.geometry_fusion.gate.0.bias",
+      "fusion.geometry_fusion.gate.1.weight",
+      "fusion.geometry_fusion.gate.1.bias",
+      "fusion.geometry_fusion.gate.3.weight",
+      "fusion.geometry_fusion.gate.3.bias",
+      "fusion.geometry_fusion.out.0.weight",
+      "fusion.geometry_fusion.out.0.bias",
+      "fusion.geometry_fusion.out.1.weight",
+      "fusion.geometry_fusion.out.1.bias",
+      "memory.scene_memory.position_embedding",
+      "memory.scene_memory.bank_queries",
+      "memory.scene_memory.sequence_encoder.layers.0.self_attn.in_proj_weight",
+      "memory.scene_memory.sequence_encoder.layers.0.self_attn.in_proj_bias",
+      "memory.scene_memory.sequence_encoder.layers.0.self_attn.out_proj.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.self_attn.out_proj.bias",
+      "memory.scene_memory.sequence_encoder.layers.0.linear1.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.linear1.bias",
+      "memory.scene_memory.sequence_encoder.layers.0.linear2.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.linear2.bias",
+      "memory.scene_memory.sequence_encoder.layers.0.norm1.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.norm1.bias",
+      "memory.scene_memory.sequence_encoder.layers.0.norm2.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.norm2.bias",
+      "memory.scene_memory.bank_attention.in_proj_weight",
+      "memory.scene_memory.bank_attention.in_proj_bias",
+      "memory.scene_memory.bank_attention.out_proj.weight",
+      "memory.scene_memory.bank_attention.out_proj.bias",
+      "memory.scene_memory.action_proj.0.weight",
+      "memory.scene_memory.action_proj.0.bias",
+      "memory.scene_memory.action_proj.1.weight",
+      "memory.scene_memory.action_proj.1.bias",
+      "memory.scene_memory.write_gate.0.weight",
+      "memory.scene_memory.write_gate.0.bias",
+      "memory.scene_memory.write_gate.1.weight",
+      "memory.scene_memory.write_gate.1.bias",
+      "memory.scene_memory.write_gate.3.weight",
+      "memory.scene_memory.write_gate.3.bias",
+      "memory.scene_memory.token_proj.0.weight",
+      "memory.scene_memory.token_proj.0.bias",
+      "memory.scene_memory.token_proj.1.weight",
+      "memory.scene_memory.token_proj.1.bias",
+      "memory.belief_memory.position_embedding",
+      "memory.belief_memory.bank_queries",
+      "memory.belief_memory.sequence_encoder.layers.0.self_attn.in_proj_weight",
+      "memory.belief_memory.sequence_encoder.layers.0.self_attn.in_proj_bias",
+      "memory.belief_memory.sequence_encoder.layers.0.self_attn.out_proj.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.self_attn.out_proj.bias",
+      "memory.belief_memory.sequence_encoder.layers.0.linear1.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.linear1.bias",
+      "memory.belief_memory.sequence_encoder.layers.0.linear2.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.linear2.bias",
+      "memory.belief_memory.sequence_encoder.layers.0.norm1.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.norm1.bias",
+      "memory.belief_memory.sequence_encoder.layers.0.norm2.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.norm2.bias",
+      "memory.belief_memory.bank_attention.in_proj_weight",
+      "memory.belief_memory.bank_attention.in_proj_bias",
+      "memory.belief_memory.bank_attention.out_proj.weight",
+      "memory.belief_memory.bank_attention.out_proj.bias",
+      "memory.belief_memory.action_proj.0.weight",
+      "memory.belief_memory.action_proj.0.bias",
+      "memory.belief_memory.action_proj.1.weight",
+      "memory.belief_memory.action_proj.1.bias",
+      "memory.belief_memory.write_gate.0.weight",
+      "memory.belief_memory.write_gate.0.bias",
+      "memory.belief_memory.write_gate.1.weight",
+      "memory.belief_memory.write_gate.1.bias",
+      "memory.belief_memory.write_gate.3.weight",
+      "memory.belief_memory.write_gate.3.bias",
+      "memory.belief_memory.token_proj.0.weight",
+      "memory.belief_memory.token_proj.0.bias",
+      "memory.belief_memory.token_proj.1.weight",
+      "memory.belief_memory.token_proj.1.bias",
+      "decoder.arm_decoder.layers.0.self_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.0.self_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.0.self_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.0.self_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.0.multihead_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.0.multihead_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.0.multihead_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.0.multihead_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.0.linear1.weight",
+      "decoder.arm_decoder.layers.0.linear1.bias",
+      "decoder.arm_decoder.layers.0.linear2.weight",
+      "decoder.arm_decoder.layers.0.linear2.bias",
+      "decoder.arm_decoder.layers.0.norm1.weight",
+      "decoder.arm_decoder.layers.0.norm1.bias",
+      "decoder.arm_decoder.layers.0.norm2.weight",
+      "decoder.arm_decoder.layers.0.norm2.bias",
+      "decoder.arm_decoder.layers.0.norm3.weight",
+      "decoder.arm_decoder.layers.0.norm3.bias",
+      "decoder.arm_decoder.layers.1.self_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.1.self_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.1.self_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.1.self_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.1.multihead_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.1.multihead_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.1.multihead_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.1.multihead_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.1.linear1.weight",
+      "decoder.arm_decoder.layers.1.linear1.bias",
+      "decoder.arm_decoder.layers.1.linear2.weight",
+      "decoder.arm_decoder.layers.1.linear2.bias",
+      "decoder.arm_decoder.layers.1.norm1.weight",
+      "decoder.arm_decoder.layers.1.norm1.bias",
+      "decoder.arm_decoder.layers.1.norm2.weight",
+      "decoder.arm_decoder.layers.1.norm2.bias",
+      "decoder.arm_decoder.layers.1.norm3.weight",
+      "decoder.arm_decoder.layers.1.norm3.bias",
+      "decoder.arm_decoder.layers.2.self_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.2.self_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.2.self_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.2.self_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.2.multihead_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.2.multihead_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.2.multihead_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.2.multihead_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.2.linear1.weight",
+      "decoder.arm_decoder.layers.2.linear1.bias",
+      "decoder.arm_decoder.layers.2.linear2.weight",
+      "decoder.arm_decoder.layers.2.linear2.bias",
+      "decoder.arm_decoder.layers.2.norm1.weight",
+      "decoder.arm_decoder.layers.2.norm1.bias",
+      "decoder.arm_decoder.layers.2.norm2.weight",
+      "decoder.arm_decoder.layers.2.norm2.bias",
+      "decoder.arm_decoder.layers.2.norm3.weight",
+      "decoder.arm_decoder.layers.2.norm3.bias",
+      "decoder.arm_decoder.layers.3.self_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.3.self_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.3.self_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.3.self_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.3.multihead_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.3.multihead_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.3.multihead_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.3.multihead_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.3.linear1.weight",
+      "decoder.arm_decoder.layers.3.linear1.bias",
+      "decoder.arm_decoder.layers.3.linear2.weight",
+      "decoder.arm_decoder.layers.3.linear2.bias",
+      "decoder.arm_decoder.layers.3.norm1.weight",
+      "decoder.arm_decoder.layers.3.norm1.bias",
+      "decoder.arm_decoder.layers.3.norm2.weight",
+      "decoder.arm_decoder.layers.3.norm2.bias",
+      "decoder.arm_decoder.layers.3.norm3.weight",
+      "decoder.arm_decoder.layers.3.norm3.bias",
+      "decoder.arm_identity.weight",
+      "decoder.phase_adapter.weight",
+      "decoder.phase_adapter.bias",
+      "decoder.role_adapter.weight",
+      "decoder.role_adapter.bias",
+      "decoder.context_proj.0.weight",
+      "decoder.context_proj.0.bias",
+      "decoder.context_proj.1.weight",
+      "decoder.context_proj.1.bias",
+      "decoder.arm_head.0.weight",
+      "decoder.arm_head.0.bias",
+      "decoder.arm_head.1.weight",
+      "decoder.arm_head.1.bias",
+      "decoder.arm_mean.weight",
+      "decoder.arm_mean.bias",
+      "decoder.arm_log_std.weight",
+      "decoder.arm_log_std.bias",
+      "decoder.proposal_mode_head.0.weight",
+      "decoder.proposal_mode_head.0.bias",
+      "decoder.proposal_mode_head.1.weight",
+      "decoder.proposal_mode_head.1.bias",
+      "decoder.proposal_mode_head.3.weight",
+      "decoder.proposal_mode_head.3.bias",
+      "decoder.proposal_mode_embeddings.weight",
+      "decoder.proposal_slot_embeddings.weight",
+      "decoder.mode_residual_heads.0.0.weight",
+      "decoder.mode_residual_heads.0.0.bias",
+      "decoder.mode_residual_heads.0.1.weight",
+      "decoder.mode_residual_heads.0.1.bias",
+      "decoder.mode_residual_heads.0.3.weight",
+      "decoder.mode_residual_heads.0.3.bias",
+      "decoder.mode_residual_heads.1.0.weight",
+      "decoder.mode_residual_heads.1.0.bias",
+      "decoder.mode_residual_heads.1.1.weight",
+      "decoder.mode_residual_heads.1.1.bias",
+      "decoder.mode_residual_heads.1.3.weight",
+      "decoder.mode_residual_heads.1.3.bias",
+      "decoder.mode_residual_heads.2.0.weight",
+      "decoder.mode_residual_heads.2.0.bias",
+      "decoder.mode_residual_heads.2.1.weight",
+      "decoder.mode_residual_heads.2.1.bias",
+      "decoder.mode_residual_heads.2.3.weight",
+      "decoder.mode_residual_heads.2.3.bias",
+      "decoder.mode_residual_heads.3.0.weight",
+      "decoder.mode_residual_heads.3.0.bias",
+      "decoder.mode_residual_heads.3.1.weight",
+      "decoder.mode_residual_heads.3.1.bias",
+      "decoder.mode_residual_heads.3.3.weight",
+      "decoder.mode_residual_heads.3.3.bias",
+      "decoder.mode_residual_heads.4.0.weight",
+      "decoder.mode_residual_heads.4.0.bias",
+      "decoder.mode_residual_heads.4.1.weight",
+      "decoder.mode_residual_heads.4.1.bias",
+      "decoder.mode_residual_heads.4.3.weight",
+      "decoder.mode_residual_heads.4.3.bias",
+      "decoder.mode_residual_heads.5.0.weight",
+      "decoder.mode_residual_heads.5.0.bias",
+      "decoder.mode_residual_heads.5.1.weight",
+      "decoder.mode_residual_heads.5.1.bias",
+      "decoder.mode_residual_heads.5.3.weight",
+      "decoder.mode_residual_heads.5.3.bias",
+      "decoder.slot_delta.0.weight",
+      "decoder.slot_delta.0.bias",
+      "decoder.slot_delta.1.weight",
+      "decoder.slot_delta.1.bias",
+      "decoder.slot_delta.3.weight",
+      "decoder.slot_delta.3.bias",
+      "decoder.proposal_score.0.weight",
+      "decoder.proposal_score.0.bias",
+      "decoder.proposal_score.1.weight",
+      "decoder.proposal_score.1.bias",
+      "decoder.proposal_score.3.weight",
+      "decoder.proposal_score.3.bias",
+      "elastic_state_head.interaction_queries",
+      "elastic_state_head.interaction_attention.in_proj_weight",
+      "elastic_state_head.interaction_attention.in_proj_bias",
+      "elastic_state_head.interaction_attention.out_proj.weight",
+      "elastic_state_head.interaction_attention.out_proj.bias",
+      "elastic_state_head.interaction_mlp.0.weight",
+      "elastic_state_head.interaction_mlp.0.bias",
+      "elastic_state_head.interaction_mlp.1.weight",
+      "elastic_state_head.interaction_mlp.1.bias",
+      "elastic_state_head.interaction_mlp.3.weight",
+      "elastic_state_head.interaction_mlp.3.bias",
+      "elastic_state_head.decoder.field_queries",
+      "elastic_state_head.decoder.field_attention.in_proj_weight",
+      "elastic_state_head.decoder.field_attention.in_proj_bias",
+      "elastic_state_head.decoder.field_attention.out_proj.weight",
+      "elastic_state_head.decoder.field_attention.out_proj.bias",
+      "elastic_state_head.decoder.field_mlp.0.weight",
+      "elastic_state_head.decoder.field_mlp.0.bias",
+      "elastic_state_head.decoder.field_mlp.1.weight",
+      "elastic_state_head.decoder.field_mlp.1.bias",
+      "elastic_state_head.decoder.field_mlp.3.weight",
+      "elastic_state_head.decoder.field_mlp.3.bias",
+      "elastic_state_head.decoder.summary_proj.0.weight",
+      "elastic_state_head.decoder.summary_proj.0.bias",
+      "elastic_state_head.decoder.summary_proj.1.weight",
+      "elastic_state_head.decoder.summary_proj.1.bias",
+      "elastic_state_head.decoder.phase_head.0.weight",
+      "elastic_state_head.decoder.phase_head.0.bias",
+      "elastic_state_head.decoder.phase_head.1.weight",
+      "elastic_state_head.decoder.phase_head.1.bias",
+      "elastic_state_head.decoder.phase_head.3.weight",
+      "elastic_state_head.decoder.phase_head.3.bias",
+      "elastic_state_head.decoder.arm_role_head.0.weight",
+      "elastic_state_head.decoder.arm_role_head.0.bias",
+      "elastic_state_head.decoder.arm_role_head.1.weight",
+      "elastic_state_head.decoder.arm_role_head.1.bias",
+      "elastic_state_head.decoder.arm_role_head.3.weight",
+      "elastic_state_head.decoder.arm_role_head.3.bias",
+      "elastic_state_head.decoder.arm_identity.weight",
+      "elastic_state_head.decoder.support_mode.0.weight",
+      "elastic_state_head.decoder.support_mode.0.bias",
+      "elastic_state_head.decoder.support_mode.1.weight",
+      "elastic_state_head.decoder.support_mode.1.bias",
+      "elastic_state_head.decoder.support_mode.3.weight",
+      "elastic_state_head.decoder.support_mode.3.bias",
+      "elastic_state_head.decoder.access_field.weight",
+      "elastic_state_head.decoder.access_field.bias",
+      "elastic_state_head.decoder.target_belief_field.weight",
+      "elastic_state_head.decoder.target_belief_field.bias",
+      "elastic_state_head.decoder.visibility_field.weight",
+      "elastic_state_head.decoder.visibility_field.bias",
+      "elastic_state_head.decoder.clearance_field.weight",
+      "elastic_state_head.decoder.clearance_field.bias",
+      "elastic_state_head.decoder.occluder_contact_field.weight",
+      "elastic_state_head.decoder.occluder_contact_field.bias",
+      "elastic_state_head.decoder.grasp_affordance_field.weight",
+      "elastic_state_head.decoder.grasp_affordance_field.bias",
+      "elastic_state_head.decoder.support_stability_field.weight",
+      "elastic_state_head.decoder.support_stability_field.bias",
+      "elastic_state_head.decoder.persistence_field.weight",
+      "elastic_state_head.decoder.persistence_field.bias",
+      "elastic_state_head.decoder.reocclusion_field.weight",
+      "elastic_state_head.decoder.reocclusion_field.bias",
+      "elastic_state_head.decoder.disturbance_field.weight",
+      "elastic_state_head.decoder.disturbance_field.bias",
+      "elastic_state_head.decoder.uncertainty_field.weight",
+      "elastic_state_head.decoder.uncertainty_field.bias",
+      "elastic_state_head.decoder.reocclusion_head.0.weight",
+      "elastic_state_head.decoder.reocclusion_head.0.bias",
+      "elastic_state_head.decoder.reocclusion_head.1.weight",
+      "elastic_state_head.decoder.reocclusion_head.1.bias",
+      "elastic_state_head.decoder.reocclusion_head.3.weight",
+      "elastic_state_head.decoder.reocclusion_head.3.bias",
+      "world_model.state_encoder.0.weight",
+      "world_model.state_encoder.0.bias",
+      "world_model.state_encoder.1.weight",
+      "world_model.state_encoder.1.bias",
+      "world_model.scene_memory_proj.0.weight",
+      "world_model.scene_memory_proj.0.bias",
+      "world_model.scene_memory_proj.1.weight",
+      "world_model.scene_memory_proj.1.bias",
+      "world_model.belief_memory_proj.0.weight",
+      "world_model.belief_memory_proj.0.bias",
+      "world_model.belief_memory_proj.1.weight",
+      "world_model.belief_memory_proj.1.bias",
+      "world_model.action_encoder.0.weight",
+      "world_model.action_encoder.0.bias",
+      "world_model.action_encoder.1.weight",
+      "world_model.action_encoder.1.bias",
+      "world_model.transition.weight_ih",
+      "world_model.transition.weight_hh",
+      "world_model.transition.bias_ih",
+      "world_model.transition.bias_hh",
+      "world_model.scene_memory_update.weight",
+      "world_model.scene_memory_update.bias",
+      "world_model.belief_memory_update.weight",
+      "world_model.belief_memory_update.bias",
+      "world_model.compact_decoder.weight",
+      "world_model.compact_decoder.bias",
+      "world_model.target_belief_head.weight",
+      "world_model.target_belief_head.bias",
+      "world_model.visibility_head.weight",
+      "world_model.visibility_head.bias",
+      "world_model.clearance_head.weight",
+      "world_model.clearance_head.bias",
+      "world_model.occluder_contact_head.weight",
+      "world_model.occluder_contact_head.bias",
+      "world_model.grasp_affordance_head.weight",
+      "world_model.grasp_affordance_head.bias",
+      "world_model.support_stability_head.weight",
+      "world_model.support_stability_head.bias",
+      "world_model.persistence_head.weight",
+      "world_model.persistence_head.bias",
+      "world_model.reocclusion_head.weight",
+      "world_model.reocclusion_head.bias",
+      "world_model.disturbance_head.weight",
+      "world_model.disturbance_head.bias",
+      "world_model.uncertainty_head.weight",
+      "world_model.uncertainty_head.bias",
+      "world_model.access_head.weight",
+      "world_model.access_head.bias",
+      "planner.residual.trunk.0.weight",
+      "planner.residual.trunk.0.bias",
+      "planner.residual.trunk.1.weight",
+      "planner.residual.trunk.1.bias",
+      "planner.residual.trunk.3.weight",
+      "planner.residual.trunk.3.bias",
+      "planner.residual.success_head.weight",
+      "planner.residual.success_head.bias",
+      "planner.residual.risk_head.weight",
+      "planner.residual.risk_head.bias",
+      "planner.residual.residual_head.weight",
+      "planner.residual.residual_head.bias"
+    ],
+    "unexpected_keys": []
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/benchmark_full/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "full": {
+    "per_task_success": {
+      "foliage_proxy": 0.4166666666666667,
+      "bag_proxy": 0.5833333333333334,
+      "cloth_proxy": 0.6666666666666666
+    },
+    "mean_success": 0.5555555555555555,
+    "visibility_integral": 31.92372977733612,
+    "corridor_availability": 0.8500884034567409,
+    "reocclusion_rate": 0.029287114566719827,
+    "persistence_horizon_mae": 0.894922278028389,
+    "disturbance_cost": 0.28616168903600836
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/benchmark_full/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## full
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/checkpoint_best.pt
+- mean_success: 0.556
+- visibility_integral: 31.924
+- corridor_availability: 0.850
+- reocclusion_rate: 0.029
+- persistence_horizon_mae: 0.895
+- disturbance_cost: 0.286
+- foliage_proxy_success: 0.417
+- bag_proxy_success: 0.583
+- cloth_proxy_success: 0.667

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/config_resolved.yaml ADDED Viewed

	@@ -0,0 +1,149 @@

+experiment_name: proxy_interaction_r3d_stage1_clip_seed8
+output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
+device: cuda
+seed: 8
+init_checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt
+init_strict: false
+data:
+  proxies:
+  - foliage_proxy
+  - bag_proxy
+  - cloth_proxy
+  resolution: 224
+  dataset_version: reveal_proxy_v6_rgbd_elastic_state
+  train_episodes_per_proxy: 48
+  val_episodes_per_proxy: 16
+  train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_clip224_v6_rgbd_stage1_seed8.pt
+  val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_clip224_v6_rgbd_stage1_seed8.pt
+  rebuild_dataset: false
+  chunk_horizon: 8
+  rollout_horizon: 5
+  history_steps: 6
+  planner_candidates: 8
+  seed: 8
+optim:
+  epochs: 4
+  batch_size: 2
+  num_workers: 4
+  lr: 0.0003
+  weight_decay: 0.0001
+trainer:
+  policy_type: elastic_reveal
+  use_bf16: true
+  grad_clip_norm: 1.0
+  freeze_backbone: true
+  gradient_checkpointing: false
+  plan_during_train: true
+  plan_during_eval: true
+  support_mode_conditioning: true
+  planner_mode: trainable
+  use_depth: false
+  use_world_model: true
+  use_role_tokens: true
+  compute_equivariance_probe: true
+policy:
+  backbone:
+    model_name: openai/clip-vit-base-patch32
+    hidden_dim: 512
+    max_text_tokens: 32
+    freeze_backbone: true
+    gradient_checkpointing: false
+    use_dummy_backbone: false
+  fusion:
+    hidden_dim: 512
+    num_cameras: 3
+    num_layers: 4
+    num_heads: 8
+    ff_dim: 2048
+    dropout: 0.1
+    proprio_dim: 32
+    proprio_tokens: 1
+  memory:
+    hidden_dim: 512
+    action_dim: 14
+    history_steps: 6
+    scene_history_steps: 3
+    belief_history_steps: 8
+    num_layers: 2
+    dropout: 0.1
+    memory_bank_size: 4
+    scene_bank_size: 2
+    belief_bank_size: 2
+    num_heads: 8
+    max_history_steps: 8
+  decoder:
+    hidden_dim: 512
+    num_heads: 8
+    num_layers: 4
+    ff_dim: 2048
+    dropout: 0.1
+    chunk_size: 8
+    action_dim: 14
+    arm_action_dim: 7
+    num_candidates: 8
+    num_phases: 5
+    num_arm_roles: 4
+    num_proposal_modes: 6
+    planner_top_k: 4
+  reveal_head:
+    hidden_dim: 512
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    belief_map_size: 32
+    field_size: 16
+    num_heads: 8
+    predict_belief_map: true
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+  world_model:
+    hidden_dim: 512
+    action_dim: 14
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    field_size: 16
+    num_heads: 8
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+    belief_map_size: 32
+    predict_belief_map: true
+    scene_bank_size: 2
+    belief_bank_size: 2
+  planner:
+    hidden_dim: 512
+    num_candidates: 8
+    action_dim: 14
+    num_support_modes: 3
+    utility_margin: 0.1
+    num_heads: 8
+    num_layers: 2
+    num_phases: 5
+    num_arm_roles: 4
+    top_k: 4
+loss_weights:
+  action: 1.0
+  phase: 0.1
+  arm_role: 0.15
+  support_mode: 0.1
+  corridor: 0.15
+  persistence: 0.05
+  disturbance: 0.05
+  world_model: 0.2
+  belief: 0.05
+  visibility: 0.05
+  clearance: 0.05
+  support_stability: 0.05
+  reocclusion: 0.05
+  occluder_contact: 0.05
+  grasp_affordance: 0.05
+  planner_success: 0.25
+  planner_risk: 0.1
+  planner_ranking: 0.2
+  proposal_reconstruction: 0.1
+  proposal_success: 0.15
+  proposal_ranking: 0.2
+  proposal_diversity: 0.05
+  role_swap_consistency: 0.05

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/diagnostics_full/proxy_diagnostics.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "planner_top1_accuracy": 0.25984251968503935,
+  "planner_regret": 0.024652592837810516,
+  "planner_score_utility_spearman": 0.15748029947280884,
+  "risk_calibration_mse": 0.010109159164130688,
+  "role_collapse_rate": 0.0,
+  "proposal_diversity": 0.02039325051009655,
+  "left_right_equivariance_error": 8.317838273796951e-05,
+  "belief_calibration_brier": 0.0039802417159080505,
+  "reocclusion_calibration_brier": 0.2667863667011261,
+  "support_stability_mae": 0.023258011788129807,
+  "clearance_auc": 0.9407927438472715,
+  "memory_write_rate": 0.0,
+  "memory_saturation": 0.5879086852073669,
+  "num_samples": 127
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/metrics.json ADDED Viewed

	@@ -0,0 +1,230 @@

+[
+  {
+    "epoch": 0,
+    "train": {
+      "action": 0.025799189747862168,
+      "arm_role": 0.027215735138398815,
+      "belief": 0.11522909954034222,
+      "clearance": 0.09597517975181809,
+      "corridor": 0.3045216482132673,
+      "disturbance": 0.006567074132739083,
+      "grasp_affordance": 0.02625927054055074,
+      "occluder_contact": 0.2161167692295544,
+      "persistence": 7.305491891831004,
+      "phase": 0.7473598300474477,
+      "planner_ranking": 0.14102927445574143,
+      "planner_risk": 0.014660530898254365,
+      "planner_success": 0.596433128830026,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.26868818193206,
+      "proposal_reconstruction": 0.06815405646387819,
+      "proposal_success": 0.6748700912710259,
+      "reocclusion": 0.7006335564308765,
+      "role_swap_consistency": 0.0005011227108655176,
+      "support_mode": 0.7077700629908377,
+      "support_stability": 0.1599257462645798,
+      "total": 1.733834327203441,
+      "uncertainty": 0.022427979406115357,
+      "visibility": 0.11316451830155562,
+      "world_model": 2.674901399312843
+    },
+    "val": {
+      "action": 0.02199536032276228,
+      "arm_role": 9.8040056428772e-06,
+      "belief": 0.0978035525768064,
+      "clearance": 0.07755720446584746,
+      "corridor": 0.24431297194678336,
+      "disturbance": 0.0019795258613157785,
+      "grasp_affordance": 0.008650467454572208,
+      "occluder_contact": 0.20205649081617594,
+      "persistence": 4.437129996716976,
+      "phase": 0.6695621414110065,
+      "planner_ranking": 0.04436381870164041,
+      "planner_risk": 0.010196975797498453,
+      "planner_success": 0.5646271030418575,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1638631131500006,
+      "proposal_reconstruction": 0.06484090705635026,
+      "proposal_success": 0.6649224627763033,
+      "reocclusion": 0.7438069470226765,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.673728191293776,
+      "support_stability": 0.13629821891663596,
+      "total": 1.4150245506316423,
+      "uncertainty": 0.002036258225416532,
+      "visibility": 0.09110353700816631,
+      "world_model": 2.210838695988059
+    }
+  },
+  {
+    "epoch": 1,
+    "train": {
+      "action": 0.02220674532499769,
+      "arm_role": 4.0168849585568094e-05,
+      "belief": 0.10375202887969491,
+      "clearance": 0.08468958432176663,
+      "corridor": 0.24882320250282114,
+      "disturbance": 0.002981857188692701,
+      "grasp_affordance": 0.00994103324857994,
+      "occluder_contact": 0.20824503820604054,
+      "persistence": 4.263324179262391,
+      "phase": 0.7222360341336714,
+      "planner_ranking": 0.044953017053952174,
+      "planner_risk": 0.010661984013600143,
+      "planner_success": 0.5370719069273684,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1506784087076236,
+      "proposal_reconstruction": 0.06470025059674422,
+      "proposal_success": 0.6748968515720667,
+      "reocclusion": 0.7042920837539652,
+      "role_swap_consistency": 0.00024932249915769023,
+      "support_mode": 0.6881518938154451,
+      "support_stability": 0.1487102357972979,
+      "total": 1.3995415040959862,
+      "uncertainty": 0.0019858729011069556,
+      "visibility": 0.09729615078156531,
+      "world_model": 2.178037493952906
+    },
+    "val": {
+      "action": 0.029678026388864964,
+      "arm_role": 0.0003116108114227245,
+      "belief": 0.10797233448829502,
+      "clearance": 0.08150003047194332,
+      "corridor": 0.2509052273235284,
+      "disturbance": 0.002103368451003007,
+      "grasp_affordance": 0.008963905274868011,
+      "occluder_contact": 0.2007133779115975,
+      "persistence": 4.478599248453975,
+      "phase": 0.7040554136037827,
+      "planner_ranking": 0.03813048706929578,
+      "planner_risk": 0.01057393318569666,
+      "planner_success": 0.5217722351662815,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1685641314834356,
+      "proposal_reconstruction": 0.07131227233912796,
+      "proposal_success": 0.6757729910314083,
+      "reocclusion": 0.6976062525063753,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.7273222031071782,
+      "support_stability": 0.1463006478443276,
+      "total": 1.3876731358468533,
+      "uncertainty": 0.0005028243003835087,
+      "visibility": 0.10090084094554186,
+      "world_model": 2.023001086898148
+    }
+  },
+  {
+    "epoch": 2,
+    "train": {
+      "action": 0.022834130358048446,
+      "arm_role": 3.6339485208401505e-05,
+      "belief": 0.10015391417978946,
+      "clearance": 0.08339313631243418,
+      "corridor": 0.24550532728082536,
+      "disturbance": 0.002419849791671015,
+      "grasp_affordance": 0.011102509094860541,
+      "occluder_contact": 0.20242435567041966,
+      "persistence": 4.354869382134127,
+      "phase": 0.6933721572316754,
+      "planner_ranking": 0.04187904763565859,
+      "planner_risk": 0.010259467963658331,
+      "planner_success": 0.5138571092283538,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1488539314394846,
+      "proposal_reconstruction": 0.06509613401758733,
+      "proposal_success": 0.6776590312962757,
+      "reocclusion": 0.70495132540221,
+      "role_swap_consistency": 0.0003516697920602868,
+      "support_mode": 0.6823001881544503,
+      "support_stability": 0.14350243961116718,
+      "total": 1.378995967473035,
+      "uncertainty": 0.0031733291824921203,
+      "visibility": 0.09716511293465555,
+      "world_model": 2.104598100584839
+    },
+    "val": {
+      "action": 0.02644303720444441,
+      "arm_role": 4.627731826190029e-06,
+      "belief": 0.10258024383801967,
+      "clearance": 0.07597982959123328,
+      "corridor": 0.2423992605181411,
+      "disturbance": 0.0015974244740846189,
+      "grasp_affordance": 0.007909159859991632,
+      "occluder_contact": 0.19435308501124382,
+      "persistence": 3.919285401701927,
+      "phase": 0.6770087121985853,
+      "planner_ranking": 0.030531517459166935,
+      "planner_risk": 0.010262692154356046,
+      "planner_success": 0.5169326290488243,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.138186807744205,
+      "proposal_reconstruction": 0.06911751109873876,
+      "proposal_success": 0.6695848302915692,
+      "reocclusion": 0.6975388880819082,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.6884247697889805,
+      "support_stability": 0.13594868587097153,
+      "total": 1.3366163168102503,
+      "uncertainty": 0.0006479808544099797,
+      "visibility": 0.09649082575924695,
+      "world_model": 2.0216304706409574
+    }
+  },
+  {
+    "epoch": 3,
+    "train": {
+      "action": 0.021160060905544235,
+      "arm_role": 5.587545364939105e-05,
+      "belief": 0.10077974488909956,
+      "clearance": 0.08377115065670762,
+      "corridor": 0.2723994788211522,
+      "disturbance": 0.0028603613238174243,
+      "grasp_affordance": 0.011514163958835196,
+      "occluder_contact": 0.20602131318983607,
+      "persistence": 3.0813600014851317,
+      "phase": 0.6817607779777487,
+      "planner_ranking": 0.031658034657560674,
+      "planner_risk": 0.010394540625284256,
+      "planner_success": 0.5069346120532271,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.132226309851202,
+      "proposal_reconstruction": 0.06328810811900967,
+      "proposal_success": 0.6744790461050902,
+      "reocclusion": 0.6852282721022661,
+      "role_swap_consistency": 0.0005754872515272832,
+      "support_mode": 0.6633978239528796,
+      "support_stability": 0.14488365837977468,
+      "total": 1.293662095569191,
+      "uncertainty": 0.0023333917296635863,
+      "visibility": 0.09853576490392235,
+      "world_model": 2.0413369105748482
+    },
+    "val": {
+      "action": 0.017367416352499276,
+      "arm_role": 7.692722565622034e-07,
+      "belief": 0.1027774921967648,
+      "clearance": 0.08752925635781139,
+      "corridor": 0.26156787533545867,
+      "disturbance": 0.0016430629628985116,
+      "grasp_affordance": 0.010058694657345768,
+      "occluder_contact": 0.21157401148229837,
+      "persistence": 1.0993698399979621,
+      "phase": 0.6142133427783847,
+      "planner_ranking": 0.03328441088268619,
+      "planner_risk": 0.010188427979301196,
+      "planner_success": 0.4918641885742545,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1239634547382593,
+      "proposal_reconstruction": 0.06056849448941648,
+      "proposal_success": 0.6778606250882149,
+      "reocclusion": 0.5640022717416286,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.5024671151768416,
+      "support_stability": 0.13648800805094652,
+      "total": 1.1350205279886723,
+      "uncertainty": 0.0008341338888158134,
+      "visibility": 0.0982570193009451,
+      "world_model": 1.93993010930717
+    }
+  }
+]

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/summary.json ADDED Viewed

	@@ -0,0 +1,557 @@

+{
+  "experiment_name": "proxy_interaction_r3d_stage1_clip_seed8",
+  "device": "cuda",
+  "best_checkpoint": "/workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed8/checkpoint_best.pt",
+  "final_train_total": 1.293662095569191,
+  "final_val_total": 1.1350205279886723,
+  "train_time_sec": 146.87081933021545,
+  "peak_gpu_memory_mb": 1891.1337890625,
+  "num_train_samples": 381,
+  "num_val_samples": 127,
+  "planner_mode": "trainable",
+  "frozen_modules": [],
+  "init_info": {
+    "path": "/workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt",
+    "loaded_keys": 461,
+    "skipped_shape_mismatch_keys": [
+      "memory.gru.weight_ih_l0",
+      "memory.gru.weight_hh_l0",
+      "memory.gru.bias_ih_l0",
+      "memory.gru.bias_hh_l0",
+      "memory.token_proj.0.weight",
+      "memory.token_proj.0.bias",
+      "memory.token_proj.1.weight",
+      "memory.token_proj.1.bias",
+      "decoder.actor_role_bias",
+      "decoder.revealer_decoder.layers.0.self_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.0.self_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.0.self_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.0.self_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.0.multihead_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.0.multihead_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.0.multihead_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.0.multihead_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.0.linear1.weight",
+      "decoder.revealer_decoder.layers.0.linear1.bias",
+      "decoder.revealer_decoder.layers.0.linear2.weight",
+      "decoder.revealer_decoder.layers.0.linear2.bias",
+      "decoder.revealer_decoder.layers.0.norm1.weight",
+      "decoder.revealer_decoder.layers.0.norm1.bias",
+      "decoder.revealer_decoder.layers.0.norm2.weight",
+      "decoder.revealer_decoder.layers.0.norm2.bias",
+      "decoder.revealer_decoder.layers.0.norm3.weight",
+      "decoder.revealer_decoder.layers.0.norm3.bias",
+      "decoder.revealer_decoder.layers.1.self_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.1.self_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.1.self_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.1.self_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.1.multihead_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.1.multihead_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.1.multihead_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.1.multihead_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.1.linear1.weight",
+      "decoder.revealer_decoder.layers.1.linear1.bias",
+      "decoder.revealer_decoder.layers.1.linear2.weight",
+      "decoder.revealer_decoder.layers.1.linear2.bias",
+      "decoder.revealer_decoder.layers.1.norm1.weight",
+      "decoder.revealer_decoder.layers.1.norm1.bias",
+      "decoder.revealer_decoder.layers.1.norm2.weight",
+      "decoder.revealer_decoder.layers.1.norm2.bias",
+      "decoder.revealer_decoder.layers.1.norm3.weight",
+      "decoder.revealer_decoder.layers.1.norm3.bias",
+      "decoder.revealer_decoder.layers.2.self_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.2.self_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.2.self_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.2.self_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.2.multihead_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.2.multihead_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.2.multihead_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.2.multihead_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.2.linear1.weight",
+      "decoder.revealer_decoder.layers.2.linear1.bias",
+      "decoder.revealer_decoder.layers.2.linear2.weight",
+      "decoder.revealer_decoder.layers.2.linear2.bias",
+      "decoder.revealer_decoder.layers.2.norm1.weight",
+      "decoder.revealer_decoder.layers.2.norm1.bias",
+      "decoder.revealer_decoder.layers.2.norm2.weight",
+      "decoder.revealer_decoder.layers.2.norm2.bias",
+      "decoder.revealer_decoder.layers.2.norm3.weight",
+      "decoder.revealer_decoder.layers.2.norm3.bias",
+      "decoder.revealer_decoder.layers.3.self_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.3.self_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.3.self_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.3.self_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.3.multihead_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.3.multihead_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.3.multihead_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.3.multihead_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.3.linear1.weight",
+      "decoder.revealer_decoder.layers.3.linear1.bias",
+      "decoder.revealer_decoder.layers.3.linear2.weight",
+      "decoder.revealer_decoder.layers.3.linear2.bias",
+      "decoder.revealer_decoder.layers.3.norm1.weight",
+      "decoder.revealer_decoder.layers.3.norm1.bias",
+      "decoder.revealer_decoder.layers.3.norm2.weight",
+      "decoder.revealer_decoder.layers.3.norm2.bias",
+      "decoder.revealer_decoder.layers.3.norm3.weight",
+      "decoder.revealer_decoder.layers.3.norm3.bias",
+      "decoder.actor_decoder.layers.0.self_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.0.self_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.0.self_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.0.self_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.0.multihead_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.0.multihead_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.0.multihead_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.0.multihead_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.0.linear1.weight",
+      "decoder.actor_decoder.layers.0.linear1.bias",
+      "decoder.actor_decoder.layers.0.linear2.weight",
+      "decoder.actor_decoder.layers.0.linear2.bias",
+      "decoder.actor_decoder.layers.0.norm1.weight",
+      "decoder.actor_decoder.layers.0.norm1.bias",
+      "decoder.actor_decoder.layers.0.norm2.weight",
+      "decoder.actor_decoder.layers.0.norm2.bias",
+      "decoder.actor_decoder.layers.0.norm3.weight",
+      "decoder.actor_decoder.layers.0.norm3.bias",
+      "decoder.actor_decoder.layers.1.self_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.1.self_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.1.self_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.1.self_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.1.multihead_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.1.multihead_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.1.multihead_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.1.multihead_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.1.linear1.weight",
+      "decoder.actor_decoder.layers.1.linear1.bias",
+      "decoder.actor_decoder.layers.1.linear2.weight",
+      "decoder.actor_decoder.layers.1.linear2.bias",
+      "decoder.actor_decoder.layers.1.norm1.weight",
+      "decoder.actor_decoder.layers.1.norm1.bias",
+      "decoder.actor_decoder.layers.1.norm2.weight",
+      "decoder.actor_decoder.layers.1.norm2.bias",
+      "decoder.actor_decoder.layers.1.norm3.weight",
+      "decoder.actor_decoder.layers.1.norm3.bias",
+      "decoder.actor_decoder.layers.2.self_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.2.self_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.2.self_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.2.self_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.2.multihead_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.2.multihead_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.2.multihead_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.2.multihead_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.2.linear1.weight",
+      "decoder.actor_decoder.layers.2.linear1.bias",
+      "decoder.actor_decoder.layers.2.linear2.weight",
+      "decoder.actor_decoder.layers.2.linear2.bias",
+      "decoder.actor_decoder.layers.2.norm1.weight",
+      "decoder.actor_decoder.layers.2.norm1.bias",
+      "decoder.actor_decoder.layers.2.norm2.weight",
+      "decoder.actor_decoder.layers.2.norm2.bias",
+      "decoder.actor_decoder.layers.2.norm3.weight",
+      "decoder.actor_decoder.layers.2.norm3.bias",
+      "decoder.actor_decoder.layers.3.self_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.3.self_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.3.self_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.3.self_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.3.multihead_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.3.multihead_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.3.multihead_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.3.multihead_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.3.linear1.weight",
+      "decoder.actor_decoder.layers.3.linear1.bias",
+      "decoder.actor_decoder.layers.3.linear2.weight",
+      "decoder.actor_decoder.layers.3.linear2.bias",
+      "decoder.actor_decoder.layers.3.norm1.weight",
+      "decoder.actor_decoder.layers.3.norm1.bias",
+      "decoder.actor_decoder.layers.3.norm2.weight",
+      "decoder.actor_decoder.layers.3.norm2.bias",
+      "decoder.actor_decoder.layers.3.norm3.weight",
+      "decoder.actor_decoder.layers.3.norm3.bias",
+      "decoder.revealer_mean.weight",
+      "decoder.revealer_mean.bias",
+      "decoder.revealer_log_std.weight",
+      "decoder.revealer_log_std.bias",
+      "decoder.actor_mean.weight",
+      "decoder.actor_mean.bias",
+      "decoder.actor_log_std.weight",
+      "decoder.actor_log_std.bias",
+      "decoder.proposal_score.0.weight",
+      "decoder.proposal_score.0.bias",
+      "decoder.proposal_score.1.weight",
+      "decoder.proposal_score.1.bias"
+    ],
+    "missing_keys": [
+      "backbone.depth_adapter.depth_proj.0.weight",
+      "backbone.depth_adapter.depth_proj.0.bias",
+      "backbone.depth_adapter.depth_proj.1.weight",
+      "backbone.depth_adapter.depth_proj.1.bias",
+      "backbone.depth_adapter.depth_proj.3.weight",
+      "backbone.depth_adapter.depth_proj.3.bias",
+      "backbone.depth_adapter.geometry_proj.0.weight",
+      "backbone.depth_adapter.geometry_proj.0.bias",
+      "backbone.depth_adapter.geometry_proj.1.weight",
+      "backbone.depth_adapter.geometry_proj.1.bias",
+      "backbone.depth_adapter.camera_proj.0.weight",
+      "backbone.depth_adapter.camera_proj.0.bias",
+      "backbone.depth_adapter.camera_proj.1.weight",
+      "backbone.depth_adapter.camera_proj.1.bias",
+      "fusion.geometry_fusion.attn.in_proj_weight",
+      "fusion.geometry_fusion.attn.in_proj_bias",
+      "fusion.geometry_fusion.attn.out_proj.weight",
+      "fusion.geometry_fusion.attn.out_proj.bias",
+      "fusion.geometry_fusion.gate.0.weight",
+      "fusion.geometry_fusion.gate.0.bias",
+      "fusion.geometry_fusion.gate.1.weight",
+      "fusion.geometry_fusion.gate.1.bias",
+      "fusion.geometry_fusion.gate.3.weight",
+      "fusion.geometry_fusion.gate.3.bias",
+      "fusion.geometry_fusion.out.0.weight",
+      "fusion.geometry_fusion.out.0.bias",
+      "fusion.geometry_fusion.out.1.weight",
+      "fusion.geometry_fusion.out.1.bias",
+      "memory.scene_memory.position_embedding",
+      "memory.scene_memory.bank_queries",
+      "memory.scene_memory.sequence_encoder.layers.0.self_attn.in_proj_weight",
+      "memory.scene_memory.sequence_encoder.layers.0.self_attn.in_proj_bias",
+      "memory.scene_memory.sequence_encoder.layers.0.self_attn.out_proj.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.self_attn.out_proj.bias",
+      "memory.scene_memory.sequence_encoder.layers.0.linear1.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.linear1.bias",
+      "memory.scene_memory.sequence_encoder.layers.0.linear2.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.linear2.bias",
+      "memory.scene_memory.sequence_encoder.layers.0.norm1.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.norm1.bias",
+      "memory.scene_memory.sequence_encoder.layers.0.norm2.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.norm2.bias",
+      "memory.scene_memory.bank_attention.in_proj_weight",
+      "memory.scene_memory.bank_attention.in_proj_bias",
+      "memory.scene_memory.bank_attention.out_proj.weight",
+      "memory.scene_memory.bank_attention.out_proj.bias",
+      "memory.scene_memory.action_proj.0.weight",
+      "memory.scene_memory.action_proj.0.bias",
+      "memory.scene_memory.action_proj.1.weight",
+      "memory.scene_memory.action_proj.1.bias",
+      "memory.scene_memory.write_gate.0.weight",
+      "memory.scene_memory.write_gate.0.bias",
+      "memory.scene_memory.write_gate.1.weight",
+      "memory.scene_memory.write_gate.1.bias",
+      "memory.scene_memory.write_gate.3.weight",
+      "memory.scene_memory.write_gate.3.bias",
+      "memory.scene_memory.token_proj.0.weight",
+      "memory.scene_memory.token_proj.0.bias",
+      "memory.scene_memory.token_proj.1.weight",
+      "memory.scene_memory.token_proj.1.bias",
+      "memory.belief_memory.position_embedding",
+      "memory.belief_memory.bank_queries",
+      "memory.belief_memory.sequence_encoder.layers.0.self_attn.in_proj_weight",
+      "memory.belief_memory.sequence_encoder.layers.0.self_attn.in_proj_bias",
+      "memory.belief_memory.sequence_encoder.layers.0.self_attn.out_proj.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.self_attn.out_proj.bias",
+      "memory.belief_memory.sequence_encoder.layers.0.linear1.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.linear1.bias",
+      "memory.belief_memory.sequence_encoder.layers.0.linear2.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.linear2.bias",
+      "memory.belief_memory.sequence_encoder.layers.0.norm1.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.norm1.bias",
+      "memory.belief_memory.sequence_encoder.layers.0.norm2.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.norm2.bias",
+      "memory.belief_memory.bank_attention.in_proj_weight",
+      "memory.belief_memory.bank_attention.in_proj_bias",
+      "memory.belief_memory.bank_attention.out_proj.weight",
+      "memory.belief_memory.bank_attention.out_proj.bias",
+      "memory.belief_memory.action_proj.0.weight",
+      "memory.belief_memory.action_proj.0.bias",
+      "memory.belief_memory.action_proj.1.weight",
+      "memory.belief_memory.action_proj.1.bias",
+      "memory.belief_memory.write_gate.0.weight",
+      "memory.belief_memory.write_gate.0.bias",
+      "memory.belief_memory.write_gate.1.weight",
+      "memory.belief_memory.write_gate.1.bias",
+      "memory.belief_memory.write_gate.3.weight",
+      "memory.belief_memory.write_gate.3.bias",
+      "memory.belief_memory.token_proj.0.weight",
+      "memory.belief_memory.token_proj.0.bias",
+      "memory.belief_memory.token_proj.1.weight",
+      "memory.belief_memory.token_proj.1.bias",
+      "decoder.arm_decoder.layers.0.self_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.0.self_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.0.self_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.0.self_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.0.multihead_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.0.multihead_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.0.multihead_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.0.multihead_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.0.linear1.weight",
+      "decoder.arm_decoder.layers.0.linear1.bias",
+      "decoder.arm_decoder.layers.0.linear2.weight",
+      "decoder.arm_decoder.layers.0.linear2.bias",
+      "decoder.arm_decoder.layers.0.norm1.weight",
+      "decoder.arm_decoder.layers.0.norm1.bias",
+      "decoder.arm_decoder.layers.0.norm2.weight",
+      "decoder.arm_decoder.layers.0.norm2.bias",
+      "decoder.arm_decoder.layers.0.norm3.weight",
+      "decoder.arm_decoder.layers.0.norm3.bias",
+      "decoder.arm_decoder.layers.1.self_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.1.self_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.1.self_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.1.self_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.1.multihead_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.1.multihead_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.1.multihead_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.1.multihead_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.1.linear1.weight",
+      "decoder.arm_decoder.layers.1.linear1.bias",
+      "decoder.arm_decoder.layers.1.linear2.weight",
+      "decoder.arm_decoder.layers.1.linear2.bias",
+      "decoder.arm_decoder.layers.1.norm1.weight",
+      "decoder.arm_decoder.layers.1.norm1.bias",
+      "decoder.arm_decoder.layers.1.norm2.weight",
+      "decoder.arm_decoder.layers.1.norm2.bias",
+      "decoder.arm_decoder.layers.1.norm3.weight",
+      "decoder.arm_decoder.layers.1.norm3.bias",
+      "decoder.arm_decoder.layers.2.self_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.2.self_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.2.self_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.2.self_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.2.multihead_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.2.multihead_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.2.multihead_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.2.multihead_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.2.linear1.weight",
+      "decoder.arm_decoder.layers.2.linear1.bias",
+      "decoder.arm_decoder.layers.2.linear2.weight",
+      "decoder.arm_decoder.layers.2.linear2.bias",
+      "decoder.arm_decoder.layers.2.norm1.weight",
+      "decoder.arm_decoder.layers.2.norm1.bias",
+      "decoder.arm_decoder.layers.2.norm2.weight",
+      "decoder.arm_decoder.layers.2.norm2.bias",
+      "decoder.arm_decoder.layers.2.norm3.weight",
+      "decoder.arm_decoder.layers.2.norm3.bias",
+      "decoder.arm_decoder.layers.3.self_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.3.self_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.3.self_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.3.self_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.3.multihead_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.3.multihead_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.3.multihead_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.3.multihead_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.3.linear1.weight",
+      "decoder.arm_decoder.layers.3.linear1.bias",
+      "decoder.arm_decoder.layers.3.linear2.weight",
+      "decoder.arm_decoder.layers.3.linear2.bias",
+      "decoder.arm_decoder.layers.3.norm1.weight",
+      "decoder.arm_decoder.layers.3.norm1.bias",
+      "decoder.arm_decoder.layers.3.norm2.weight",
+      "decoder.arm_decoder.layers.3.norm2.bias",
+      "decoder.arm_decoder.layers.3.norm3.weight",
+      "decoder.arm_decoder.layers.3.norm3.bias",
+      "decoder.arm_identity.weight",
+      "decoder.phase_adapter.weight",
+      "decoder.phase_adapter.bias",
+      "decoder.role_adapter.weight",
+      "decoder.role_adapter.bias",
+      "decoder.context_proj.0.weight",
+      "decoder.context_proj.0.bias",
+      "decoder.context_proj.1.weight",
+      "decoder.context_proj.1.bias",
+      "decoder.arm_head.0.weight",
+      "decoder.arm_head.0.bias",
+      "decoder.arm_head.1.weight",
+      "decoder.arm_head.1.bias",
+      "decoder.arm_mean.weight",
+      "decoder.arm_mean.bias",
+      "decoder.arm_log_std.weight",
+      "decoder.arm_log_std.bias",
+      "decoder.proposal_mode_head.0.weight",
+      "decoder.proposal_mode_head.0.bias",
+      "decoder.proposal_mode_head.1.weight",
+      "decoder.proposal_mode_head.1.bias",
+      "decoder.proposal_mode_head.3.weight",
+      "decoder.proposal_mode_head.3.bias",
+      "decoder.proposal_mode_embeddings.weight",
+      "decoder.proposal_slot_embeddings.weight",
+      "decoder.mode_residual_heads.0.0.weight",
+      "decoder.mode_residual_heads.0.0.bias",
+      "decoder.mode_residual_heads.0.1.weight",
+      "decoder.mode_residual_heads.0.1.bias",
+      "decoder.mode_residual_heads.0.3.weight",
+      "decoder.mode_residual_heads.0.3.bias",
+      "decoder.mode_residual_heads.1.0.weight",
+      "decoder.mode_residual_heads.1.0.bias",
+      "decoder.mode_residual_heads.1.1.weight",
+      "decoder.mode_residual_heads.1.1.bias",
+      "decoder.mode_residual_heads.1.3.weight",
+      "decoder.mode_residual_heads.1.3.bias",
+      "decoder.mode_residual_heads.2.0.weight",
+      "decoder.mode_residual_heads.2.0.bias",
+      "decoder.mode_residual_heads.2.1.weight",
+      "decoder.mode_residual_heads.2.1.bias",
+      "decoder.mode_residual_heads.2.3.weight",
+      "decoder.mode_residual_heads.2.3.bias",
+      "decoder.mode_residual_heads.3.0.weight",
+      "decoder.mode_residual_heads.3.0.bias",
+      "decoder.mode_residual_heads.3.1.weight",
+      "decoder.mode_residual_heads.3.1.bias",
+      "decoder.mode_residual_heads.3.3.weight",
+      "decoder.mode_residual_heads.3.3.bias",
+      "decoder.mode_residual_heads.4.0.weight",
+      "decoder.mode_residual_heads.4.0.bias",
+      "decoder.mode_residual_heads.4.1.weight",
+      "decoder.mode_residual_heads.4.1.bias",
+      "decoder.mode_residual_heads.4.3.weight",
+      "decoder.mode_residual_heads.4.3.bias",
+      "decoder.mode_residual_heads.5.0.weight",
+      "decoder.mode_residual_heads.5.0.bias",
+      "decoder.mode_residual_heads.5.1.weight",
+      "decoder.mode_residual_heads.5.1.bias",
+      "decoder.mode_residual_heads.5.3.weight",
+      "decoder.mode_residual_heads.5.3.bias",
+      "decoder.slot_delta.0.weight",
+      "decoder.slot_delta.0.bias",
+      "decoder.slot_delta.1.weight",
+      "decoder.slot_delta.1.bias",
+      "decoder.slot_delta.3.weight",
+      "decoder.slot_delta.3.bias",
+      "decoder.proposal_score.0.weight",
+      "decoder.proposal_score.0.bias",
+      "decoder.proposal_score.1.weight",
+      "decoder.proposal_score.1.bias",
+      "decoder.proposal_score.3.weight",
+      "decoder.proposal_score.3.bias",
+      "elastic_state_head.interaction_queries",
+      "elastic_state_head.interaction_attention.in_proj_weight",
+      "elastic_state_head.interaction_attention.in_proj_bias",
+      "elastic_state_head.interaction_attention.out_proj.weight",
+      "elastic_state_head.interaction_attention.out_proj.bias",
+      "elastic_state_head.interaction_mlp.0.weight",
+      "elastic_state_head.interaction_mlp.0.bias",
+      "elastic_state_head.interaction_mlp.1.weight",
+      "elastic_state_head.interaction_mlp.1.bias",
+      "elastic_state_head.interaction_mlp.3.weight",
+      "elastic_state_head.interaction_mlp.3.bias",
+      "elastic_state_head.decoder.field_queries",
+      "elastic_state_head.decoder.field_attention.in_proj_weight",
+      "elastic_state_head.decoder.field_attention.in_proj_bias",
+      "elastic_state_head.decoder.field_attention.out_proj.weight",
+      "elastic_state_head.decoder.field_attention.out_proj.bias",
+      "elastic_state_head.decoder.field_mlp.0.weight",
+      "elastic_state_head.decoder.field_mlp.0.bias",
+      "elastic_state_head.decoder.field_mlp.1.weight",
+      "elastic_state_head.decoder.field_mlp.1.bias",
+      "elastic_state_head.decoder.field_mlp.3.weight",
+      "elastic_state_head.decoder.field_mlp.3.bias",
+      "elastic_state_head.decoder.summary_proj.0.weight",
+      "elastic_state_head.decoder.summary_proj.0.bias",
+      "elastic_state_head.decoder.summary_proj.1.weight",
+      "elastic_state_head.decoder.summary_proj.1.bias",
+      "elastic_state_head.decoder.phase_head.0.weight",
+      "elastic_state_head.decoder.phase_head.0.bias",
+      "elastic_state_head.decoder.phase_head.1.weight",
+      "elastic_state_head.decoder.phase_head.1.bias",
+      "elastic_state_head.decoder.phase_head.3.weight",
+      "elastic_state_head.decoder.phase_head.3.bias",
+      "elastic_state_head.decoder.arm_role_head.0.weight",
+      "elastic_state_head.decoder.arm_role_head.0.bias",
+      "elastic_state_head.decoder.arm_role_head.1.weight",
+      "elastic_state_head.decoder.arm_role_head.1.bias",
+      "elastic_state_head.decoder.arm_role_head.3.weight",
+      "elastic_state_head.decoder.arm_role_head.3.bias",
+      "elastic_state_head.decoder.arm_identity.weight",
+      "elastic_state_head.decoder.support_mode.0.weight",
+      "elastic_state_head.decoder.support_mode.0.bias",
+      "elastic_state_head.decoder.support_mode.1.weight",
+      "elastic_state_head.decoder.support_mode.1.bias",
+      "elastic_state_head.decoder.support_mode.3.weight",
+      "elastic_state_head.decoder.support_mode.3.bias",
+      "elastic_state_head.decoder.access_field.weight",
+      "elastic_state_head.decoder.access_field.bias",
+      "elastic_state_head.decoder.target_belief_field.weight",
+      "elastic_state_head.decoder.target_belief_field.bias",
+      "elastic_state_head.decoder.visibility_field.weight",
+      "elastic_state_head.decoder.visibility_field.bias",
+      "elastic_state_head.decoder.clearance_field.weight",
+      "elastic_state_head.decoder.clearance_field.bias",
+      "elastic_state_head.decoder.occluder_contact_field.weight",
+      "elastic_state_head.decoder.occluder_contact_field.bias",
+      "elastic_state_head.decoder.grasp_affordance_field.weight",
+      "elastic_state_head.decoder.grasp_affordance_field.bias",
+      "elastic_state_head.decoder.support_stability_field.weight",
+      "elastic_state_head.decoder.support_stability_field.bias",
+      "elastic_state_head.decoder.persistence_field.weight",
+      "elastic_state_head.decoder.persistence_field.bias",
+      "elastic_state_head.decoder.reocclusion_field.weight",
+      "elastic_state_head.decoder.reocclusion_field.bias",
+      "elastic_state_head.decoder.disturbance_field.weight",
+      "elastic_state_head.decoder.disturbance_field.bias",
+      "elastic_state_head.decoder.uncertainty_field.weight",
+      "elastic_state_head.decoder.uncertainty_field.bias",
+      "elastic_state_head.decoder.reocclusion_head.0.weight",
+      "elastic_state_head.decoder.reocclusion_head.0.bias",
+      "elastic_state_head.decoder.reocclusion_head.1.weight",
+      "elastic_state_head.decoder.reocclusion_head.1.bias",
+      "elastic_state_head.decoder.reocclusion_head.3.weight",
+      "elastic_state_head.decoder.reocclusion_head.3.bias",
+      "world_model.state_encoder.0.weight",
+      "world_model.state_encoder.0.bias",
+      "world_model.state_encoder.1.weight",
+      "world_model.state_encoder.1.bias",
+      "world_model.scene_memory_proj.0.weight",
+      "world_model.scene_memory_proj.0.bias",
+      "world_model.scene_memory_proj.1.weight",
+      "world_model.scene_memory_proj.1.bias",
+      "world_model.belief_memory_proj.0.weight",
+      "world_model.belief_memory_proj.0.bias",
+      "world_model.belief_memory_proj.1.weight",
+      "world_model.belief_memory_proj.1.bias",
+      "world_model.action_encoder.0.weight",
+      "world_model.action_encoder.0.bias",
+      "world_model.action_encoder.1.weight",
+      "world_model.action_encoder.1.bias",
+      "world_model.transition.weight_ih",
+      "world_model.transition.weight_hh",
+      "world_model.transition.bias_ih",
+      "world_model.transition.bias_hh",
+      "world_model.scene_memory_update.weight",
+      "world_model.scene_memory_update.bias",
+      "world_model.belief_memory_update.weight",
+      "world_model.belief_memory_update.bias",
+      "world_model.compact_decoder.weight",
+      "world_model.compact_decoder.bias",
+      "world_model.target_belief_head.weight",
+      "world_model.target_belief_head.bias",
+      "world_model.visibility_head.weight",
+      "world_model.visibility_head.bias",
+      "world_model.clearance_head.weight",
+      "world_model.clearance_head.bias",
+      "world_model.occluder_contact_head.weight",
+      "world_model.occluder_contact_head.bias",
+      "world_model.grasp_affordance_head.weight",
+      "world_model.grasp_affordance_head.bias",
+      "world_model.support_stability_head.weight",
+      "world_model.support_stability_head.bias",
+      "world_model.persistence_head.weight",
+      "world_model.persistence_head.bias",
+      "world_model.reocclusion_head.weight",
+      "world_model.reocclusion_head.bias",
+      "world_model.disturbance_head.weight",
+      "world_model.disturbance_head.bias",
+      "world_model.uncertainty_head.weight",
+      "world_model.uncertainty_head.bias",
+      "world_model.access_head.weight",
+      "world_model.access_head.bias",
+      "planner.residual.trunk.0.weight",
+      "planner.residual.trunk.0.bias",
+      "planner.residual.trunk.1.weight",
+      "planner.residual.trunk.1.bias",
+      "planner.residual.trunk.3.weight",
+      "planner.residual.trunk.3.bias",
+      "planner.residual.success_head.weight",
+      "planner.residual.success_head.bias",
+      "planner.residual.risk_head.weight",
+      "planner.residual.risk_head.bias",
+      "planner.residual.residual_head.weight",
+      "planner.residual.residual_head.bias"
+    ],
+    "unexpected_keys": []
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/benchmark_full/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "full": {
+    "per_task_success": {
+      "foliage_proxy": 0.5,
+      "bag_proxy": 0.5416666666666666,
+      "cloth_proxy": 0.6666666666666666
+    },
+    "mean_success": 0.5694444444444443,
+    "visibility_integral": 32.623872251146366,
+    "corridor_availability": 0.889709601799647,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 2.1627785900766536,
+    "disturbance_cost": 0.2332938505957524
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/benchmark_full/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## full
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/checkpoint_best.pt
+- mean_success: 0.569
+- visibility_integral: 32.624
+- corridor_availability: 0.890
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 2.163
+- disturbance_cost: 0.233
+- foliage_proxy_success: 0.500
+- bag_proxy_success: 0.542
+- cloth_proxy_success: 0.667

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/config_resolved.yaml ADDED Viewed

	@@ -0,0 +1,149 @@

+experiment_name: proxy_interaction_r3d_stage1_clip_seed9
+output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
+device: cuda
+seed: 9
+init_checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt
+init_strict: false
+data:
+  proxies:
+  - foliage_proxy
+  - bag_proxy
+  - cloth_proxy
+  resolution: 224
+  dataset_version: reveal_proxy_v6_rgbd_elastic_state
+  train_episodes_per_proxy: 48
+  val_episodes_per_proxy: 16
+  train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_clip224_v6_rgbd_stage1_seed9.pt
+  val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_clip224_v6_rgbd_stage1_seed9.pt
+  rebuild_dataset: false
+  chunk_horizon: 8
+  rollout_horizon: 5
+  history_steps: 6
+  planner_candidates: 8
+  seed: 9
+optim:
+  epochs: 4
+  batch_size: 2
+  num_workers: 4
+  lr: 0.0003
+  weight_decay: 0.0001
+trainer:
+  policy_type: elastic_reveal
+  use_bf16: true
+  grad_clip_norm: 1.0
+  freeze_backbone: true
+  gradient_checkpointing: false
+  plan_during_train: true
+  plan_during_eval: true
+  support_mode_conditioning: true
+  planner_mode: trainable
+  use_depth: false
+  use_world_model: true
+  use_role_tokens: true
+  compute_equivariance_probe: true
+policy:
+  backbone:
+    model_name: openai/clip-vit-base-patch32
+    hidden_dim: 512
+    max_text_tokens: 32
+    freeze_backbone: true
+    gradient_checkpointing: false
+    use_dummy_backbone: false
+  fusion:
+    hidden_dim: 512
+    num_cameras: 3
+    num_layers: 4
+    num_heads: 8
+    ff_dim: 2048
+    dropout: 0.1
+    proprio_dim: 32
+    proprio_tokens: 1
+  memory:
+    hidden_dim: 512
+    action_dim: 14
+    history_steps: 6
+    scene_history_steps: 3
+    belief_history_steps: 8
+    num_layers: 2
+    dropout: 0.1
+    memory_bank_size: 4
+    scene_bank_size: 2
+    belief_bank_size: 2
+    num_heads: 8
+    max_history_steps: 8
+  decoder:
+    hidden_dim: 512
+    num_heads: 8
+    num_layers: 4
+    ff_dim: 2048
+    dropout: 0.1
+    chunk_size: 8
+    action_dim: 14
+    arm_action_dim: 7
+    num_candidates: 8
+    num_phases: 5
+    num_arm_roles: 4
+    num_proposal_modes: 6
+    planner_top_k: 4
+  reveal_head:
+    hidden_dim: 512
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    belief_map_size: 32
+    field_size: 16
+    num_heads: 8
+    predict_belief_map: true
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+  world_model:
+    hidden_dim: 512
+    action_dim: 14
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    field_size: 16
+    num_heads: 8
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+    belief_map_size: 32
+    predict_belief_map: true
+    scene_bank_size: 2
+    belief_bank_size: 2
+  planner:
+    hidden_dim: 512
+    num_candidates: 8
+    action_dim: 14
+    num_support_modes: 3
+    utility_margin: 0.1
+    num_heads: 8
+    num_layers: 2
+    num_phases: 5
+    num_arm_roles: 4
+    top_k: 4
+loss_weights:
+  action: 1.0
+  phase: 0.1
+  arm_role: 0.15
+  support_mode: 0.1
+  corridor: 0.15
+  persistence: 0.05
+  disturbance: 0.05
+  world_model: 0.2
+  belief: 0.05
+  visibility: 0.05
+  clearance: 0.05
+  support_stability: 0.05
+  reocclusion: 0.05
+  occluder_contact: 0.05
+  grasp_affordance: 0.05
+  planner_success: 0.25
+  planner_risk: 0.1
+  planner_ranking: 0.2
+  proposal_reconstruction: 0.1
+  proposal_success: 0.15
+  proposal_ranking: 0.2
+  proposal_diversity: 0.05
+  role_swap_consistency: 0.05

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/diagnostics_full/proxy_diagnostics.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "planner_top1_accuracy": 0.2890625,
+  "planner_regret": 0.02300698682665825,
+  "planner_score_utility_spearman": 0.22968751192092896,
+  "risk_calibration_mse": 0.010304542258381844,
+  "role_collapse_rate": 0.0,
+  "proposal_diversity": 0.022611485794186592,
+  "left_right_equivariance_error": 8.689248215887346e-05,
+  "belief_calibration_brier": 0.0043337177485227585,
+  "reocclusion_calibration_brier": 0.22800305485725403,
+  "support_stability_mae": 0.02859283983707428,
+  "clearance_auc": 0.6329041426155311,
+  "memory_write_rate": 0.0,
+  "memory_saturation": 0.2469944953918457,
+  "num_samples": 128
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/metrics.json ADDED Viewed

	@@ -0,0 +1,230 @@

+[
+  {
+    "epoch": 0,
+    "train": {
+      "action": 0.027812569460978633,
+      "arm_role": 0.030137697646492406,
+      "belief": 0.12157152328444154,
+      "clearance": 0.09282162053216444,
+      "corridor": 0.2851656379864404,
+      "disturbance": 0.004553798715077344,
+      "grasp_affordance": 0.018851539715634365,
+      "occluder_contact": 0.2132460696916831,
+      "persistence": 5.642576662878807,
+      "phase": 0.7761939600894325,
+      "planner_ranking": 0.17902961440620282,
+      "planner_risk": 0.013923984336035668,
+      "planner_success": 0.6199151214800382,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.2823116054660395,
+      "proposal_reconstruction": 0.06912861580127164,
+      "proposal_success": 0.6811760576147782,
+      "reocclusion": 0.7353295496419856,
+      "role_swap_consistency": 0.0005873552748725113,
+      "support_mode": 0.7828435195119757,
+      "support_stability": 0.16347284512594343,
+      "total": 1.6866143584251403,
+      "uncertainty": 0.019001170223897423,
+      "visibility": 0.11754893544865282,
+      "world_model": 2.710779071795313
+    },
+    "val": {
+      "action": 0.02170204828144051,
+      "arm_role": 6.762321064002208e-06,
+      "belief": 0.10080993873998523,
+      "clearance": 0.08166962582617998,
+      "corridor": 0.23909102065954357,
+      "disturbance": 0.001983066906802833,
+      "grasp_affordance": 0.008535019573173486,
+      "occluder_contact": 0.2112727805506438,
+      "persistence": 3.857563339173794,
+      "phase": 0.6654304726980627,
+      "planner_ranking": 0.04032187890697969,
+      "planner_risk": 0.011350331830726645,
+      "planner_success": 0.5934910103678703,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1493350621312857,
+      "proposal_reconstruction": 0.06338102876907215,
+      "proposal_success": 0.6806164355948567,
+      "reocclusion": 0.6909330077469349,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.6831411011517048,
+      "support_stability": 0.13910080850473605,
+      "total": 1.458911145105958,
+      "uncertainty": 0.0033405375688744243,
+      "visibility": 0.09547075629234314,
+      "world_model": 2.5560860373079777
+    }
+  },
+  {
+    "epoch": 1,
+    "train": {
+      "action": 0.023493385471795733,
+      "arm_role": 0.0002928718140250758,
+      "belief": 0.10523007610126546,
+      "clearance": 0.08677955961933262,
+      "corridor": 0.25750191186211613,
+      "disturbance": 0.0031594517295421777,
+      "grasp_affordance": 0.01005841078187682,
+      "occluder_contact": 0.20920588836858148,
+      "persistence": 4.331643560058192,
+      "phase": 0.7189607319078948,
+      "planner_ranking": 0.05423959079287933,
+      "planner_risk": 0.010427037446980217,
+      "planner_success": 0.5849820621703801,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1505002517449228,
+      "proposal_reconstruction": 0.06525950771021216,
+      "proposal_success": 0.6752778025049913,
+      "reocclusion": 0.7005268357302014,
+      "role_swap_consistency": 0.0007142310405278726,
+      "support_mode": 0.70107421875,
+      "support_stability": 0.14081861141480898,
+      "total": 1.432289683818817,
+      "uncertainty": 0.002551493341237993,
+      "visibility": 0.10134971671198544,
+      "world_model": 2.237849539204648
+    },
+    "val": {
+      "action": 0.021186921891057864,
+      "arm_role": 3.6694105953749556e-07,
+      "belief": 0.09995241661090404,
+      "clearance": 0.08146111795213073,
+      "corridor": 0.24082361184991896,
+      "disturbance": 0.001976304362585779,
+      "grasp_affordance": 0.00922958003502572,
+      "occluder_contact": 0.21127386414445937,
+      "persistence": 3.7571401111781597,
+      "phase": 0.6817005267366767,
+      "planner_ranking": 0.03515352255374182,
+      "planner_risk": 0.01038273600534012,
+      "planner_success": 0.5073812543414533,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1285581476986408,
+      "proposal_reconstruction": 0.0629420520272106,
+      "proposal_success": 0.6745674163103104,
+      "reocclusion": 0.6919681001454592,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.6647901809774339,
+      "support_stability": 0.14570825529517606,
+      "total": 1.3415670674294233,
+      "uncertainty": 0.0013466343752952525,
+      "visibility": 0.09475092665525153,
+      "world_model": 2.1340785464271903
+    }
+  },
+  {
+    "epoch": 2,
+    "train": {
+      "action": 0.021538028542540576,
+      "arm_role": 2.1901883577045642e-05,
+      "belief": 0.10526431232298675,
+      "clearance": 0.08594944182979433,
+      "corridor": 0.24735975777240177,
+      "disturbance": 0.0026733651749964336,
+      "grasp_affordance": 0.010091915089440974,
+      "occluder_contact": 0.20871730721310566,
+      "persistence": 4.281911664887478,
+      "phase": 0.6870194284539474,
+      "planner_ranking": 0.04152601579832519,
+      "planner_risk": 0.01045033406331449,
+      "planner_success": 0.5353652712545897,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1453557397189893,
+      "proposal_reconstruction": 0.06370952629337186,
+      "proposal_success": 0.6778088651205364,
+      "reocclusion": 0.6986164701612372,
+      "role_swap_consistency": 0.0004750598012929243,
+      "support_mode": 0.6878212376644737,
+      "support_stability": 0.1362508504700504,
+      "total": 1.384049719885776,
+      "uncertainty": 0.001396400365047157,
+      "visibility": 0.09892214826847377,
+      "world_model": 2.1307888821551675
+    },
+    "val": {
+      "action": 0.021681111145881005,
+      "arm_role": 0.0003864255304506514,
+      "belief": 0.10844068287406117,
+      "clearance": 0.08775011514080688,
+      "corridor": 0.23830276518128812,
+      "disturbance": 0.0019835491895037194,
+      "grasp_affordance": 0.011450761739979498,
+      "occluder_contact": 0.21598492935299873,
+      "persistence": 3.682887438684702,
+      "phase": 0.6754010105505586,
+      "planner_ranking": 0.03584061572041719,
+      "planner_risk": 0.010325502114255869,
+      "planner_success": 0.49944606237113476,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1196386851370335,
+      "proposal_reconstruction": 0.0637086319620721,
+      "proposal_success": 0.6784614324569702,
+      "reocclusion": 0.6908501861616969,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.6635435968637466,
+      "support_stability": 0.14290154923219234,
+      "total": 1.3013203730806708,
+      "uncertainty": 0.002612559406315995,
+      "visibility": 0.10054636449785903,
+      "world_model": 1.9632274899631739
+    }
+  },
+  {
+    "epoch": 3,
+    "train": {
+      "action": 0.02116909674123714,
+      "arm_role": 0.00017300687338176526,
+      "belief": 0.10208533270970771,
+      "clearance": 0.08287150121637081,
+      "corridor": 0.24314571875882776,
+      "disturbance": 0.002553280315360577,
+      "grasp_affordance": 0.010202447837218642,
+      "occluder_contact": 0.20370756677891078,
+      "persistence": 3.4343402633541507,
+      "phase": 0.6811472039473684,
+      "planner_ranking": 0.03300265433170257,
+      "planner_risk": 0.010154466018828221,
+      "planner_success": 0.5132313249338615,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1288216785380716,
+      "proposal_reconstruction": 0.06323393973472871,
+      "proposal_success": 0.6770071575516149,
+      "reocclusion": 0.7064933630980943,
+      "role_swap_consistency": 0.0003766025873023625,
+      "support_mode": 0.7007555509868421,
+      "support_stability": 0.1340178519732466,
+      "total": 1.314924956309168,
+      "uncertainty": 0.0012071453580622467,
+      "visibility": 0.09558045302370662,
+      "world_model": 2.054408212398228
+    },
+    "val": {
+      "action": 0.021696553943911567,
+      "arm_role": 6.053594985289124e-07,
+      "belief": 0.0983218071050942,
+      "clearance": 0.07689482159912586,
+      "corridor": 0.29242096332018264,
+      "disturbance": 0.0041615761442699295,
+      "grasp_affordance": 0.0100187708158046,
+      "occluder_contact": 0.19618010916747153,
+      "persistence": 4.662721422035247,
+      "phase": 0.6692422716878355,
+      "planner_ranking": 0.030305169929533804,
+      "planner_risk": 0.010842124038390466,
+      "planner_success": 0.5005343491211534,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1591037698090076,
+      "proposal_reconstruction": 0.06389545585261658,
+      "proposal_success": 0.6826766086742282,
+      "reocclusion": 0.7785650952719152,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.6616131067276001,
+      "support_stability": 0.1388778503460344,
+      "total": 1.3739404007792473,
+      "uncertainty": 2.288464340693963e-05,
+      "visibility": 0.09415236074710265,
+      "world_model": 1.9970475500449538
+    }
+  }
+]

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/summary.json ADDED Viewed

	@@ -0,0 +1,557 @@

+{
+  "experiment_name": "proxy_interaction_r3d_stage1_clip_seed9",
+  "device": "cuda",
+  "best_checkpoint": "/workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_clip_seed9/checkpoint_best.pt",
+  "final_train_total": 1.314924956309168,
+  "final_val_total": 1.3739404007792473,
+  "train_time_sec": 146.7574381828308,
+  "peak_gpu_memory_mb": 1915.8154296875,
+  "num_train_samples": 380,
+  "num_val_samples": 128,
+  "planner_mode": "trainable",
+  "frozen_modules": [],
+  "init_info": {
+    "path": "/workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt",
+    "loaded_keys": 461,
+    "skipped_shape_mismatch_keys": [
+      "memory.gru.weight_ih_l0",
+      "memory.gru.weight_hh_l0",
+      "memory.gru.bias_ih_l0",
+      "memory.gru.bias_hh_l0",
+      "memory.token_proj.0.weight",
+      "memory.token_proj.0.bias",
+      "memory.token_proj.1.weight",
+      "memory.token_proj.1.bias",
+      "decoder.actor_role_bias",
+      "decoder.revealer_decoder.layers.0.self_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.0.self_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.0.self_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.0.self_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.0.multihead_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.0.multihead_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.0.multihead_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.0.multihead_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.0.linear1.weight",
+      "decoder.revealer_decoder.layers.0.linear1.bias",
+      "decoder.revealer_decoder.layers.0.linear2.weight",
+      "decoder.revealer_decoder.layers.0.linear2.bias",
+      "decoder.revealer_decoder.layers.0.norm1.weight",
+      "decoder.revealer_decoder.layers.0.norm1.bias",
+      "decoder.revealer_decoder.layers.0.norm2.weight",
+      "decoder.revealer_decoder.layers.0.norm2.bias",
+      "decoder.revealer_decoder.layers.0.norm3.weight",
+      "decoder.revealer_decoder.layers.0.norm3.bias",
+      "decoder.revealer_decoder.layers.1.self_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.1.self_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.1.self_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.1.self_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.1.multihead_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.1.multihead_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.1.multihead_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.1.multihead_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.1.linear1.weight",
+      "decoder.revealer_decoder.layers.1.linear1.bias",
+      "decoder.revealer_decoder.layers.1.linear2.weight",
+      "decoder.revealer_decoder.layers.1.linear2.bias",
+      "decoder.revealer_decoder.layers.1.norm1.weight",
+      "decoder.revealer_decoder.layers.1.norm1.bias",
+      "decoder.revealer_decoder.layers.1.norm2.weight",
+      "decoder.revealer_decoder.layers.1.norm2.bias",
+      "decoder.revealer_decoder.layers.1.norm3.weight",
+      "decoder.revealer_decoder.layers.1.norm3.bias",
+      "decoder.revealer_decoder.layers.2.self_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.2.self_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.2.self_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.2.self_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.2.multihead_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.2.multihead_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.2.multihead_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.2.multihead_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.2.linear1.weight",
+      "decoder.revealer_decoder.layers.2.linear1.bias",
+      "decoder.revealer_decoder.layers.2.linear2.weight",
+      "decoder.revealer_decoder.layers.2.linear2.bias",
+      "decoder.revealer_decoder.layers.2.norm1.weight",
+      "decoder.revealer_decoder.layers.2.norm1.bias",
+      "decoder.revealer_decoder.layers.2.norm2.weight",
+      "decoder.revealer_decoder.layers.2.norm2.bias",
+      "decoder.revealer_decoder.layers.2.norm3.weight",
+      "decoder.revealer_decoder.layers.2.norm3.bias",
+      "decoder.revealer_decoder.layers.3.self_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.3.self_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.3.self_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.3.self_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.3.multihead_attn.in_proj_weight",
+      "decoder.revealer_decoder.layers.3.multihead_attn.in_proj_bias",
+      "decoder.revealer_decoder.layers.3.multihead_attn.out_proj.weight",
+      "decoder.revealer_decoder.layers.3.multihead_attn.out_proj.bias",
+      "decoder.revealer_decoder.layers.3.linear1.weight",
+      "decoder.revealer_decoder.layers.3.linear1.bias",
+      "decoder.revealer_decoder.layers.3.linear2.weight",
+      "decoder.revealer_decoder.layers.3.linear2.bias",
+      "decoder.revealer_decoder.layers.3.norm1.weight",
+      "decoder.revealer_decoder.layers.3.norm1.bias",
+      "decoder.revealer_decoder.layers.3.norm2.weight",
+      "decoder.revealer_decoder.layers.3.norm2.bias",
+      "decoder.revealer_decoder.layers.3.norm3.weight",
+      "decoder.revealer_decoder.layers.3.norm3.bias",
+      "decoder.actor_decoder.layers.0.self_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.0.self_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.0.self_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.0.self_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.0.multihead_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.0.multihead_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.0.multihead_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.0.multihead_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.0.linear1.weight",
+      "decoder.actor_decoder.layers.0.linear1.bias",
+      "decoder.actor_decoder.layers.0.linear2.weight",
+      "decoder.actor_decoder.layers.0.linear2.bias",
+      "decoder.actor_decoder.layers.0.norm1.weight",
+      "decoder.actor_decoder.layers.0.norm1.bias",
+      "decoder.actor_decoder.layers.0.norm2.weight",
+      "decoder.actor_decoder.layers.0.norm2.bias",
+      "decoder.actor_decoder.layers.0.norm3.weight",
+      "decoder.actor_decoder.layers.0.norm3.bias",
+      "decoder.actor_decoder.layers.1.self_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.1.self_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.1.self_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.1.self_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.1.multihead_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.1.multihead_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.1.multihead_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.1.multihead_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.1.linear1.weight",
+      "decoder.actor_decoder.layers.1.linear1.bias",
+      "decoder.actor_decoder.layers.1.linear2.weight",
+      "decoder.actor_decoder.layers.1.linear2.bias",
+      "decoder.actor_decoder.layers.1.norm1.weight",
+      "decoder.actor_decoder.layers.1.norm1.bias",
+      "decoder.actor_decoder.layers.1.norm2.weight",
+      "decoder.actor_decoder.layers.1.norm2.bias",
+      "decoder.actor_decoder.layers.1.norm3.weight",
+      "decoder.actor_decoder.layers.1.norm3.bias",
+      "decoder.actor_decoder.layers.2.self_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.2.self_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.2.self_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.2.self_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.2.multihead_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.2.multihead_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.2.multihead_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.2.multihead_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.2.linear1.weight",
+      "decoder.actor_decoder.layers.2.linear1.bias",
+      "decoder.actor_decoder.layers.2.linear2.weight",
+      "decoder.actor_decoder.layers.2.linear2.bias",
+      "decoder.actor_decoder.layers.2.norm1.weight",
+      "decoder.actor_decoder.layers.2.norm1.bias",
+      "decoder.actor_decoder.layers.2.norm2.weight",
+      "decoder.actor_decoder.layers.2.norm2.bias",
+      "decoder.actor_decoder.layers.2.norm3.weight",
+      "decoder.actor_decoder.layers.2.norm3.bias",
+      "decoder.actor_decoder.layers.3.self_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.3.self_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.3.self_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.3.self_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.3.multihead_attn.in_proj_weight",
+      "decoder.actor_decoder.layers.3.multihead_attn.in_proj_bias",
+      "decoder.actor_decoder.layers.3.multihead_attn.out_proj.weight",
+      "decoder.actor_decoder.layers.3.multihead_attn.out_proj.bias",
+      "decoder.actor_decoder.layers.3.linear1.weight",
+      "decoder.actor_decoder.layers.3.linear1.bias",
+      "decoder.actor_decoder.layers.3.linear2.weight",
+      "decoder.actor_decoder.layers.3.linear2.bias",
+      "decoder.actor_decoder.layers.3.norm1.weight",
+      "decoder.actor_decoder.layers.3.norm1.bias",
+      "decoder.actor_decoder.layers.3.norm2.weight",
+      "decoder.actor_decoder.layers.3.norm2.bias",
+      "decoder.actor_decoder.layers.3.norm3.weight",
+      "decoder.actor_decoder.layers.3.norm3.bias",
+      "decoder.revealer_mean.weight",
+      "decoder.revealer_mean.bias",
+      "decoder.revealer_log_std.weight",
+      "decoder.revealer_log_std.bias",
+      "decoder.actor_mean.weight",
+      "decoder.actor_mean.bias",
+      "decoder.actor_log_std.weight",
+      "decoder.actor_log_std.bias",
+      "decoder.proposal_score.0.weight",
+      "decoder.proposal_score.0.bias",
+      "decoder.proposal_score.1.weight",
+      "decoder.proposal_score.1.bias"
+    ],
+    "missing_keys": [
+      "backbone.depth_adapter.depth_proj.0.weight",
+      "backbone.depth_adapter.depth_proj.0.bias",
+      "backbone.depth_adapter.depth_proj.1.weight",
+      "backbone.depth_adapter.depth_proj.1.bias",
+      "backbone.depth_adapter.depth_proj.3.weight",
+      "backbone.depth_adapter.depth_proj.3.bias",
+      "backbone.depth_adapter.geometry_proj.0.weight",
+      "backbone.depth_adapter.geometry_proj.0.bias",
+      "backbone.depth_adapter.geometry_proj.1.weight",
+      "backbone.depth_adapter.geometry_proj.1.bias",
+      "backbone.depth_adapter.camera_proj.0.weight",
+      "backbone.depth_adapter.camera_proj.0.bias",
+      "backbone.depth_adapter.camera_proj.1.weight",
+      "backbone.depth_adapter.camera_proj.1.bias",
+      "fusion.geometry_fusion.attn.in_proj_weight",
+      "fusion.geometry_fusion.attn.in_proj_bias",
+      "fusion.geometry_fusion.attn.out_proj.weight",
+      "fusion.geometry_fusion.attn.out_proj.bias",
+      "fusion.geometry_fusion.gate.0.weight",
+      "fusion.geometry_fusion.gate.0.bias",
+      "fusion.geometry_fusion.gate.1.weight",
+      "fusion.geometry_fusion.gate.1.bias",
+      "fusion.geometry_fusion.gate.3.weight",
+      "fusion.geometry_fusion.gate.3.bias",
+      "fusion.geometry_fusion.out.0.weight",
+      "fusion.geometry_fusion.out.0.bias",
+      "fusion.geometry_fusion.out.1.weight",
+      "fusion.geometry_fusion.out.1.bias",
+      "memory.scene_memory.position_embedding",
+      "memory.scene_memory.bank_queries",
+      "memory.scene_memory.sequence_encoder.layers.0.self_attn.in_proj_weight",
+      "memory.scene_memory.sequence_encoder.layers.0.self_attn.in_proj_bias",
+      "memory.scene_memory.sequence_encoder.layers.0.self_attn.out_proj.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.self_attn.out_proj.bias",
+      "memory.scene_memory.sequence_encoder.layers.0.linear1.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.linear1.bias",
+      "memory.scene_memory.sequence_encoder.layers.0.linear2.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.linear2.bias",
+      "memory.scene_memory.sequence_encoder.layers.0.norm1.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.norm1.bias",
+      "memory.scene_memory.sequence_encoder.layers.0.norm2.weight",
+      "memory.scene_memory.sequence_encoder.layers.0.norm2.bias",
+      "memory.scene_memory.bank_attention.in_proj_weight",
+      "memory.scene_memory.bank_attention.in_proj_bias",
+      "memory.scene_memory.bank_attention.out_proj.weight",
+      "memory.scene_memory.bank_attention.out_proj.bias",
+      "memory.scene_memory.action_proj.0.weight",
+      "memory.scene_memory.action_proj.0.bias",
+      "memory.scene_memory.action_proj.1.weight",
+      "memory.scene_memory.action_proj.1.bias",
+      "memory.scene_memory.write_gate.0.weight",
+      "memory.scene_memory.write_gate.0.bias",
+      "memory.scene_memory.write_gate.1.weight",
+      "memory.scene_memory.write_gate.1.bias",
+      "memory.scene_memory.write_gate.3.weight",
+      "memory.scene_memory.write_gate.3.bias",
+      "memory.scene_memory.token_proj.0.weight",
+      "memory.scene_memory.token_proj.0.bias",
+      "memory.scene_memory.token_proj.1.weight",
+      "memory.scene_memory.token_proj.1.bias",
+      "memory.belief_memory.position_embedding",
+      "memory.belief_memory.bank_queries",
+      "memory.belief_memory.sequence_encoder.layers.0.self_attn.in_proj_weight",
+      "memory.belief_memory.sequence_encoder.layers.0.self_attn.in_proj_bias",
+      "memory.belief_memory.sequence_encoder.layers.0.self_attn.out_proj.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.self_attn.out_proj.bias",
+      "memory.belief_memory.sequence_encoder.layers.0.linear1.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.linear1.bias",
+      "memory.belief_memory.sequence_encoder.layers.0.linear2.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.linear2.bias",
+      "memory.belief_memory.sequence_encoder.layers.0.norm1.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.norm1.bias",
+      "memory.belief_memory.sequence_encoder.layers.0.norm2.weight",
+      "memory.belief_memory.sequence_encoder.layers.0.norm2.bias",
+      "memory.belief_memory.bank_attention.in_proj_weight",
+      "memory.belief_memory.bank_attention.in_proj_bias",
+      "memory.belief_memory.bank_attention.out_proj.weight",
+      "memory.belief_memory.bank_attention.out_proj.bias",
+      "memory.belief_memory.action_proj.0.weight",
+      "memory.belief_memory.action_proj.0.bias",
+      "memory.belief_memory.action_proj.1.weight",
+      "memory.belief_memory.action_proj.1.bias",
+      "memory.belief_memory.write_gate.0.weight",
+      "memory.belief_memory.write_gate.0.bias",
+      "memory.belief_memory.write_gate.1.weight",
+      "memory.belief_memory.write_gate.1.bias",
+      "memory.belief_memory.write_gate.3.weight",
+      "memory.belief_memory.write_gate.3.bias",
+      "memory.belief_memory.token_proj.0.weight",
+      "memory.belief_memory.token_proj.0.bias",
+      "memory.belief_memory.token_proj.1.weight",
+      "memory.belief_memory.token_proj.1.bias",
+      "decoder.arm_decoder.layers.0.self_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.0.self_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.0.self_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.0.self_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.0.multihead_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.0.multihead_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.0.multihead_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.0.multihead_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.0.linear1.weight",
+      "decoder.arm_decoder.layers.0.linear1.bias",
+      "decoder.arm_decoder.layers.0.linear2.weight",
+      "decoder.arm_decoder.layers.0.linear2.bias",
+      "decoder.arm_decoder.layers.0.norm1.weight",
+      "decoder.arm_decoder.layers.0.norm1.bias",
+      "decoder.arm_decoder.layers.0.norm2.weight",
+      "decoder.arm_decoder.layers.0.norm2.bias",
+      "decoder.arm_decoder.layers.0.norm3.weight",
+      "decoder.arm_decoder.layers.0.norm3.bias",
+      "decoder.arm_decoder.layers.1.self_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.1.self_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.1.self_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.1.self_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.1.multihead_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.1.multihead_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.1.multihead_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.1.multihead_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.1.linear1.weight",
+      "decoder.arm_decoder.layers.1.linear1.bias",
+      "decoder.arm_decoder.layers.1.linear2.weight",
+      "decoder.arm_decoder.layers.1.linear2.bias",
+      "decoder.arm_decoder.layers.1.norm1.weight",
+      "decoder.arm_decoder.layers.1.norm1.bias",
+      "decoder.arm_decoder.layers.1.norm2.weight",
+      "decoder.arm_decoder.layers.1.norm2.bias",
+      "decoder.arm_decoder.layers.1.norm3.weight",
+      "decoder.arm_decoder.layers.1.norm3.bias",
+      "decoder.arm_decoder.layers.2.self_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.2.self_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.2.self_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.2.self_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.2.multihead_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.2.multihead_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.2.multihead_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.2.multihead_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.2.linear1.weight",
+      "decoder.arm_decoder.layers.2.linear1.bias",
+      "decoder.arm_decoder.layers.2.linear2.weight",
+      "decoder.arm_decoder.layers.2.linear2.bias",
+      "decoder.arm_decoder.layers.2.norm1.weight",
+      "decoder.arm_decoder.layers.2.norm1.bias",
+      "decoder.arm_decoder.layers.2.norm2.weight",
+      "decoder.arm_decoder.layers.2.norm2.bias",
+      "decoder.arm_decoder.layers.2.norm3.weight",
+      "decoder.arm_decoder.layers.2.norm3.bias",
+      "decoder.arm_decoder.layers.3.self_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.3.self_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.3.self_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.3.self_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.3.multihead_attn.in_proj_weight",
+      "decoder.arm_decoder.layers.3.multihead_attn.in_proj_bias",
+      "decoder.arm_decoder.layers.3.multihead_attn.out_proj.weight",
+      "decoder.arm_decoder.layers.3.multihead_attn.out_proj.bias",
+      "decoder.arm_decoder.layers.3.linear1.weight",
+      "decoder.arm_decoder.layers.3.linear1.bias",
+      "decoder.arm_decoder.layers.3.linear2.weight",
+      "decoder.arm_decoder.layers.3.linear2.bias",
+      "decoder.arm_decoder.layers.3.norm1.weight",
+      "decoder.arm_decoder.layers.3.norm1.bias",
+      "decoder.arm_decoder.layers.3.norm2.weight",
+      "decoder.arm_decoder.layers.3.norm2.bias",
+      "decoder.arm_decoder.layers.3.norm3.weight",
+      "decoder.arm_decoder.layers.3.norm3.bias",
+      "decoder.arm_identity.weight",
+      "decoder.phase_adapter.weight",
+      "decoder.phase_adapter.bias",
+      "decoder.role_adapter.weight",
+      "decoder.role_adapter.bias",
+      "decoder.context_proj.0.weight",
+      "decoder.context_proj.0.bias",
+      "decoder.context_proj.1.weight",
+      "decoder.context_proj.1.bias",
+      "decoder.arm_head.0.weight",
+      "decoder.arm_head.0.bias",
+      "decoder.arm_head.1.weight",
+      "decoder.arm_head.1.bias",
+      "decoder.arm_mean.weight",
+      "decoder.arm_mean.bias",
+      "decoder.arm_log_std.weight",
+      "decoder.arm_log_std.bias",
+      "decoder.proposal_mode_head.0.weight",
+      "decoder.proposal_mode_head.0.bias",
+      "decoder.proposal_mode_head.1.weight",
+      "decoder.proposal_mode_head.1.bias",
+      "decoder.proposal_mode_head.3.weight",
+      "decoder.proposal_mode_head.3.bias",
+      "decoder.proposal_mode_embeddings.weight",
+      "decoder.proposal_slot_embeddings.weight",
+      "decoder.mode_residual_heads.0.0.weight",
+      "decoder.mode_residual_heads.0.0.bias",
+      "decoder.mode_residual_heads.0.1.weight",
+      "decoder.mode_residual_heads.0.1.bias",
+      "decoder.mode_residual_heads.0.3.weight",
+      "decoder.mode_residual_heads.0.3.bias",
+      "decoder.mode_residual_heads.1.0.weight",
+      "decoder.mode_residual_heads.1.0.bias",
+      "decoder.mode_residual_heads.1.1.weight",
+      "decoder.mode_residual_heads.1.1.bias",
+      "decoder.mode_residual_heads.1.3.weight",
+      "decoder.mode_residual_heads.1.3.bias",
+      "decoder.mode_residual_heads.2.0.weight",
+      "decoder.mode_residual_heads.2.0.bias",
+      "decoder.mode_residual_heads.2.1.weight",
+      "decoder.mode_residual_heads.2.1.bias",
+      "decoder.mode_residual_heads.2.3.weight",
+      "decoder.mode_residual_heads.2.3.bias",
+      "decoder.mode_residual_heads.3.0.weight",
+      "decoder.mode_residual_heads.3.0.bias",
+      "decoder.mode_residual_heads.3.1.weight",
+      "decoder.mode_residual_heads.3.1.bias",
+      "decoder.mode_residual_heads.3.3.weight",
+      "decoder.mode_residual_heads.3.3.bias",
+      "decoder.mode_residual_heads.4.0.weight",
+      "decoder.mode_residual_heads.4.0.bias",
+      "decoder.mode_residual_heads.4.1.weight",
+      "decoder.mode_residual_heads.4.1.bias",
+      "decoder.mode_residual_heads.4.3.weight",
+      "decoder.mode_residual_heads.4.3.bias",
+      "decoder.mode_residual_heads.5.0.weight",
+      "decoder.mode_residual_heads.5.0.bias",
+      "decoder.mode_residual_heads.5.1.weight",
+      "decoder.mode_residual_heads.5.1.bias",
+      "decoder.mode_residual_heads.5.3.weight",
+      "decoder.mode_residual_heads.5.3.bias",
+      "decoder.slot_delta.0.weight",
+      "decoder.slot_delta.0.bias",
+      "decoder.slot_delta.1.weight",
+      "decoder.slot_delta.1.bias",
+      "decoder.slot_delta.3.weight",
+      "decoder.slot_delta.3.bias",
+      "decoder.proposal_score.0.weight",
+      "decoder.proposal_score.0.bias",
+      "decoder.proposal_score.1.weight",
+      "decoder.proposal_score.1.bias",
+      "decoder.proposal_score.3.weight",
+      "decoder.proposal_score.3.bias",
+      "elastic_state_head.interaction_queries",
+      "elastic_state_head.interaction_attention.in_proj_weight",
+      "elastic_state_head.interaction_attention.in_proj_bias",
+      "elastic_state_head.interaction_attention.out_proj.weight",
+      "elastic_state_head.interaction_attention.out_proj.bias",
+      "elastic_state_head.interaction_mlp.0.weight",
+      "elastic_state_head.interaction_mlp.0.bias",
+      "elastic_state_head.interaction_mlp.1.weight",
+      "elastic_state_head.interaction_mlp.1.bias",
+      "elastic_state_head.interaction_mlp.3.weight",
+      "elastic_state_head.interaction_mlp.3.bias",
+      "elastic_state_head.decoder.field_queries",
+      "elastic_state_head.decoder.field_attention.in_proj_weight",
+      "elastic_state_head.decoder.field_attention.in_proj_bias",
+      "elastic_state_head.decoder.field_attention.out_proj.weight",
+      "elastic_state_head.decoder.field_attention.out_proj.bias",
+      "elastic_state_head.decoder.field_mlp.0.weight",
+      "elastic_state_head.decoder.field_mlp.0.bias",
+      "elastic_state_head.decoder.field_mlp.1.weight",
+      "elastic_state_head.decoder.field_mlp.1.bias",
+      "elastic_state_head.decoder.field_mlp.3.weight",
+      "elastic_state_head.decoder.field_mlp.3.bias",
+      "elastic_state_head.decoder.summary_proj.0.weight",
+      "elastic_state_head.decoder.summary_proj.0.bias",
+      "elastic_state_head.decoder.summary_proj.1.weight",
+      "elastic_state_head.decoder.summary_proj.1.bias",
+      "elastic_state_head.decoder.phase_head.0.weight",
+      "elastic_state_head.decoder.phase_head.0.bias",
+      "elastic_state_head.decoder.phase_head.1.weight",
+      "elastic_state_head.decoder.phase_head.1.bias",
+      "elastic_state_head.decoder.phase_head.3.weight",
+      "elastic_state_head.decoder.phase_head.3.bias",
+      "elastic_state_head.decoder.arm_role_head.0.weight",
+      "elastic_state_head.decoder.arm_role_head.0.bias",
+      "elastic_state_head.decoder.arm_role_head.1.weight",
+      "elastic_state_head.decoder.arm_role_head.1.bias",
+      "elastic_state_head.decoder.arm_role_head.3.weight",
+      "elastic_state_head.decoder.arm_role_head.3.bias",
+      "elastic_state_head.decoder.arm_identity.weight",
+      "elastic_state_head.decoder.support_mode.0.weight",
+      "elastic_state_head.decoder.support_mode.0.bias",
+      "elastic_state_head.decoder.support_mode.1.weight",
+      "elastic_state_head.decoder.support_mode.1.bias",
+      "elastic_state_head.decoder.support_mode.3.weight",
+      "elastic_state_head.decoder.support_mode.3.bias",
+      "elastic_state_head.decoder.access_field.weight",
+      "elastic_state_head.decoder.access_field.bias",
+      "elastic_state_head.decoder.target_belief_field.weight",
+      "elastic_state_head.decoder.target_belief_field.bias",
+      "elastic_state_head.decoder.visibility_field.weight",
+      "elastic_state_head.decoder.visibility_field.bias",
+      "elastic_state_head.decoder.clearance_field.weight",
+      "elastic_state_head.decoder.clearance_field.bias",
+      "elastic_state_head.decoder.occluder_contact_field.weight",
+      "elastic_state_head.decoder.occluder_contact_field.bias",
+      "elastic_state_head.decoder.grasp_affordance_field.weight",
+      "elastic_state_head.decoder.grasp_affordance_field.bias",
+      "elastic_state_head.decoder.support_stability_field.weight",
+      "elastic_state_head.decoder.support_stability_field.bias",
+      "elastic_state_head.decoder.persistence_field.weight",
+      "elastic_state_head.decoder.persistence_field.bias",
+      "elastic_state_head.decoder.reocclusion_field.weight",
+      "elastic_state_head.decoder.reocclusion_field.bias",
+      "elastic_state_head.decoder.disturbance_field.weight",
+      "elastic_state_head.decoder.disturbance_field.bias",
+      "elastic_state_head.decoder.uncertainty_field.weight",
+      "elastic_state_head.decoder.uncertainty_field.bias",
+      "elastic_state_head.decoder.reocclusion_head.0.weight",
+      "elastic_state_head.decoder.reocclusion_head.0.bias",
+      "elastic_state_head.decoder.reocclusion_head.1.weight",
+      "elastic_state_head.decoder.reocclusion_head.1.bias",
+      "elastic_state_head.decoder.reocclusion_head.3.weight",
+      "elastic_state_head.decoder.reocclusion_head.3.bias",
+      "world_model.state_encoder.0.weight",
+      "world_model.state_encoder.0.bias",
+      "world_model.state_encoder.1.weight",
+      "world_model.state_encoder.1.bias",
+      "world_model.scene_memory_proj.0.weight",
+      "world_model.scene_memory_proj.0.bias",
+      "world_model.scene_memory_proj.1.weight",
+      "world_model.scene_memory_proj.1.bias",
+      "world_model.belief_memory_proj.0.weight",
+      "world_model.belief_memory_proj.0.bias",
+      "world_model.belief_memory_proj.1.weight",
+      "world_model.belief_memory_proj.1.bias",
+      "world_model.action_encoder.0.weight",
+      "world_model.action_encoder.0.bias",
+      "world_model.action_encoder.1.weight",
+      "world_model.action_encoder.1.bias",
+      "world_model.transition.weight_ih",
+      "world_model.transition.weight_hh",
+      "world_model.transition.bias_ih",
+      "world_model.transition.bias_hh",
+      "world_model.scene_memory_update.weight",
+      "world_model.scene_memory_update.bias",
+      "world_model.belief_memory_update.weight",
+      "world_model.belief_memory_update.bias",
+      "world_model.compact_decoder.weight",
+      "world_model.compact_decoder.bias",
+      "world_model.target_belief_head.weight",
+      "world_model.target_belief_head.bias",
+      "world_model.visibility_head.weight",
+      "world_model.visibility_head.bias",
+      "world_model.clearance_head.weight",
+      "world_model.clearance_head.bias",
+      "world_model.occluder_contact_head.weight",
+      "world_model.occluder_contact_head.bias",
+      "world_model.grasp_affordance_head.weight",
+      "world_model.grasp_affordance_head.bias",
+      "world_model.support_stability_head.weight",
+      "world_model.support_stability_head.bias",
+      "world_model.persistence_head.weight",
+      "world_model.persistence_head.bias",
+      "world_model.reocclusion_head.weight",
+      "world_model.reocclusion_head.bias",
+      "world_model.disturbance_head.weight",
+      "world_model.disturbance_head.bias",
+      "world_model.uncertainty_head.weight",
+      "world_model.uncertainty_head.bias",
+      "world_model.access_head.weight",
+      "world_model.access_head.bias",
+      "planner.residual.trunk.0.weight",
+      "planner.residual.trunk.0.bias",
+      "planner.residual.trunk.1.weight",
+      "planner.residual.trunk.1.bias",
+      "planner.residual.trunk.3.weight",
+      "planner.residual.trunk.3.bias",
+      "planner.residual.success_head.weight",
+      "planner.residual.success_head.bias",
+      "planner.residual.risk_head.weight",
+      "planner.residual.risk_head.bias",
+      "planner.residual.residual_head.weight",
+      "planner.residual.residual_head.bias"
+    ],
+    "unexpected_keys": []
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/benchmark_full/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "full": {
+    "per_task_success": {
+      "foliage_proxy": 0.4583333333333333,
+      "bag_proxy": 0.5833333333333334,
+      "cloth_proxy": 0.6666666666666666
+    },
+    "mean_success": 0.5694444444444445,
+    "visibility_integral": 32.2005988392565,
+    "corridor_availability": 0.8664570152759552,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 2.1903364318709135,
+    "disturbance_cost": 0.35011103795841336
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/benchmark_full/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## full
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/checkpoint_best.pt
+- mean_success: 0.569
+- visibility_integral: 32.201
+- corridor_availability: 0.866
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 2.190
+- disturbance_cost: 0.350
+- foliage_proxy_success: 0.458
+- bag_proxy_success: 0.583
+- cloth_proxy_success: 0.667

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/benchmark_no_planner/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "full": {
+    "per_task_success": {
+      "foliage_proxy": 0.4166666666666667,
+      "bag_proxy": 0.5833333333333334,
+      "cloth_proxy": 0.6666666666666666
+    },
+    "mean_success": 0.5555555555555555,
+    "visibility_integral": 33.31703626612822,
+    "corridor_availability": 0.886079938047462,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 2.1836884579143008,
+    "disturbance_cost": 0.3696938648612963
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/benchmark_no_planner/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## full
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/checkpoint_best.pt
+- mean_success: 0.556
+- visibility_integral: 33.317
+- corridor_availability: 0.886
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 2.184
+- disturbance_cost: 0.370
+- foliage_proxy_success: 0.417
+- bag_proxy_success: 0.583
+- cloth_proxy_success: 0.667

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/benchmark_no_role_symmetry/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "full": {
+    "per_task_success": {
+      "foliage_proxy": 0.4583333333333333,
+      "bag_proxy": 0.5833333333333334,
+      "cloth_proxy": 0.6666666666666666
+    },
+    "mean_success": 0.5694444444444445,
+    "visibility_integral": 32.571378606888985,
+    "corridor_availability": 0.8744470203916231,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 2.249059588784357,
+    "disturbance_cost": 0.34120469799058306
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/benchmark_no_role_symmetry/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## full
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/checkpoint_best.pt
+- mean_success: 0.569
+- visibility_integral: 32.571
+- corridor_availability: 0.874
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 2.249
+- disturbance_cost: 0.341
+- foliage_proxy_success: 0.458
+- bag_proxy_success: 0.583
+- cloth_proxy_success: 0.667

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/config_resolved.yaml ADDED Viewed

	@@ -0,0 +1,147 @@

+experiment_name: proxy_interaction_r3d_stage1_dummy_seed13
+output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
+device: cuda
+seed: 13
+data:
+  proxies:
+  - foliage_proxy
+  - bag_proxy
+  - cloth_proxy
+  resolution: 96
+  dataset_version: reveal_proxy_v6_rgbd_elastic_state
+  train_episodes_per_proxy: 48
+  val_episodes_per_proxy: 16
+  train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_v6_rgbd_stage1_dummy_seed13.pt
+  val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_v6_rgbd_stage1_dummy_seed13.pt
+  rebuild_dataset: false
+  chunk_horizon: 8
+  rollout_horizon: 5
+  history_steps: 6
+  planner_candidates: 8
+  seed: 13
+optim:
+  epochs: 4
+  batch_size: 16
+  num_workers: 4
+  lr: 0.001
+  weight_decay: 0.0001
+trainer:
+  policy_type: elastic_reveal
+  use_bf16: false
+  grad_clip_norm: 1.0
+  freeze_backbone: true
+  gradient_checkpointing: false
+  plan_during_train: true
+  plan_during_eval: true
+  support_mode_conditioning: true
+  planner_mode: trainable
+  use_depth: false
+  use_world_model: true
+  use_role_tokens: true
+  compute_equivariance_probe: true
+policy:
+  backbone:
+    model_name: openai/clip-vit-base-patch32
+    hidden_dim: 192
+    max_text_tokens: 32
+    freeze_backbone: true
+    gradient_checkpointing: false
+    use_dummy_backbone: true
+  fusion:
+    hidden_dim: 192
+    num_cameras: 3
+    num_layers: 2
+    num_heads: 4
+    ff_dim: 384
+    dropout: 0.1
+    proprio_dim: 32
+    proprio_tokens: 1
+  memory:
+    hidden_dim: 192
+    action_dim: 14
+    history_steps: 6
+    scene_history_steps: 3
+    belief_history_steps: 8
+    num_layers: 2
+    dropout: 0.1
+    memory_bank_size: 4
+    scene_bank_size: 2
+    belief_bank_size: 2
+    num_heads: 4
+    max_history_steps: 8
+  decoder:
+    hidden_dim: 192
+    num_heads: 4
+    num_layers: 2
+    ff_dim: 384
+    dropout: 0.1
+    chunk_size: 8
+    action_dim: 14
+    arm_action_dim: 7
+    num_candidates: 8
+    num_phases: 5
+    num_arm_roles: 4
+    num_proposal_modes: 6
+    planner_top_k: 4
+  reveal_head:
+    hidden_dim: 192
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    belief_map_size: 32
+    field_size: 16
+    num_heads: 4
+    predict_belief_map: true
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+  world_model:
+    hidden_dim: 192
+    action_dim: 14
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    field_size: 16
+    num_heads: 4
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+    belief_map_size: 32
+    predict_belief_map: true
+    scene_bank_size: 2
+    belief_bank_size: 2
+  planner:
+    hidden_dim: 192
+    num_candidates: 8
+    action_dim: 14
+    num_support_modes: 3
+    utility_margin: 0.1
+    num_heads: 4
+    num_layers: 2
+    num_phases: 5
+    num_arm_roles: 4
+    top_k: 4
+loss_weights:
+  action: 1.0
+  phase: 0.15
+  arm_role: 0.2
+  support_mode: 0.15
+  corridor: 0.2
+  persistence: 0.1
+  disturbance: 0.1
+  world_model: 0.25
+  belief: 0.05
+  visibility: 0.05
+  clearance: 0.05
+  support_stability: 0.05
+  reocclusion: 0.05
+  occluder_contact: 0.05
+  grasp_affordance: 0.05
+  planner_success: 0.2
+  planner_risk: 0.1
+  planner_ranking: 0.1
+  proposal_reconstruction: 0.2
+  proposal_success: 0.1
+  proposal_ranking: 0.1
+  proposal_diversity: 0.05
+  role_swap_consistency: 0.05

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/diagnostics_full/proxy_diagnostics.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "planner_top1_accuracy": 0.2595419847328244,
+  "planner_regret": 0.015185066498816013,
+  "planner_score_utility_spearman": 0.25190839171409607,
+  "risk_calibration_mse": 0.011332111433148384,
+  "role_collapse_rate": 0.0,
+  "proposal_diversity": 0.02456846833229065,
+  "left_right_equivariance_error": 0.007538194466820534,
+  "belief_calibration_brier": 0.0055354926735162735,
+  "reocclusion_calibration_brier": 0.2274838089942932,
+  "support_stability_mae": 0.030257930979132652,
+  "clearance_auc": 0.7414014153848468,
+  "memory_write_rate": 0.0,
+  "memory_saturation": 0.7680174112319946,
+  "num_samples": 131
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/metrics.json ADDED Viewed

	@@ -0,0 +1,230 @@

+[
+  {
+    "epoch": 0,
+    "train": {
+      "action": 0.029530804604291916,
+      "arm_role": 0.19113596672893132,
+      "belief": 0.19201900158077478,
+      "clearance": 0.1937584774568677,
+      "corridor": 0.30155759242673713,
+      "disturbance": 0.018230090441647917,
+      "grasp_affordance": 0.1115249302238226,
+      "occluder_contact": 0.29577948339283466,
+      "persistence": 5.046393771966298,
+      "phase": 0.835017109910647,
+      "planner_ranking": 0.6733469751973947,
+      "planner_risk": 0.04033496890527507,
+      "planner_success": 0.6355331862966219,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.276770144701004,
+      "proposal_reconstruction": 0.07184042579804857,
+      "proposal_success": 0.6676094954212507,
+      "reocclusion": 0.6988904004295667,
+      "role_swap_consistency": 0.0006935761872834215,
+      "support_mode": 0.7387049297491709,
+      "support_stability": 0.22416748199611902,
+      "total": 2.4212693075339,
+      "uncertainty": 0.32931591259936493,
+      "visibility": 0.23356754829486212,
+      "world_model": 4.170340110858281
+    },
+    "val": {
+      "action": 0.023605089427696332,
+      "arm_role": 8.891185360779572e-05,
+      "belief": 0.112466166416804,
+      "clearance": 0.08774211009343465,
+      "corridor": 0.2502693798806932,
+      "disturbance": 0.0037313879001885653,
+      "grasp_affordance": 0.013532540657454066,
+      "occluder_contact": 0.2236137886842092,
+      "persistence": 4.796973652309841,
+      "phase": 0.6506193346447415,
+      "planner_ranking": 0.45240074396133423,
+      "planner_risk": 0.012336155710120996,
+      "planner_success": 0.6348234679963853,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1647081640031602,
+      "proposal_reconstruction": 0.06623147221075164,
+      "proposal_success": 0.6723773082097372,
+      "reocclusion": 0.6799028648270501,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.6129622724321153,
+      "support_stability": 0.14574629151158863,
+      "total": 1.9533665710025363,
+      "uncertainty": 0.057104989886283875,
+      "visibility": 0.09962501211298837,
+      "world_model": 3.08394538031684
+    }
+  },
+  {
+    "epoch": 1,
+    "train": {
+      "action": 0.02052135338696341,
+      "arm_role": 0.00010673219821910607,
+      "belief": 0.11743779480457306,
+      "clearance": 0.09043452050536871,
+      "corridor": 0.24632801488041878,
+      "disturbance": 0.003475519949764324,
+      "grasp_affordance": 0.01625332736875862,
+      "occluder_contact": 0.2240921917061011,
+      "persistence": 4.695922573407491,
+      "phase": 0.49508154888947803,
+      "planner_ranking": 0.14279444872712097,
+      "planner_risk": 0.0141817982463787,
+      "planner_success": 0.593176061908404,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.165678009390831,
+      "proposal_reconstruction": 0.06292749894782901,
+      "proposal_success": 0.674570898214976,
+      "reocclusion": 0.3844434078782797,
+      "role_swap_consistency": 0.00039524554207067314,
+      "support_mode": 0.17358588459561966,
+      "support_stability": 0.1374168156956633,
+      "total": 1.6440163105726242,
+      "uncertainty": 0.047071967429171004,
+      "visibility": 0.11256152174125116,
+      "world_model": 2.4736096411943436
+    },
+    "val": {
+      "action": 0.020492848422792222,
+      "arm_role": 0.0002776960156754487,
+      "belief": 0.1081986419028706,
+      "clearance": 0.08335375868611866,
+      "corridor": 0.24787565734651354,
+      "disturbance": 0.0022675159141524797,
+      "grasp_affordance": 0.012290253303945065,
+      "occluder_contact": 0.21959979832172394,
+      "persistence": 4.647055625915527,
+      "phase": 0.4316861795054542,
+      "planner_ranking": 0.06341143821676572,
+      "planner_risk": 0.015357115098999606,
+      "planner_success": 0.5689369605647193,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1283477942148845,
+      "proposal_reconstruction": 0.06308732968237665,
+      "proposal_success": 0.6809348861376444,
+      "reocclusion": 0.2748950504594379,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.0006280758987284369,
+      "support_stability": 0.14622381826241812,
+      "total": 1.6025353935029771,
+      "uncertainty": 0.02438033703300688,
+      "visibility": 0.10466726124286652,
+      "world_model": 2.558868553903368
+    }
+  },
+  {
+    "epoch": 2,
+    "train": {
+      "action": 0.01646478761297961,
+      "arm_role": 9.377782756322024e-05,
+      "belief": 0.10991635639220476,
+      "clearance": 0.0843405183404684,
+      "corridor": 0.2701566057900588,
+      "disturbance": 0.0031300995663817353,
+      "grasp_affordance": 0.012393822447241595,
+      "occluder_contact": 0.21479063170651594,
+      "persistence": 2.6339182580510774,
+      "phase": 0.431367311005791,
+      "planner_ranking": 0.06486702508603533,
+      "planner_risk": 0.013548698586722216,
+      "planner_success": 0.5643768397470316,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1353335281213124,
+      "proposal_reconstruction": 0.05951391921068231,
+      "proposal_success": 0.6731756230195364,
+      "reocclusion": 0.2623978331685066,
+      "role_swap_consistency": 0.00040521422973445925,
+      "support_mode": 0.000605581031171217,
+      "support_stability": 0.1400139912342032,
+      "total": 1.2923575937747955,
+      "uncertainty": 0.02004621450517637,
+      "visibility": 0.10328224146117766,
+      "world_model": 2.1331751296917596
+    },
+    "val": {
+      "action": 0.018090524814195104,
+      "arm_role": 4.204427063490989e-05,
+      "belief": 0.11348766502406862,
+      "clearance": 0.0778748012251324,
+      "corridor": 0.24816315703921848,
+      "disturbance": 0.0018734507805978258,
+      "grasp_affordance": 0.008446878753602505,
+      "occluder_contact": 0.2068953894906574,
+      "persistence": 1.9170836640728846,
+      "phase": 0.4777056227127711,
+      "planner_ranking": 0.07497243583202362,
+      "planner_risk": 0.012007931971715556,
+      "planner_success": 0.5846167008082072,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1227490504582722,
+      "proposal_reconstruction": 0.06178469873136944,
+      "proposal_success": 0.6768591006596884,
+      "reocclusion": 0.2698347626460923,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.0005942495643264718,
+      "support_stability": 0.14820611890819338,
+      "total": 1.2714158693949382,
+      "uncertainty": 0.004030831908393238,
+      "visibility": 0.09794799155659145,
+      "world_model": 2.303717931111654
+    }
+  },
+  {
+    "epoch": 3,
+    "train": {
+      "action": 0.015296258614398539,
+      "arm_role": 9.897743439069018e-05,
+      "belief": 0.10741911331812541,
+      "clearance": 0.07931565772742033,
+      "corridor": 0.23081608302891254,
+      "disturbance": 0.00287542298125724,
+      "grasp_affordance": 0.008955261165586611,
+      "occluder_contact": 0.21085621416568756,
+      "persistence": 1.6830786913633347,
+      "phase": 0.4407324629525344,
+      "planner_ranking": 0.053573422211532794,
+      "planner_risk": 0.011835894741428396,
+      "planner_success": 0.5389373525977135,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1375357458988826,
+      "proposal_reconstruction": 0.05875217309221625,
+      "proposal_success": 0.669308491051197,
+      "reocclusion": 0.26737124752253294,
+      "role_swap_consistency": 0.00044258072254403186,
+      "support_mode": 0.0058784369854644565,
+      "support_stability": 0.13682511821389198,
+      "total": 1.1672432621320088,
+      "uncertainty": 0.007140855586233859,
+      "visibility": 0.094703309237957,
+      "world_model": 2.072191367546717
+    },
+    "val": {
+      "action": 0.016218292733861342,
+      "arm_role": 0.00022501617463098632,
+      "belief": 0.10660513407654232,
+      "clearance": 0.07916852169566685,
+      "corridor": 0.23598399923907387,
+      "disturbance": 0.0013176489026389187,
+      "grasp_affordance": 0.009249631315469742,
+      "occluder_contact": 0.2084801279836231,
+      "persistence": 1.9978744321399264,
+      "phase": 0.46462951434983146,
+      "planner_ranking": 0.04140180618398719,
+      "planner_risk": 0.011076963868820004,
+      "planner_success": 0.5154120292928484,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1469912661446466,
+      "proposal_reconstruction": 0.05962582967347569,
+      "proposal_success": 0.6495795779758029,
+      "reocclusion": 0.2503652158710692,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.0004595977985041423,
+      "support_stability": 0.14600716531276703,
+      "total": 1.2128634585274591,
+      "uncertainty": 0.007759603775209851,
+      "visibility": 0.09225249456034766,
+      "world_model": 2.1404969029956393
+    }
+  }
+]

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/summary.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "experiment_name": "proxy_interaction_r3d_stage1_dummy_seed13",
+  "device": "cuda",
+  "best_checkpoint": "/workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed13/checkpoint_best.pt",
+  "final_train_total": 1.1672432621320088,
+  "final_val_total": 1.2128634585274591,
+  "train_time_sec": 18.091050624847412,
+  "peak_gpu_memory_mb": 631.1953125,
+  "num_train_samples": 380,
+  "num_val_samples": 131,
+  "planner_mode": "trainable",
+  "frozen_modules": [],
+  "init_info": null
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/benchmark_full/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "full": {
+    "per_task_success": {
+      "foliage_proxy": 0.4166666666666667,
+      "bag_proxy": 0.625,
+      "cloth_proxy": 0.6666666666666666
+    },
+    "mean_success": 0.5694444444444445,
+    "visibility_integral": 32.801942747500206,
+    "corridor_availability": 0.8877548724412918,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 1.4711664057066363,
+    "disturbance_cost": 0.37882790300581193
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/benchmark_full/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## full
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/checkpoint_best.pt
+- mean_success: 0.569
+- visibility_integral: 32.802
+- corridor_availability: 0.888
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 1.471
+- disturbance_cost: 0.379
+- foliage_proxy_success: 0.417
+- bag_proxy_success: 0.625
+- cloth_proxy_success: 0.667

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/benchmark_no_planner/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "full": {
+    "per_task_success": {
+      "foliage_proxy": 0.4166666666666667,
+      "bag_proxy": 0.5833333333333334,
+      "cloth_proxy": 0.625
+    },
+    "mean_success": 0.5416666666666666,
+    "visibility_integral": 34.428366212381256,
+    "corridor_availability": 0.8909231291876899,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 1.4917179537341767,
+    "disturbance_cost": 0.39409097459995085
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/benchmark_no_planner/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## full
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/checkpoint_best.pt
+- mean_success: 0.542
+- visibility_integral: 34.428
+- corridor_availability: 0.891
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 1.492
+- disturbance_cost: 0.394
+- foliage_proxy_success: 0.417
+- bag_proxy_success: 0.583
+- cloth_proxy_success: 0.625

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/benchmark_no_role_symmetry/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "full": {
+    "per_task_success": {
+      "foliage_proxy": 0.4166666666666667,
+      "bag_proxy": 0.625,
+      "cloth_proxy": 0.6666666666666666
+    },
+    "mean_success": 0.5694444444444445,
+    "visibility_integral": 33.27109728753567,
+    "corridor_availability": 0.8943836614489555,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 1.488106187582016,
+    "disturbance_cost": 0.3667886131960485
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/benchmark_no_role_symmetry/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## full
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/checkpoint_best.pt
+- mean_success: 0.569
+- visibility_integral: 33.271
+- corridor_availability: 0.894
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 1.488
+- disturbance_cost: 0.367
+- foliage_proxy_success: 0.417
+- bag_proxy_success: 0.625
+- cloth_proxy_success: 0.667

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/config_resolved.yaml ADDED Viewed

	@@ -0,0 +1,147 @@

+experiment_name: proxy_interaction_r3d_stage1_dummy_seed14
+output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
+device: cuda
+seed: 14
+data:
+  proxies:
+  - foliage_proxy
+  - bag_proxy
+  - cloth_proxy
+  resolution: 96
+  dataset_version: reveal_proxy_v6_rgbd_elastic_state
+  train_episodes_per_proxy: 48
+  val_episodes_per_proxy: 16
+  train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_v6_rgbd_stage1_dummy_seed14.pt
+  val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_v6_rgbd_stage1_dummy_seed14.pt
+  rebuild_dataset: false
+  chunk_horizon: 8
+  rollout_horizon: 5
+  history_steps: 6
+  planner_candidates: 8
+  seed: 14
+optim:
+  epochs: 4
+  batch_size: 16
+  num_workers: 4
+  lr: 0.001
+  weight_decay: 0.0001
+trainer:
+  policy_type: elastic_reveal
+  use_bf16: false
+  grad_clip_norm: 1.0
+  freeze_backbone: true
+  gradient_checkpointing: false
+  plan_during_train: true
+  plan_during_eval: true
+  support_mode_conditioning: true
+  planner_mode: trainable
+  use_depth: false
+  use_world_model: true
+  use_role_tokens: true
+  compute_equivariance_probe: true
+policy:
+  backbone:
+    model_name: openai/clip-vit-base-patch32
+    hidden_dim: 192
+    max_text_tokens: 32
+    freeze_backbone: true
+    gradient_checkpointing: false
+    use_dummy_backbone: true
+  fusion:
+    hidden_dim: 192
+    num_cameras: 3
+    num_layers: 2
+    num_heads: 4
+    ff_dim: 384
+    dropout: 0.1
+    proprio_dim: 32
+    proprio_tokens: 1
+  memory:
+    hidden_dim: 192
+    action_dim: 14
+    history_steps: 6
+    scene_history_steps: 3
+    belief_history_steps: 8
+    num_layers: 2
+    dropout: 0.1
+    memory_bank_size: 4
+    scene_bank_size: 2
+    belief_bank_size: 2
+    num_heads: 4
+    max_history_steps: 8
+  decoder:
+    hidden_dim: 192
+    num_heads: 4
+    num_layers: 2
+    ff_dim: 384
+    dropout: 0.1
+    chunk_size: 8
+    action_dim: 14
+    arm_action_dim: 7
+    num_candidates: 8
+    num_phases: 5
+    num_arm_roles: 4
+    num_proposal_modes: 6
+    planner_top_k: 4
+  reveal_head:
+    hidden_dim: 192
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    belief_map_size: 32
+    field_size: 16
+    num_heads: 4
+    predict_belief_map: true
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+  world_model:
+    hidden_dim: 192
+    action_dim: 14
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    field_size: 16
+    num_heads: 4
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+    belief_map_size: 32
+    predict_belief_map: true
+    scene_bank_size: 2
+    belief_bank_size: 2
+  planner:
+    hidden_dim: 192
+    num_candidates: 8
+    action_dim: 14
+    num_support_modes: 3
+    utility_margin: 0.1
+    num_heads: 4
+    num_layers: 2
+    num_phases: 5
+    num_arm_roles: 4
+    top_k: 4
+loss_weights:
+  action: 1.0
+  phase: 0.15
+  arm_role: 0.2
+  support_mode: 0.15
+  corridor: 0.2
+  persistence: 0.1
+  disturbance: 0.1
+  world_model: 0.25
+  belief: 0.05
+  visibility: 0.05
+  clearance: 0.05
+  support_stability: 0.05
+  reocclusion: 0.05
+  occluder_contact: 0.05
+  grasp_affordance: 0.05
+  planner_success: 0.2
+  planner_risk: 0.1
+  planner_ranking: 0.1
+  proposal_reconstruction: 0.2
+  proposal_success: 0.1
+  proposal_ranking: 0.1
+  proposal_diversity: 0.05
+  role_swap_consistency: 0.05

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/diagnostics_full/proxy_diagnostics.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "planner_top1_accuracy": 0.2846153846153846,
+  "planner_regret": 0.014314642176032066,
+  "planner_score_utility_spearman": 0.2153846174478531,
+  "risk_calibration_mse": 0.010775926522910595,
+  "role_collapse_rate": 0.0,
+  "proposal_diversity": 0.02589959278702736,
+  "left_right_equivariance_error": 0.008901518605211201,
+  "belief_calibration_brier": 0.005614265333861113,
+  "reocclusion_calibration_brier": 0.28406235575675964,
+  "support_stability_mae": 0.025872904807329178,
+  "clearance_auc": 0.5220335124994485,
+  "memory_write_rate": 0.0,
+  "memory_saturation": 0.7309081554412842,
+  "num_samples": 130
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/metrics.json ADDED Viewed

	@@ -0,0 +1,230 @@

+[
+  {
+    "epoch": 0,
+    "train": {
+      "action": 0.033738364155093827,
+      "arm_role": 0.2658534389071671,
+      "belief": 0.1663714082290729,
+      "clearance": 0.1995344152674079,
+      "corridor": 0.2937144724031289,
+      "disturbance": 0.01641949706633265,
+      "grasp_affordance": 0.07253360034277041,
+      "occluder_contact": 0.262634892637531,
+      "persistence": 5.348720759153366,
+      "phase": 0.9128680676221848,
+      "planner_ranking": 0.7161665211121241,
+      "planner_risk": 0.03542382351588458,
+      "planner_success": 0.6313644871115685,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.328845535715421,
+      "proposal_reconstruction": 0.07508338304857413,
+      "proposal_success": 0.6797524491945902,
+      "reocclusion": 0.7106639867027601,
+      "role_swap_consistency": 0.0008167610091428893,
+      "support_mode": 0.7801499888300896,
+      "support_stability": 0.21256058973570666,
+      "total": 2.46435983479023,
+      "uncertainty": 0.17734388983808458,
+      "visibility": 0.16707653552293777,
+      "world_model": 4.078198651472728
+    },
+    "val": {
+      "action": 0.023770140690935984,
+      "arm_role": 0.0004891494075612476,
+      "belief": 0.11787863655222787,
+      "clearance": 0.08211326102415721,
+      "corridor": 0.2646504044532776,
+      "disturbance": 0.0077974022262626225,
+      "grasp_affordance": 0.010528300681875812,
+      "occluder_contact": 0.23685429162449306,
+      "persistence": 4.643319712744819,
+      "phase": 0.6877350012461344,
+      "planner_ranking": 0.5576971173286438,
+      "planner_risk": 0.012001174760775434,
+      "planner_success": 0.6474077436659071,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.2473273674647014,
+      "proposal_reconstruction": 0.06659724977281359,
+      "proposal_success": 0.6868854032622443,
+      "reocclusion": 0.6894112494256761,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.7945182191001045,
+      "support_stability": 0.13977908922566307,
+      "total": 1.9791885084576077,
+      "uncertainty": 0.016744557561145887,
+      "visibility": 0.09745695524745518,
+      "world_model": 3.0115205181969538
+    }
+  },
+  {
+    "epoch": 1,
+    "train": {
+      "action": 0.02093995890269677,
+      "arm_role": 0.00021873527142209545,
+      "belief": 0.1156839697311322,
+      "clearance": 0.09139195084571838,
+      "corridor": 0.2529828678816557,
+      "disturbance": 0.003422619032789953,
+      "grasp_affordance": 0.017661277670413256,
+      "occluder_contact": 0.22792026090125242,
+      "persistence": 4.702208956082662,
+      "phase": 0.5312556164960066,
+      "planner_ranking": 0.20636002533137798,
+      "planner_risk": 0.015822513572250802,
+      "planner_success": 0.5910777151584625,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1696062982082367,
+      "proposal_reconstruction": 0.06334876082837582,
+      "proposal_success": 0.6708702544371287,
+      "reocclusion": 0.5039266211291155,
+      "role_swap_consistency": 0.0005020403975019386,
+      "support_mode": 0.3201311229883383,
+      "support_stability": 0.13968352818240723,
+      "total": 1.6841449290513992,
+      "uncertainty": 0.026018289965577424,
+      "visibility": 0.11011519034703572,
+      "world_model": 2.466151461005211
+    },
+    "val": {
+      "action": 0.020535202903880015,
+      "arm_role": 0.00012925987215971368,
+      "belief": 0.10588792545927896,
+      "clearance": 0.08000239895449744,
+      "corridor": 0.23227471278773415,
+      "disturbance": 0.0022439691221936503,
+      "grasp_affordance": 0.011653332453635003,
+      "occluder_contact": 0.21834516359700096,
+      "persistence": 4.46406364440918,
+      "phase": 0.4118766354189979,
+      "planner_ranking": 0.0892416491276688,
+      "planner_risk": 0.0152344209038549,
+      "planner_success": 0.6057713859611087,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.133669826719496,
+      "proposal_reconstruction": 0.06398758581942982,
+      "proposal_success": 0.6783458656734891,
+      "reocclusion": 0.2840655545393626,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.0015922162112676436,
+      "support_stability": 0.13890525698661804,
+      "total": 1.584020005332099,
+      "uncertainty": 0.014379701991048124,
+      "visibility": 0.09630187600851059,
+      "world_model": 2.5434003671010337
+    }
+  },
+  {
+    "epoch": 2,
+    "train": {
+      "action": 0.017165315182258684,
+      "arm_role": 0.00014243966719125942,
+      "belief": 0.1267746559654673,
+      "clearance": 0.09291451362272103,
+      "corridor": 0.2539026445398728,
+      "disturbance": 0.0040997157484525815,
+      "grasp_affordance": 0.016216314087311428,
+      "occluder_contact": 0.2287510900447766,
+      "persistence": 2.7297142073512077,
+      "phase": 0.4553527260820071,
+      "planner_ranking": 0.0675589762783299,
+      "planner_risk": 0.012244323831206808,
+      "planner_success": 0.5227356925606728,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1367994795242946,
+      "proposal_reconstruction": 0.06006583757698536,
+      "proposal_success": 0.6718559389313062,
+      "reocclusion": 0.28394716791808605,
+      "role_swap_consistency": 0.000532965175807476,
+      "support_mode": 0.0007756326898136953,
+      "support_stability": 0.14084124999741712,
+      "total": 1.2956190605958302,
+      "uncertainty": 0.011363255020114593,
+      "visibility": 0.11323032714426517,
+      "world_model": 2.120655362804731
+    },
+    "val": {
+      "action": 0.016470486712124612,
+      "arm_role": 0.00015339441274085807,
+      "belief": 0.15912896229161155,
+      "clearance": 0.07826702462302314,
+      "corridor": 0.21473425957891676,
+      "disturbance": 0.0018082650106710692,
+      "grasp_affordance": 0.008080463701238235,
+      "occluder_contact": 0.22728429403569964,
+      "persistence": 1.846471561325921,
+      "phase": 0.4164143088791106,
+      "planner_ranking": 0.05541756912134588,
+      "planner_risk": 0.011288604181673791,
+      "planner_success": 0.5237696303261651,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1311746835708618,
+      "proposal_reconstruction": 0.06064582823051347,
+      "proposal_success": 0.6669412983788384,
+      "reocclusion": 0.27248211950063705,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.00040661103816496,
+      "support_stability": 0.13817799753612942,
+      "total": 1.241025275654263,
+      "uncertainty": 0.003020187374204397,
+      "visibility": 0.11647009683979882,
+      "world_model": 2.323344442579481
+    }
+  },
+  {
+    "epoch": 3,
+    "train": {
+      "action": 0.015070427674800158,
+      "arm_role": 0.0002641689807205694,
+      "belief": 0.141230215318501,
+      "clearance": 0.07984113336230318,
+      "corridor": 0.225482989102602,
+      "disturbance": 0.0017908170169296984,
+      "grasp_affordance": 0.008550037746317685,
+      "occluder_contact": 0.21477928136785826,
+      "persistence": 1.6129546587665875,
+      "phase": 0.42590194568037987,
+      "planner_ranking": 0.04456973075866699,
+      "planner_risk": 0.010397601523436606,
+      "planner_success": 0.49412518242994946,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1504750202099483,
+      "proposal_reconstruction": 0.058567725432415806,
+      "proposal_success": 0.6462936575214068,
+      "reocclusion": 0.2506879176944494,
+      "role_swap_consistency": 0.000550856914439161,
+      "support_mode": 0.0003065853112881693,
+      "support_stability": 0.1366732595488429,
+      "total": 1.134415107468764,
+      "uncertainty": 0.0035936666245106608,
+      "visibility": 0.10351777387162049,
+      "world_model": 2.024999057253202
+    },
+    "val": {
+      "action": 0.016186242405739095,
+      "arm_role": 0.0002410423346898622,
+      "belief": 0.12203978498776753,
+      "clearance": 0.07702170064051946,
+      "corridor": 0.21113747523890602,
+      "disturbance": 0.0014993647216922706,
+      "grasp_affordance": 0.008119617278377214,
+      "occluder_contact": 0.21474246515168083,
+      "persistence": 1.9725701610247295,
+      "phase": 0.4842751953336928,
+      "planner_ranking": 0.04342265882425838,
+      "planner_risk": 0.01107009764139851,
+      "planner_success": 0.5070097777578566,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1282474862204657,
+      "proposal_reconstruction": 0.05997827731900745,
+      "proposal_success": 0.6469291316138374,
+      "reocclusion": 0.2716698878341251,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.00020467836778455725,
+      "support_stability": 0.13836157073577246,
+      "total": 1.2091523673799303,
+      "uncertainty": 0.0025335378272251952,
+      "visibility": 0.09879730641841888,
+      "world_model": 2.1507359743118286
+    }
+  }
+]

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/summary.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "experiment_name": "proxy_interaction_r3d_stage1_dummy_seed14",
+  "device": "cuda",
+  "best_checkpoint": "/workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed14/checkpoint_best.pt",
+  "final_train_total": 1.134415107468764,
+  "final_val_total": 1.2091523673799303,
+  "train_time_sec": 23.220722675323486,
+  "peak_gpu_memory_mb": 626.4716796875,
+  "num_train_samples": 381,
+  "num_val_samples": 130,
+  "planner_mode": "trainable",
+  "frozen_modules": [],
+  "init_info": null
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/benchmark_full/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "full": {
+    "per_task_success": {
+      "foliage_proxy": 0.4583333333333333,
+      "bag_proxy": 0.625,
+      "cloth_proxy": 0.7083333333333334
+    },
+    "mean_success": 0.5972222222222222,
+    "visibility_integral": 29.697570121950573,
+    "corridor_availability": 0.8675610861844487,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 2.20430763148842,
+    "disturbance_cost": 0.36563710583787823
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/benchmark_full/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## full
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/checkpoint_best.pt
+- mean_success: 0.597
+- visibility_integral: 29.698
+- corridor_availability: 0.868
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 2.204
+- disturbance_cost: 0.366
+- foliage_proxy_success: 0.458
+- bag_proxy_success: 0.625
+- cloth_proxy_success: 0.708

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/benchmark_no_planner/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "full": {
+    "per_task_success": {
+      "foliage_proxy": 0.4583333333333333,
+      "bag_proxy": 0.625,
+      "cloth_proxy": 0.7083333333333334
+    },
+    "mean_success": 0.5972222222222222,
+    "visibility_integral": 29.697570121950573,
+    "corridor_availability": 0.8675610861844487,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 2.20430763148842,
+    "disturbance_cost": 0.36563710583787823
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/benchmark_no_planner/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## full
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/checkpoint_best.pt
+- mean_success: 0.597
+- visibility_integral: 29.698
+- corridor_availability: 0.868
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 2.204
+- disturbance_cost: 0.366
+- foliage_proxy_success: 0.458
+- bag_proxy_success: 0.625
+- cloth_proxy_success: 0.708

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/benchmark_no_role_symmetry/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "full": {
+    "per_task_success": {
+      "foliage_proxy": 0.5,
+      "bag_proxy": 0.625,
+      "cloth_proxy": 0.7083333333333334
+    },
+    "mean_success": 0.6111111111111112,
+    "visibility_integral": 28.954636810554398,
+    "corridor_availability": 0.8660841253068712,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 2.10539705814184,
+    "disturbance_cost": 0.35598844579524463
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/benchmark_no_role_symmetry/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## full
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/checkpoint_best.pt
+- mean_success: 0.611
+- visibility_integral: 28.955
+- corridor_availability: 0.866
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 2.105
+- disturbance_cost: 0.356
+- foliage_proxy_success: 0.500
+- bag_proxy_success: 0.625
+- cloth_proxy_success: 0.708

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/config_resolved.yaml ADDED Viewed

	@@ -0,0 +1,147 @@

+experiment_name: proxy_interaction_r3d_stage1_dummy_seed15
+output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
+device: cuda
+seed: 15
+data:
+  proxies:
+  - foliage_proxy
+  - bag_proxy
+  - cloth_proxy
+  resolution: 96
+  dataset_version: reveal_proxy_v6_rgbd_elastic_state
+  train_episodes_per_proxy: 48
+  val_episodes_per_proxy: 16
+  train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_v6_rgbd_stage1_dummy_seed15.pt
+  val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_v6_rgbd_stage1_dummy_seed15.pt
+  rebuild_dataset: false
+  chunk_horizon: 8
+  rollout_horizon: 5
+  history_steps: 6
+  planner_candidates: 8
+  seed: 15
+optim:
+  epochs: 4
+  batch_size: 16
+  num_workers: 4
+  lr: 0.001
+  weight_decay: 0.0001
+trainer:
+  policy_type: elastic_reveal
+  use_bf16: false
+  grad_clip_norm: 1.0
+  freeze_backbone: true
+  gradient_checkpointing: false
+  plan_during_train: true
+  plan_during_eval: true
+  support_mode_conditioning: true
+  planner_mode: trainable
+  use_depth: false
+  use_world_model: true
+  use_role_tokens: true
+  compute_equivariance_probe: true
+policy:
+  backbone:
+    model_name: openai/clip-vit-base-patch32
+    hidden_dim: 192
+    max_text_tokens: 32
+    freeze_backbone: true
+    gradient_checkpointing: false
+    use_dummy_backbone: true
+  fusion:
+    hidden_dim: 192
+    num_cameras: 3
+    num_layers: 2
+    num_heads: 4
+    ff_dim: 384
+    dropout: 0.1
+    proprio_dim: 32
+    proprio_tokens: 1
+  memory:
+    hidden_dim: 192
+    action_dim: 14
+    history_steps: 6
+    scene_history_steps: 3
+    belief_history_steps: 8
+    num_layers: 2
+    dropout: 0.1
+    memory_bank_size: 4
+    scene_bank_size: 2
+    belief_bank_size: 2
+    num_heads: 4
+    max_history_steps: 8
+  decoder:
+    hidden_dim: 192
+    num_heads: 4
+    num_layers: 2
+    ff_dim: 384
+    dropout: 0.1
+    chunk_size: 8
+    action_dim: 14
+    arm_action_dim: 7
+    num_candidates: 8
+    num_phases: 5
+    num_arm_roles: 4
+    num_proposal_modes: 6
+    planner_top_k: 4
+  reveal_head:
+    hidden_dim: 192
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    belief_map_size: 32
+    field_size: 16
+    num_heads: 4
+    predict_belief_map: true
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+  world_model:
+    hidden_dim: 192
+    action_dim: 14
+    num_support_modes: 3
+    num_approach_templates: 32
+    rollout_horizon: 5
+    field_size: 16
+    num_heads: 4
+    num_phases: 5
+    num_arm_roles: 4
+    num_interaction_tokens: 8
+    belief_map_size: 32
+    predict_belief_map: true
+    scene_bank_size: 2
+    belief_bank_size: 2
+  planner:
+    hidden_dim: 192
+    num_candidates: 8
+    action_dim: 14
+    num_support_modes: 3
+    utility_margin: 0.1
+    num_heads: 4
+    num_layers: 2
+    num_phases: 5
+    num_arm_roles: 4
+    top_k: 4
+loss_weights:
+  action: 1.0
+  phase: 0.15
+  arm_role: 0.2
+  support_mode: 0.15
+  corridor: 0.2
+  persistence: 0.1
+  disturbance: 0.1
+  world_model: 0.25
+  belief: 0.05
+  visibility: 0.05
+  clearance: 0.05
+  support_stability: 0.05
+  reocclusion: 0.05
+  occluder_contact: 0.05
+  grasp_affordance: 0.05
+  planner_success: 0.2
+  planner_risk: 0.1
+  planner_ranking: 0.1
+  proposal_reconstruction: 0.2
+  proposal_success: 0.1
+  proposal_ranking: 0.1
+  proposal_diversity: 0.05
+  role_swap_consistency: 0.05

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/diagnostics_full/proxy_diagnostics.json ADDED Viewed

	@@ -0,0 +1,16 @@

+{
+  "planner_top1_accuracy": 0.3053435114503817,
+  "planner_regret": 0.013406210578978062,
+  "planner_score_utility_spearman": 0.2839694619178772,
+  "risk_calibration_mse": 0.010891024023294449,
+  "role_collapse_rate": 0.0,
+  "proposal_diversity": 0.02313310280442238,
+  "left_right_equivariance_error": 0.006598936667775407,
+  "belief_calibration_brier": 0.00368268764577806,
+  "reocclusion_calibration_brier": 0.2288682460784912,
+  "support_stability_mae": 0.025202222168445587,
+  "clearance_auc": 0.9189163634555108,
+  "memory_write_rate": 0.0,
+  "memory_saturation": 0.8174758553504944,
+  "num_samples": 131
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/metrics.json ADDED Viewed

	@@ -0,0 +1,230 @@

+[
+  {
+    "epoch": 0,
+    "train": {
+      "action": 0.028008008919035394,
+      "arm_role": 0.2316993211661611,
+      "belief": 0.21131388066957393,
+      "clearance": 0.19917472638189793,
+      "corridor": 0.3046618662774563,
+      "disturbance": 0.020259966540227953,
+      "grasp_affordance": 0.15939014249791703,
+      "occluder_contact": 0.3023037730405728,
+      "persistence": 5.1030773023764295,
+      "phase": 0.7391876379648844,
+      "planner_ranking": 0.6672491803765297,
+      "planner_risk": 0.035407664448333286,
+      "planner_success": 0.6247484882672628,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.2685468345880508,
+      "proposal_reconstruction": 0.07012522220611572,
+      "proposal_success": 0.6749546950062116,
+      "reocclusion": 0.6581779879828294,
+      "role_swap_consistency": 0.0007787000698347887,
+      "support_mode": 0.6318444466839234,
+      "support_stability": 0.21354713415106139,
+      "total": 2.377249076962471,
+      "uncertainty": 0.2297215286331872,
+      "visibility": 0.20075704219440618,
+      "world_model": 4.083281387885411
+    },
+    "val": {
+      "action": 0.023762268117732473,
+      "arm_role": 0.00020197388787184737,
+      "belief": 0.1366901993751526,
+      "clearance": 0.10309203879700767,
+      "corridor": 0.26862603922684986,
+      "disturbance": 0.0037259276594138807,
+      "grasp_affordance": 0.044725324544641704,
+      "occluder_contact": 0.2536553243796031,
+      "persistence": 4.777863184611003,
+      "phase": 0.5066013468636407,
+      "planner_ranking": 0.44456031918525696,
+      "planner_risk": 0.01433694911085897,
+      "planner_success": 0.6283807026015388,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1667029857635498,
+      "proposal_reconstruction": 0.0664608735177252,
+      "proposal_success": 0.6838224861356947,
+      "reocclusion": 0.3364369339413113,
+      "role_swap_consistency": 0.0,
+      "support_mode": 0.06715444227059682,
+      "support_stability": 0.14777708219157326,
+      "total": 1.8394301467471652,
+      "uncertainty": 0.07208604945076837,
+      "visibility": 0.12188677820894453,
+      "world_model": 3.079341014226278
+    }
+  },
+  {
+    "epoch": 1,
+    "train": {
+      "action": 0.018888041842728853,
+      "arm_role": 0.00043030476990679745,
+      "belief": 0.11719414374480645,
+      "clearance": 0.08535642797748248,
+      "corridor": 0.24796467771132788,
+      "disturbance": 0.0024048478032151857,
+      "grasp_affordance": 0.022171703943361838,
+      "occluder_contact": 0.22088239962855974,
+      "persistence": 4.555501798788707,
+      "phase": 0.43327916599810123,
+      "planner_ranking": 0.15463371171305576,
+      "planner_risk": 0.01981719226265947,
+      "planner_success": 0.5631782834728559,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1632012923558552,
+      "proposal_reconstruction": 0.0615519261918962,
+      "proposal_success": 0.6722564473748207,
+      "reocclusion": 0.287830734004577,
+      "role_swap_consistency": 0.00048373279059887864,
+      "support_mode": 0.008119381836574272,
+      "support_stability": 0.13662359025329351,
+      "total": 1.567106415828069,
+      "uncertainty": 0.03243653344300886,
+      "visibility": 0.11203592922538519,
+      "world_model": 2.404594744245211
+    },
+    "val": {
+      "action": 0.019907095055613253,
+      "arm_role": 0.00038116834993060265,
+      "belief": 0.1014507081773546,
+      "clearance": 0.07728531956672668,
+      "corridor": 0.22947043677171072,
+      "disturbance": 0.0014698771928023133,
+      "grasp_affordance": 0.02056772096289529,
+      "occluder_contact": 0.20453951425022548,
+      "persistence": 3.6124378045399985,
+      "phase": 0.47070127063327366,
+      "planner_ranking": 0.08099263947870997,
+      "planner_risk": 0.017360565563042957,
+      "planner_success": 0.5593770245711008,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.11685311794281,
+      "proposal_reconstruction": 0.0633203275501728,
+      "proposal_success": 0.683642049630483,
+      "reocclusion": 0.42518342865837944,
+      "role_swap_consistency": 0.0,
+      "support_mode": 8.963614042537908e-05,
+      "support_stability": 0.1495772964424557,
+      "total": 1.5412384668986003,
+      "uncertainty": 0.024036270876725514,
+      "visibility": 0.10443270951509476,
+      "world_model": 2.6981404887305365
+    }
+  },
+  {
+    "epoch": 2,
+    "train": {
+      "action": 0.01506453799083829,
+      "arm_role": 0.0002299571582019174,
+      "belief": 0.10169448765615623,
+      "clearance": 0.08062320730338494,
+      "corridor": 0.23694788571447134,
+      "disturbance": 0.002010827219540564,
+      "grasp_affordance": 0.012944541425288966,
+      "occluder_contact": 0.20663638102511564,
+      "persistence": 2.024513818323612,
+      "phase": 0.4406547602266073,
+      "planner_ranking": 0.052334820929293834,
+      "planner_risk": 0.012688904457415143,
+      "planner_success": 0.4998842130104701,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1411344707012177,
+      "proposal_reconstruction": 0.058503514621406794,
+      "proposal_success": 0.663138655324777,
+      "reocclusion": 0.28770653810352087,
+      "role_swap_consistency": 0.0005917157322983257,
+      "support_mode": 0.00027886544603461516,
+      "support_stability": 0.14369840795795122,
+      "total": 1.2098931844035785,
+      "uncertainty": 0.009047253523021936,
+      "visibility": 0.09652530650297801,
+      "world_model": 2.1335272987683616
+    },
+    "val": {
+      "action": 0.0173407852028807,
+      "arm_role": 0.00028451886545452807,
+      "belief": 0.09623022625843684,
+      "clearance": 0.07612819969654083,
+      "corridor": 0.22281885809368557,
+      "disturbance": 0.001401680282368842,
+      "grasp_affordance": 0.00781761777276794,
+      "occluder_contact": 0.20622349116537306,
+      "persistence": 2.1598196625709534,
+      "phase": 0.47410638795958626,
+      "planner_ranking": 0.0378283916765617,
+      "planner_risk": 0.013348096515983343,
+      "planner_success": 0.4943488637606303,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1125682062572904,
+      "proposal_reconstruction": 0.06057575262255139,
+      "proposal_success": 0.6509590811199613,
+      "reocclusion": 0.2778696550263299,
+      "role_swap_consistency": 0.0,
+      "support_mode": 7.348006571798275e-05,
+      "support_stability": 0.14099042697085273,
+      "total": 1.2928278247515361,
+      "uncertainty": 0.0023198039270937443,
+      "visibility": 0.08993011878596412,
+      "world_model": 2.425517029232449
+    }
+  },
+  {
+    "epoch": 3,
+    "train": {
+      "action": 0.015032132350218793,
+      "arm_role": 0.00015960596041016592,
+      "belief": 0.10330141056329012,
+      "clearance": 0.0756644958940645,
+      "corridor": 0.22099452962478003,
+      "disturbance": 0.0017974149668589234,
+      "grasp_affordance": 0.008848114540645232,
+      "occluder_contact": 0.20204609570403895,
+      "persistence": 1.6058371538917224,
+      "phase": 0.42861080542206764,
+      "planner_ranking": 0.040083787171170115,
+      "planner_risk": 0.010861996522483727,
+      "planner_success": 0.48133989547689754,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1467161824305852,
+      "proposal_reconstruction": 0.058588774874806404,
+      "proposal_success": 0.6429290076096853,
+      "reocclusion": 0.24268781704207262,
+      "role_swap_consistency": 0.00047596763154918637,
+      "support_mode": 2.783346417345456e-05,
+      "support_stability": 0.1325785775358478,
+      "total": 1.1217727214097977,
+      "uncertainty": 0.003058687725570053,
+      "visibility": 0.09524129331111908,
+      "world_model": 2.0093316386143365
+    },
+    "val": {
+      "action": 0.016727436126934156,
+      "arm_role": 0.0002483524456490866,
+      "belief": 0.09281252986854976,
+      "clearance": 0.0730266264743275,
+      "corridor": 0.22520612014664543,
+      "disturbance": 0.0031746443160550874,
+      "grasp_affordance": 0.00780139294349485,
+      "occluder_contact": 0.20420674648549822,
+      "persistence": 1.9897065493795607,
+      "phase": 0.42935120397143894,
+      "planner_ranking": 0.03520135974718465,
+      "planner_risk": 0.012488630910714468,
+      "planner_success": 0.5116605394416385,
+      "proposal_diversity": 0.0,
+      "proposal_ranking": 1.1216257943047419,
+      "proposal_reconstruction": 0.05996803608205584,
+      "proposal_success": 0.6389667987823486,
+      "reocclusion": 0.26481906490193474,
+      "role_swap_consistency": 0.0,
+      "support_mode": 4.154515813247094e-05,
+      "support_stability": 0.13968953986962637,
+      "total": 1.1943119830555387,
+      "uncertainty": 0.0017189466937755544,
+      "visibility": 0.09683923174937566,
+      "world_model": 2.1186628209220038
+    }
+  }
+]

artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/summary.json ADDED Viewed

	@@ -0,0 +1,14 @@

+{
+  "experiment_name": "proxy_interaction_r3d_stage1_dummy_seed15",
+  "device": "cuda",
+  "best_checkpoint": "/workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage1_dummy_seed15/checkpoint_best.pt",
+  "final_train_total": 1.1217727214097977,
+  "final_val_total": 1.1943119830555387,
+  "train_time_sec": 20.030457735061646,
+  "peak_gpu_memory_mb": 631.1953125,
+  "num_train_samples": 380,
+  "num_val_samples": 131,
+  "planner_mode": "trainable",
+  "frozen_modules": [],
+  "init_info": null
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage2_clip_seed11/benchmark_full/reveal_benchmark.json ADDED Viewed

	@@ -0,0 +1,15 @@

+{
+  "full": {
+    "per_task_success": {
+      "foliage_proxy": 0.4166666666666667,
+      "bag_proxy": 0.5833333333333334,
+      "cloth_proxy": 0.625
+    },
+    "mean_success": 0.5416666666666666,
+    "visibility_integral": 34.34427807728449,
+    "corridor_availability": 0.893132723040051,
+    "reocclusion_rate": 0.0,
+    "persistence_horizon_mae": 2.3119179729333856,
+    "disturbance_cost": 0.39262517919350004
+  }
+}

artifacts/outputs/r3d/proxy_interaction_r3d_stage2_clip_seed11/benchmark_full/reveal_benchmark.md ADDED Viewed

	@@ -0,0 +1,13 @@

+# Reveal Proxy Benchmark
+## full
+- checkpoint: /workspace/VLAarchtests/artifacts/outputs/r3d/proxy_interaction_r3d_stage2_clip_seed11/checkpoint_best.pt
+- mean_success: 0.542
+- visibility_integral: 34.344
+- corridor_availability: 0.893
+- reocclusion_rate: 0.000
+- persistence_horizon_mae: 2.312
+- disturbance_cost: 0.393
+- foliage_proxy_success: 0.417
+- bag_proxy_success: 0.583
+- cloth_proxy_success: 0.625