Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes. See raw diff
- artifacts/generated_configs/proxy_interaction_r3d_stage1_clip_seed7.yaml +149 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage1_clip_seed8.yaml +149 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage1_clip_seed9.yaml +149 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage1_dummy_seed13.yaml +147 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage1_dummy_seed14.yaml +147 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage1_dummy_seed15.yaml +147 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage2_clip_seed11.yaml +149 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage2_clip_seed12.yaml +149 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage2_clip_seed13.yaml +149 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage2_dummy_seed21.yaml +148 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage2_dummy_seed22.yaml +148 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage2_dummy_seed23.yaml +148 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage3_clip_rgbd_seed17.yaml +149 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage3_clip_rgbd_seed18.yaml +149 -0
- artifacts/generated_configs/proxy_interaction_r3d_stage3_clip_rgbd_seed19.yaml +149 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_dual_push_buttons/command.txt +1 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_dual_push_buttons/stderr.txt +2 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_dual_push_buttons/stdout.txt +38 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_handover_item/command.txt +1 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_handover_item/stderr.txt +2 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_handover_item/stdout.txt +38 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_handover_item_easy/command.txt +1 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_handover_item_easy/stderr.txt +2 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_handover_item_easy/stdout.txt +38 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_lift_ball/command.txt +1 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_lift_ball/stderr.txt +2 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_lift_ball/stdout.txt +38 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_lift_tray/command.txt +1 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_lift_tray/stderr.txt +2 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_lift_tray/stdout.txt +38 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_pick_laptop/command.txt +1 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_pick_laptop/stderr.txt +6 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_pick_laptop/stdout.txt +38 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_pick_plate/command.txt +1 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_pick_plate/stderr.txt +2 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_pick_plate/stdout.txt +38 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_push_box/command.txt +1 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_push_box/stderr.txt +2 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_push_box/stdout.txt +38 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_put_bottle_in_fridge/command.txt +1 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_put_bottle_in_fridge/stderr.txt +2 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_put_bottle_in_fridge/stdout.txt +39 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_put_item_in_drawer/command.txt +1 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_put_item_in_drawer/stderr.txt +12 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_put_item_in_drawer/stdout.txt +38 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_straighten_rope/command.txt +1 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_straighten_rope/stderr.txt +4 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_straighten_rope/stdout.txt +38 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_sweep_to_dustpan/command.txt +1 -0
- artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_sweep_to_dustpan/stderr.txt +2 -0
artifacts/generated_configs/proxy_interaction_r3d_stage1_clip_seed7.yaml
ADDED
|
@@ -0,0 +1,149 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage1_clip_seed7
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 7
|
| 5 |
+
init_checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt
|
| 6 |
+
init_strict: false
|
| 7 |
+
data:
|
| 8 |
+
proxies:
|
| 9 |
+
- foliage_proxy
|
| 10 |
+
- bag_proxy
|
| 11 |
+
- cloth_proxy
|
| 12 |
+
resolution: 224
|
| 13 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 14 |
+
train_episodes_per_proxy: 48
|
| 15 |
+
val_episodes_per_proxy: 16
|
| 16 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_clip224_v6_rgbd_stage1_seed7.pt
|
| 17 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_clip224_v6_rgbd_stage1_seed7.pt
|
| 18 |
+
rebuild_dataset: false
|
| 19 |
+
chunk_horizon: 8
|
| 20 |
+
rollout_horizon: 5
|
| 21 |
+
history_steps: 6
|
| 22 |
+
planner_candidates: 8
|
| 23 |
+
seed: 7
|
| 24 |
+
optim:
|
| 25 |
+
epochs: 4
|
| 26 |
+
batch_size: 2
|
| 27 |
+
num_workers: 4
|
| 28 |
+
lr: 0.0003
|
| 29 |
+
weight_decay: 0.0001
|
| 30 |
+
trainer:
|
| 31 |
+
policy_type: elastic_reveal
|
| 32 |
+
use_bf16: true
|
| 33 |
+
grad_clip_norm: 1.0
|
| 34 |
+
freeze_backbone: true
|
| 35 |
+
gradient_checkpointing: false
|
| 36 |
+
plan_during_train: true
|
| 37 |
+
plan_during_eval: true
|
| 38 |
+
support_mode_conditioning: true
|
| 39 |
+
planner_mode: trainable
|
| 40 |
+
use_depth: false
|
| 41 |
+
use_world_model: true
|
| 42 |
+
use_role_tokens: true
|
| 43 |
+
compute_equivariance_probe: true
|
| 44 |
+
policy:
|
| 45 |
+
backbone:
|
| 46 |
+
model_name: openai/clip-vit-base-patch32
|
| 47 |
+
hidden_dim: 512
|
| 48 |
+
max_text_tokens: 32
|
| 49 |
+
freeze_backbone: true
|
| 50 |
+
gradient_checkpointing: false
|
| 51 |
+
use_dummy_backbone: false
|
| 52 |
+
fusion:
|
| 53 |
+
hidden_dim: 512
|
| 54 |
+
num_cameras: 3
|
| 55 |
+
num_layers: 4
|
| 56 |
+
num_heads: 8
|
| 57 |
+
ff_dim: 2048
|
| 58 |
+
dropout: 0.1
|
| 59 |
+
proprio_dim: 32
|
| 60 |
+
proprio_tokens: 1
|
| 61 |
+
memory:
|
| 62 |
+
hidden_dim: 512
|
| 63 |
+
action_dim: 14
|
| 64 |
+
history_steps: 6
|
| 65 |
+
scene_history_steps: 3
|
| 66 |
+
belief_history_steps: 8
|
| 67 |
+
num_layers: 2
|
| 68 |
+
dropout: 0.1
|
| 69 |
+
memory_bank_size: 4
|
| 70 |
+
scene_bank_size: 2
|
| 71 |
+
belief_bank_size: 2
|
| 72 |
+
num_heads: 8
|
| 73 |
+
max_history_steps: 8
|
| 74 |
+
decoder:
|
| 75 |
+
hidden_dim: 512
|
| 76 |
+
num_heads: 8
|
| 77 |
+
num_layers: 4
|
| 78 |
+
ff_dim: 2048
|
| 79 |
+
dropout: 0.1
|
| 80 |
+
chunk_size: 8
|
| 81 |
+
action_dim: 14
|
| 82 |
+
arm_action_dim: 7
|
| 83 |
+
num_candidates: 8
|
| 84 |
+
num_phases: 5
|
| 85 |
+
num_arm_roles: 4
|
| 86 |
+
num_proposal_modes: 6
|
| 87 |
+
planner_top_k: 4
|
| 88 |
+
reveal_head:
|
| 89 |
+
hidden_dim: 512
|
| 90 |
+
num_support_modes: 3
|
| 91 |
+
num_approach_templates: 32
|
| 92 |
+
rollout_horizon: 5
|
| 93 |
+
belief_map_size: 32
|
| 94 |
+
field_size: 16
|
| 95 |
+
num_heads: 8
|
| 96 |
+
predict_belief_map: true
|
| 97 |
+
num_phases: 5
|
| 98 |
+
num_arm_roles: 4
|
| 99 |
+
num_interaction_tokens: 8
|
| 100 |
+
world_model:
|
| 101 |
+
hidden_dim: 512
|
| 102 |
+
action_dim: 14
|
| 103 |
+
num_support_modes: 3
|
| 104 |
+
num_approach_templates: 32
|
| 105 |
+
rollout_horizon: 5
|
| 106 |
+
field_size: 16
|
| 107 |
+
num_heads: 8
|
| 108 |
+
num_phases: 5
|
| 109 |
+
num_arm_roles: 4
|
| 110 |
+
num_interaction_tokens: 8
|
| 111 |
+
belief_map_size: 32
|
| 112 |
+
predict_belief_map: true
|
| 113 |
+
scene_bank_size: 2
|
| 114 |
+
belief_bank_size: 2
|
| 115 |
+
planner:
|
| 116 |
+
hidden_dim: 512
|
| 117 |
+
num_candidates: 8
|
| 118 |
+
action_dim: 14
|
| 119 |
+
num_support_modes: 3
|
| 120 |
+
utility_margin: 0.1
|
| 121 |
+
num_heads: 8
|
| 122 |
+
num_layers: 2
|
| 123 |
+
num_phases: 5
|
| 124 |
+
num_arm_roles: 4
|
| 125 |
+
top_k: 4
|
| 126 |
+
loss_weights:
|
| 127 |
+
action: 1.0
|
| 128 |
+
phase: 0.1
|
| 129 |
+
arm_role: 0.15
|
| 130 |
+
support_mode: 0.1
|
| 131 |
+
corridor: 0.15
|
| 132 |
+
persistence: 0.05
|
| 133 |
+
disturbance: 0.05
|
| 134 |
+
world_model: 0.2
|
| 135 |
+
belief: 0.05
|
| 136 |
+
visibility: 0.05
|
| 137 |
+
clearance: 0.05
|
| 138 |
+
support_stability: 0.05
|
| 139 |
+
reocclusion: 0.05
|
| 140 |
+
occluder_contact: 0.05
|
| 141 |
+
grasp_affordance: 0.05
|
| 142 |
+
planner_success: 0.25
|
| 143 |
+
planner_risk: 0.1
|
| 144 |
+
planner_ranking: 0.2
|
| 145 |
+
proposal_reconstruction: 0.1
|
| 146 |
+
proposal_success: 0.15
|
| 147 |
+
proposal_ranking: 0.2
|
| 148 |
+
proposal_diversity: 0.05
|
| 149 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage1_clip_seed8.yaml
ADDED
|
@@ -0,0 +1,149 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage1_clip_seed8
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 8
|
| 5 |
+
init_checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt
|
| 6 |
+
init_strict: false
|
| 7 |
+
data:
|
| 8 |
+
proxies:
|
| 9 |
+
- foliage_proxy
|
| 10 |
+
- bag_proxy
|
| 11 |
+
- cloth_proxy
|
| 12 |
+
resolution: 224
|
| 13 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 14 |
+
train_episodes_per_proxy: 48
|
| 15 |
+
val_episodes_per_proxy: 16
|
| 16 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_clip224_v6_rgbd_stage1_seed8.pt
|
| 17 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_clip224_v6_rgbd_stage1_seed8.pt
|
| 18 |
+
rebuild_dataset: false
|
| 19 |
+
chunk_horizon: 8
|
| 20 |
+
rollout_horizon: 5
|
| 21 |
+
history_steps: 6
|
| 22 |
+
planner_candidates: 8
|
| 23 |
+
seed: 8
|
| 24 |
+
optim:
|
| 25 |
+
epochs: 4
|
| 26 |
+
batch_size: 2
|
| 27 |
+
num_workers: 4
|
| 28 |
+
lr: 0.0003
|
| 29 |
+
weight_decay: 0.0001
|
| 30 |
+
trainer:
|
| 31 |
+
policy_type: elastic_reveal
|
| 32 |
+
use_bf16: true
|
| 33 |
+
grad_clip_norm: 1.0
|
| 34 |
+
freeze_backbone: true
|
| 35 |
+
gradient_checkpointing: false
|
| 36 |
+
plan_during_train: true
|
| 37 |
+
plan_during_eval: true
|
| 38 |
+
support_mode_conditioning: true
|
| 39 |
+
planner_mode: trainable
|
| 40 |
+
use_depth: false
|
| 41 |
+
use_world_model: true
|
| 42 |
+
use_role_tokens: true
|
| 43 |
+
compute_equivariance_probe: true
|
| 44 |
+
policy:
|
| 45 |
+
backbone:
|
| 46 |
+
model_name: openai/clip-vit-base-patch32
|
| 47 |
+
hidden_dim: 512
|
| 48 |
+
max_text_tokens: 32
|
| 49 |
+
freeze_backbone: true
|
| 50 |
+
gradient_checkpointing: false
|
| 51 |
+
use_dummy_backbone: false
|
| 52 |
+
fusion:
|
| 53 |
+
hidden_dim: 512
|
| 54 |
+
num_cameras: 3
|
| 55 |
+
num_layers: 4
|
| 56 |
+
num_heads: 8
|
| 57 |
+
ff_dim: 2048
|
| 58 |
+
dropout: 0.1
|
| 59 |
+
proprio_dim: 32
|
| 60 |
+
proprio_tokens: 1
|
| 61 |
+
memory:
|
| 62 |
+
hidden_dim: 512
|
| 63 |
+
action_dim: 14
|
| 64 |
+
history_steps: 6
|
| 65 |
+
scene_history_steps: 3
|
| 66 |
+
belief_history_steps: 8
|
| 67 |
+
num_layers: 2
|
| 68 |
+
dropout: 0.1
|
| 69 |
+
memory_bank_size: 4
|
| 70 |
+
scene_bank_size: 2
|
| 71 |
+
belief_bank_size: 2
|
| 72 |
+
num_heads: 8
|
| 73 |
+
max_history_steps: 8
|
| 74 |
+
decoder:
|
| 75 |
+
hidden_dim: 512
|
| 76 |
+
num_heads: 8
|
| 77 |
+
num_layers: 4
|
| 78 |
+
ff_dim: 2048
|
| 79 |
+
dropout: 0.1
|
| 80 |
+
chunk_size: 8
|
| 81 |
+
action_dim: 14
|
| 82 |
+
arm_action_dim: 7
|
| 83 |
+
num_candidates: 8
|
| 84 |
+
num_phases: 5
|
| 85 |
+
num_arm_roles: 4
|
| 86 |
+
num_proposal_modes: 6
|
| 87 |
+
planner_top_k: 4
|
| 88 |
+
reveal_head:
|
| 89 |
+
hidden_dim: 512
|
| 90 |
+
num_support_modes: 3
|
| 91 |
+
num_approach_templates: 32
|
| 92 |
+
rollout_horizon: 5
|
| 93 |
+
belief_map_size: 32
|
| 94 |
+
field_size: 16
|
| 95 |
+
num_heads: 8
|
| 96 |
+
predict_belief_map: true
|
| 97 |
+
num_phases: 5
|
| 98 |
+
num_arm_roles: 4
|
| 99 |
+
num_interaction_tokens: 8
|
| 100 |
+
world_model:
|
| 101 |
+
hidden_dim: 512
|
| 102 |
+
action_dim: 14
|
| 103 |
+
num_support_modes: 3
|
| 104 |
+
num_approach_templates: 32
|
| 105 |
+
rollout_horizon: 5
|
| 106 |
+
field_size: 16
|
| 107 |
+
num_heads: 8
|
| 108 |
+
num_phases: 5
|
| 109 |
+
num_arm_roles: 4
|
| 110 |
+
num_interaction_tokens: 8
|
| 111 |
+
belief_map_size: 32
|
| 112 |
+
predict_belief_map: true
|
| 113 |
+
scene_bank_size: 2
|
| 114 |
+
belief_bank_size: 2
|
| 115 |
+
planner:
|
| 116 |
+
hidden_dim: 512
|
| 117 |
+
num_candidates: 8
|
| 118 |
+
action_dim: 14
|
| 119 |
+
num_support_modes: 3
|
| 120 |
+
utility_margin: 0.1
|
| 121 |
+
num_heads: 8
|
| 122 |
+
num_layers: 2
|
| 123 |
+
num_phases: 5
|
| 124 |
+
num_arm_roles: 4
|
| 125 |
+
top_k: 4
|
| 126 |
+
loss_weights:
|
| 127 |
+
action: 1.0
|
| 128 |
+
phase: 0.1
|
| 129 |
+
arm_role: 0.15
|
| 130 |
+
support_mode: 0.1
|
| 131 |
+
corridor: 0.15
|
| 132 |
+
persistence: 0.05
|
| 133 |
+
disturbance: 0.05
|
| 134 |
+
world_model: 0.2
|
| 135 |
+
belief: 0.05
|
| 136 |
+
visibility: 0.05
|
| 137 |
+
clearance: 0.05
|
| 138 |
+
support_stability: 0.05
|
| 139 |
+
reocclusion: 0.05
|
| 140 |
+
occluder_contact: 0.05
|
| 141 |
+
grasp_affordance: 0.05
|
| 142 |
+
planner_success: 0.25
|
| 143 |
+
planner_risk: 0.1
|
| 144 |
+
planner_ranking: 0.2
|
| 145 |
+
proposal_reconstruction: 0.1
|
| 146 |
+
proposal_success: 0.15
|
| 147 |
+
proposal_ranking: 0.2
|
| 148 |
+
proposal_diversity: 0.05
|
| 149 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage1_clip_seed9.yaml
ADDED
|
@@ -0,0 +1,149 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage1_clip_seed9
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 9
|
| 5 |
+
init_checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt
|
| 6 |
+
init_strict: false
|
| 7 |
+
data:
|
| 8 |
+
proxies:
|
| 9 |
+
- foliage_proxy
|
| 10 |
+
- bag_proxy
|
| 11 |
+
- cloth_proxy
|
| 12 |
+
resolution: 224
|
| 13 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 14 |
+
train_episodes_per_proxy: 48
|
| 15 |
+
val_episodes_per_proxy: 16
|
| 16 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_clip224_v6_rgbd_stage1_seed9.pt
|
| 17 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_clip224_v6_rgbd_stage1_seed9.pt
|
| 18 |
+
rebuild_dataset: false
|
| 19 |
+
chunk_horizon: 8
|
| 20 |
+
rollout_horizon: 5
|
| 21 |
+
history_steps: 6
|
| 22 |
+
planner_candidates: 8
|
| 23 |
+
seed: 9
|
| 24 |
+
optim:
|
| 25 |
+
epochs: 4
|
| 26 |
+
batch_size: 2
|
| 27 |
+
num_workers: 4
|
| 28 |
+
lr: 0.0003
|
| 29 |
+
weight_decay: 0.0001
|
| 30 |
+
trainer:
|
| 31 |
+
policy_type: elastic_reveal
|
| 32 |
+
use_bf16: true
|
| 33 |
+
grad_clip_norm: 1.0
|
| 34 |
+
freeze_backbone: true
|
| 35 |
+
gradient_checkpointing: false
|
| 36 |
+
plan_during_train: true
|
| 37 |
+
plan_during_eval: true
|
| 38 |
+
support_mode_conditioning: true
|
| 39 |
+
planner_mode: trainable
|
| 40 |
+
use_depth: false
|
| 41 |
+
use_world_model: true
|
| 42 |
+
use_role_tokens: true
|
| 43 |
+
compute_equivariance_probe: true
|
| 44 |
+
policy:
|
| 45 |
+
backbone:
|
| 46 |
+
model_name: openai/clip-vit-base-patch32
|
| 47 |
+
hidden_dim: 512
|
| 48 |
+
max_text_tokens: 32
|
| 49 |
+
freeze_backbone: true
|
| 50 |
+
gradient_checkpointing: false
|
| 51 |
+
use_dummy_backbone: false
|
| 52 |
+
fusion:
|
| 53 |
+
hidden_dim: 512
|
| 54 |
+
num_cameras: 3
|
| 55 |
+
num_layers: 4
|
| 56 |
+
num_heads: 8
|
| 57 |
+
ff_dim: 2048
|
| 58 |
+
dropout: 0.1
|
| 59 |
+
proprio_dim: 32
|
| 60 |
+
proprio_tokens: 1
|
| 61 |
+
memory:
|
| 62 |
+
hidden_dim: 512
|
| 63 |
+
action_dim: 14
|
| 64 |
+
history_steps: 6
|
| 65 |
+
scene_history_steps: 3
|
| 66 |
+
belief_history_steps: 8
|
| 67 |
+
num_layers: 2
|
| 68 |
+
dropout: 0.1
|
| 69 |
+
memory_bank_size: 4
|
| 70 |
+
scene_bank_size: 2
|
| 71 |
+
belief_bank_size: 2
|
| 72 |
+
num_heads: 8
|
| 73 |
+
max_history_steps: 8
|
| 74 |
+
decoder:
|
| 75 |
+
hidden_dim: 512
|
| 76 |
+
num_heads: 8
|
| 77 |
+
num_layers: 4
|
| 78 |
+
ff_dim: 2048
|
| 79 |
+
dropout: 0.1
|
| 80 |
+
chunk_size: 8
|
| 81 |
+
action_dim: 14
|
| 82 |
+
arm_action_dim: 7
|
| 83 |
+
num_candidates: 8
|
| 84 |
+
num_phases: 5
|
| 85 |
+
num_arm_roles: 4
|
| 86 |
+
num_proposal_modes: 6
|
| 87 |
+
planner_top_k: 4
|
| 88 |
+
reveal_head:
|
| 89 |
+
hidden_dim: 512
|
| 90 |
+
num_support_modes: 3
|
| 91 |
+
num_approach_templates: 32
|
| 92 |
+
rollout_horizon: 5
|
| 93 |
+
belief_map_size: 32
|
| 94 |
+
field_size: 16
|
| 95 |
+
num_heads: 8
|
| 96 |
+
predict_belief_map: true
|
| 97 |
+
num_phases: 5
|
| 98 |
+
num_arm_roles: 4
|
| 99 |
+
num_interaction_tokens: 8
|
| 100 |
+
world_model:
|
| 101 |
+
hidden_dim: 512
|
| 102 |
+
action_dim: 14
|
| 103 |
+
num_support_modes: 3
|
| 104 |
+
num_approach_templates: 32
|
| 105 |
+
rollout_horizon: 5
|
| 106 |
+
field_size: 16
|
| 107 |
+
num_heads: 8
|
| 108 |
+
num_phases: 5
|
| 109 |
+
num_arm_roles: 4
|
| 110 |
+
num_interaction_tokens: 8
|
| 111 |
+
belief_map_size: 32
|
| 112 |
+
predict_belief_map: true
|
| 113 |
+
scene_bank_size: 2
|
| 114 |
+
belief_bank_size: 2
|
| 115 |
+
planner:
|
| 116 |
+
hidden_dim: 512
|
| 117 |
+
num_candidates: 8
|
| 118 |
+
action_dim: 14
|
| 119 |
+
num_support_modes: 3
|
| 120 |
+
utility_margin: 0.1
|
| 121 |
+
num_heads: 8
|
| 122 |
+
num_layers: 2
|
| 123 |
+
num_phases: 5
|
| 124 |
+
num_arm_roles: 4
|
| 125 |
+
top_k: 4
|
| 126 |
+
loss_weights:
|
| 127 |
+
action: 1.0
|
| 128 |
+
phase: 0.1
|
| 129 |
+
arm_role: 0.15
|
| 130 |
+
support_mode: 0.1
|
| 131 |
+
corridor: 0.15
|
| 132 |
+
persistence: 0.05
|
| 133 |
+
disturbance: 0.05
|
| 134 |
+
world_model: 0.2
|
| 135 |
+
belief: 0.05
|
| 136 |
+
visibility: 0.05
|
| 137 |
+
clearance: 0.05
|
| 138 |
+
support_stability: 0.05
|
| 139 |
+
reocclusion: 0.05
|
| 140 |
+
occluder_contact: 0.05
|
| 141 |
+
grasp_affordance: 0.05
|
| 142 |
+
planner_success: 0.25
|
| 143 |
+
planner_risk: 0.1
|
| 144 |
+
planner_ranking: 0.2
|
| 145 |
+
proposal_reconstruction: 0.1
|
| 146 |
+
proposal_success: 0.15
|
| 147 |
+
proposal_ranking: 0.2
|
| 148 |
+
proposal_diversity: 0.05
|
| 149 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage1_dummy_seed13.yaml
ADDED
|
@@ -0,0 +1,147 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage1_dummy_seed13
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 13
|
| 5 |
+
data:
|
| 6 |
+
proxies:
|
| 7 |
+
- foliage_proxy
|
| 8 |
+
- bag_proxy
|
| 9 |
+
- cloth_proxy
|
| 10 |
+
resolution: 96
|
| 11 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 12 |
+
train_episodes_per_proxy: 48
|
| 13 |
+
val_episodes_per_proxy: 16
|
| 14 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_v6_rgbd_stage1_dummy_seed13.pt
|
| 15 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_v6_rgbd_stage1_dummy_seed13.pt
|
| 16 |
+
rebuild_dataset: false
|
| 17 |
+
chunk_horizon: 8
|
| 18 |
+
rollout_horizon: 5
|
| 19 |
+
history_steps: 6
|
| 20 |
+
planner_candidates: 8
|
| 21 |
+
seed: 13
|
| 22 |
+
optim:
|
| 23 |
+
epochs: 4
|
| 24 |
+
batch_size: 16
|
| 25 |
+
num_workers: 4
|
| 26 |
+
lr: 0.001
|
| 27 |
+
weight_decay: 0.0001
|
| 28 |
+
trainer:
|
| 29 |
+
policy_type: elastic_reveal
|
| 30 |
+
use_bf16: false
|
| 31 |
+
grad_clip_norm: 1.0
|
| 32 |
+
freeze_backbone: true
|
| 33 |
+
gradient_checkpointing: false
|
| 34 |
+
plan_during_train: true
|
| 35 |
+
plan_during_eval: true
|
| 36 |
+
support_mode_conditioning: true
|
| 37 |
+
planner_mode: trainable
|
| 38 |
+
use_depth: false
|
| 39 |
+
use_world_model: true
|
| 40 |
+
use_role_tokens: true
|
| 41 |
+
compute_equivariance_probe: true
|
| 42 |
+
policy:
|
| 43 |
+
backbone:
|
| 44 |
+
model_name: openai/clip-vit-base-patch32
|
| 45 |
+
hidden_dim: 192
|
| 46 |
+
max_text_tokens: 32
|
| 47 |
+
freeze_backbone: true
|
| 48 |
+
gradient_checkpointing: false
|
| 49 |
+
use_dummy_backbone: true
|
| 50 |
+
fusion:
|
| 51 |
+
hidden_dim: 192
|
| 52 |
+
num_cameras: 3
|
| 53 |
+
num_layers: 2
|
| 54 |
+
num_heads: 4
|
| 55 |
+
ff_dim: 384
|
| 56 |
+
dropout: 0.1
|
| 57 |
+
proprio_dim: 32
|
| 58 |
+
proprio_tokens: 1
|
| 59 |
+
memory:
|
| 60 |
+
hidden_dim: 192
|
| 61 |
+
action_dim: 14
|
| 62 |
+
history_steps: 6
|
| 63 |
+
scene_history_steps: 3
|
| 64 |
+
belief_history_steps: 8
|
| 65 |
+
num_layers: 2
|
| 66 |
+
dropout: 0.1
|
| 67 |
+
memory_bank_size: 4
|
| 68 |
+
scene_bank_size: 2
|
| 69 |
+
belief_bank_size: 2
|
| 70 |
+
num_heads: 4
|
| 71 |
+
max_history_steps: 8
|
| 72 |
+
decoder:
|
| 73 |
+
hidden_dim: 192
|
| 74 |
+
num_heads: 4
|
| 75 |
+
num_layers: 2
|
| 76 |
+
ff_dim: 384
|
| 77 |
+
dropout: 0.1
|
| 78 |
+
chunk_size: 8
|
| 79 |
+
action_dim: 14
|
| 80 |
+
arm_action_dim: 7
|
| 81 |
+
num_candidates: 8
|
| 82 |
+
num_phases: 5
|
| 83 |
+
num_arm_roles: 4
|
| 84 |
+
num_proposal_modes: 6
|
| 85 |
+
planner_top_k: 4
|
| 86 |
+
reveal_head:
|
| 87 |
+
hidden_dim: 192
|
| 88 |
+
num_support_modes: 3
|
| 89 |
+
num_approach_templates: 32
|
| 90 |
+
rollout_horizon: 5
|
| 91 |
+
belief_map_size: 32
|
| 92 |
+
field_size: 16
|
| 93 |
+
num_heads: 4
|
| 94 |
+
predict_belief_map: true
|
| 95 |
+
num_phases: 5
|
| 96 |
+
num_arm_roles: 4
|
| 97 |
+
num_interaction_tokens: 8
|
| 98 |
+
world_model:
|
| 99 |
+
hidden_dim: 192
|
| 100 |
+
action_dim: 14
|
| 101 |
+
num_support_modes: 3
|
| 102 |
+
num_approach_templates: 32
|
| 103 |
+
rollout_horizon: 5
|
| 104 |
+
field_size: 16
|
| 105 |
+
num_heads: 4
|
| 106 |
+
num_phases: 5
|
| 107 |
+
num_arm_roles: 4
|
| 108 |
+
num_interaction_tokens: 8
|
| 109 |
+
belief_map_size: 32
|
| 110 |
+
predict_belief_map: true
|
| 111 |
+
scene_bank_size: 2
|
| 112 |
+
belief_bank_size: 2
|
| 113 |
+
planner:
|
| 114 |
+
hidden_dim: 192
|
| 115 |
+
num_candidates: 8
|
| 116 |
+
action_dim: 14
|
| 117 |
+
num_support_modes: 3
|
| 118 |
+
utility_margin: 0.1
|
| 119 |
+
num_heads: 4
|
| 120 |
+
num_layers: 2
|
| 121 |
+
num_phases: 5
|
| 122 |
+
num_arm_roles: 4
|
| 123 |
+
top_k: 4
|
| 124 |
+
loss_weights:
|
| 125 |
+
action: 1.0
|
| 126 |
+
phase: 0.15
|
| 127 |
+
arm_role: 0.2
|
| 128 |
+
support_mode: 0.15
|
| 129 |
+
corridor: 0.2
|
| 130 |
+
persistence: 0.1
|
| 131 |
+
disturbance: 0.1
|
| 132 |
+
world_model: 0.25
|
| 133 |
+
belief: 0.05
|
| 134 |
+
visibility: 0.05
|
| 135 |
+
clearance: 0.05
|
| 136 |
+
support_stability: 0.05
|
| 137 |
+
reocclusion: 0.05
|
| 138 |
+
occluder_contact: 0.05
|
| 139 |
+
grasp_affordance: 0.05
|
| 140 |
+
planner_success: 0.2
|
| 141 |
+
planner_risk: 0.1
|
| 142 |
+
planner_ranking: 0.1
|
| 143 |
+
proposal_reconstruction: 0.2
|
| 144 |
+
proposal_success: 0.1
|
| 145 |
+
proposal_ranking: 0.1
|
| 146 |
+
proposal_diversity: 0.05
|
| 147 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage1_dummy_seed14.yaml
ADDED
|
@@ -0,0 +1,147 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage1_dummy_seed14
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 14
|
| 5 |
+
data:
|
| 6 |
+
proxies:
|
| 7 |
+
- foliage_proxy
|
| 8 |
+
- bag_proxy
|
| 9 |
+
- cloth_proxy
|
| 10 |
+
resolution: 96
|
| 11 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 12 |
+
train_episodes_per_proxy: 48
|
| 13 |
+
val_episodes_per_proxy: 16
|
| 14 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_v6_rgbd_stage1_dummy_seed14.pt
|
| 15 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_v6_rgbd_stage1_dummy_seed14.pt
|
| 16 |
+
rebuild_dataset: false
|
| 17 |
+
chunk_horizon: 8
|
| 18 |
+
rollout_horizon: 5
|
| 19 |
+
history_steps: 6
|
| 20 |
+
planner_candidates: 8
|
| 21 |
+
seed: 14
|
| 22 |
+
optim:
|
| 23 |
+
epochs: 4
|
| 24 |
+
batch_size: 16
|
| 25 |
+
num_workers: 4
|
| 26 |
+
lr: 0.001
|
| 27 |
+
weight_decay: 0.0001
|
| 28 |
+
trainer:
|
| 29 |
+
policy_type: elastic_reveal
|
| 30 |
+
use_bf16: false
|
| 31 |
+
grad_clip_norm: 1.0
|
| 32 |
+
freeze_backbone: true
|
| 33 |
+
gradient_checkpointing: false
|
| 34 |
+
plan_during_train: true
|
| 35 |
+
plan_during_eval: true
|
| 36 |
+
support_mode_conditioning: true
|
| 37 |
+
planner_mode: trainable
|
| 38 |
+
use_depth: false
|
| 39 |
+
use_world_model: true
|
| 40 |
+
use_role_tokens: true
|
| 41 |
+
compute_equivariance_probe: true
|
| 42 |
+
policy:
|
| 43 |
+
backbone:
|
| 44 |
+
model_name: openai/clip-vit-base-patch32
|
| 45 |
+
hidden_dim: 192
|
| 46 |
+
max_text_tokens: 32
|
| 47 |
+
freeze_backbone: true
|
| 48 |
+
gradient_checkpointing: false
|
| 49 |
+
use_dummy_backbone: true
|
| 50 |
+
fusion:
|
| 51 |
+
hidden_dim: 192
|
| 52 |
+
num_cameras: 3
|
| 53 |
+
num_layers: 2
|
| 54 |
+
num_heads: 4
|
| 55 |
+
ff_dim: 384
|
| 56 |
+
dropout: 0.1
|
| 57 |
+
proprio_dim: 32
|
| 58 |
+
proprio_tokens: 1
|
| 59 |
+
memory:
|
| 60 |
+
hidden_dim: 192
|
| 61 |
+
action_dim: 14
|
| 62 |
+
history_steps: 6
|
| 63 |
+
scene_history_steps: 3
|
| 64 |
+
belief_history_steps: 8
|
| 65 |
+
num_layers: 2
|
| 66 |
+
dropout: 0.1
|
| 67 |
+
memory_bank_size: 4
|
| 68 |
+
scene_bank_size: 2
|
| 69 |
+
belief_bank_size: 2
|
| 70 |
+
num_heads: 4
|
| 71 |
+
max_history_steps: 8
|
| 72 |
+
decoder:
|
| 73 |
+
hidden_dim: 192
|
| 74 |
+
num_heads: 4
|
| 75 |
+
num_layers: 2
|
| 76 |
+
ff_dim: 384
|
| 77 |
+
dropout: 0.1
|
| 78 |
+
chunk_size: 8
|
| 79 |
+
action_dim: 14
|
| 80 |
+
arm_action_dim: 7
|
| 81 |
+
num_candidates: 8
|
| 82 |
+
num_phases: 5
|
| 83 |
+
num_arm_roles: 4
|
| 84 |
+
num_proposal_modes: 6
|
| 85 |
+
planner_top_k: 4
|
| 86 |
+
reveal_head:
|
| 87 |
+
hidden_dim: 192
|
| 88 |
+
num_support_modes: 3
|
| 89 |
+
num_approach_templates: 32
|
| 90 |
+
rollout_horizon: 5
|
| 91 |
+
belief_map_size: 32
|
| 92 |
+
field_size: 16
|
| 93 |
+
num_heads: 4
|
| 94 |
+
predict_belief_map: true
|
| 95 |
+
num_phases: 5
|
| 96 |
+
num_arm_roles: 4
|
| 97 |
+
num_interaction_tokens: 8
|
| 98 |
+
world_model:
|
| 99 |
+
hidden_dim: 192
|
| 100 |
+
action_dim: 14
|
| 101 |
+
num_support_modes: 3
|
| 102 |
+
num_approach_templates: 32
|
| 103 |
+
rollout_horizon: 5
|
| 104 |
+
field_size: 16
|
| 105 |
+
num_heads: 4
|
| 106 |
+
num_phases: 5
|
| 107 |
+
num_arm_roles: 4
|
| 108 |
+
num_interaction_tokens: 8
|
| 109 |
+
belief_map_size: 32
|
| 110 |
+
predict_belief_map: true
|
| 111 |
+
scene_bank_size: 2
|
| 112 |
+
belief_bank_size: 2
|
| 113 |
+
planner:
|
| 114 |
+
hidden_dim: 192
|
| 115 |
+
num_candidates: 8
|
| 116 |
+
action_dim: 14
|
| 117 |
+
num_support_modes: 3
|
| 118 |
+
utility_margin: 0.1
|
| 119 |
+
num_heads: 4
|
| 120 |
+
num_layers: 2
|
| 121 |
+
num_phases: 5
|
| 122 |
+
num_arm_roles: 4
|
| 123 |
+
top_k: 4
|
| 124 |
+
loss_weights:
|
| 125 |
+
action: 1.0
|
| 126 |
+
phase: 0.15
|
| 127 |
+
arm_role: 0.2
|
| 128 |
+
support_mode: 0.15
|
| 129 |
+
corridor: 0.2
|
| 130 |
+
persistence: 0.1
|
| 131 |
+
disturbance: 0.1
|
| 132 |
+
world_model: 0.25
|
| 133 |
+
belief: 0.05
|
| 134 |
+
visibility: 0.05
|
| 135 |
+
clearance: 0.05
|
| 136 |
+
support_stability: 0.05
|
| 137 |
+
reocclusion: 0.05
|
| 138 |
+
occluder_contact: 0.05
|
| 139 |
+
grasp_affordance: 0.05
|
| 140 |
+
planner_success: 0.2
|
| 141 |
+
planner_risk: 0.1
|
| 142 |
+
planner_ranking: 0.1
|
| 143 |
+
proposal_reconstruction: 0.2
|
| 144 |
+
proposal_success: 0.1
|
| 145 |
+
proposal_ranking: 0.1
|
| 146 |
+
proposal_diversity: 0.05
|
| 147 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage1_dummy_seed15.yaml
ADDED
|
@@ -0,0 +1,147 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage1_dummy_seed15
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 15
|
| 5 |
+
data:
|
| 6 |
+
proxies:
|
| 7 |
+
- foliage_proxy
|
| 8 |
+
- bag_proxy
|
| 9 |
+
- cloth_proxy
|
| 10 |
+
resolution: 96
|
| 11 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 12 |
+
train_episodes_per_proxy: 48
|
| 13 |
+
val_episodes_per_proxy: 16
|
| 14 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_v6_rgbd_stage1_dummy_seed15.pt
|
| 15 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_v6_rgbd_stage1_dummy_seed15.pt
|
| 16 |
+
rebuild_dataset: false
|
| 17 |
+
chunk_horizon: 8
|
| 18 |
+
rollout_horizon: 5
|
| 19 |
+
history_steps: 6
|
| 20 |
+
planner_candidates: 8
|
| 21 |
+
seed: 15
|
| 22 |
+
optim:
|
| 23 |
+
epochs: 4
|
| 24 |
+
batch_size: 16
|
| 25 |
+
num_workers: 4
|
| 26 |
+
lr: 0.001
|
| 27 |
+
weight_decay: 0.0001
|
| 28 |
+
trainer:
|
| 29 |
+
policy_type: elastic_reveal
|
| 30 |
+
use_bf16: false
|
| 31 |
+
grad_clip_norm: 1.0
|
| 32 |
+
freeze_backbone: true
|
| 33 |
+
gradient_checkpointing: false
|
| 34 |
+
plan_during_train: true
|
| 35 |
+
plan_during_eval: true
|
| 36 |
+
support_mode_conditioning: true
|
| 37 |
+
planner_mode: trainable
|
| 38 |
+
use_depth: false
|
| 39 |
+
use_world_model: true
|
| 40 |
+
use_role_tokens: true
|
| 41 |
+
compute_equivariance_probe: true
|
| 42 |
+
policy:
|
| 43 |
+
backbone:
|
| 44 |
+
model_name: openai/clip-vit-base-patch32
|
| 45 |
+
hidden_dim: 192
|
| 46 |
+
max_text_tokens: 32
|
| 47 |
+
freeze_backbone: true
|
| 48 |
+
gradient_checkpointing: false
|
| 49 |
+
use_dummy_backbone: true
|
| 50 |
+
fusion:
|
| 51 |
+
hidden_dim: 192
|
| 52 |
+
num_cameras: 3
|
| 53 |
+
num_layers: 2
|
| 54 |
+
num_heads: 4
|
| 55 |
+
ff_dim: 384
|
| 56 |
+
dropout: 0.1
|
| 57 |
+
proprio_dim: 32
|
| 58 |
+
proprio_tokens: 1
|
| 59 |
+
memory:
|
| 60 |
+
hidden_dim: 192
|
| 61 |
+
action_dim: 14
|
| 62 |
+
history_steps: 6
|
| 63 |
+
scene_history_steps: 3
|
| 64 |
+
belief_history_steps: 8
|
| 65 |
+
num_layers: 2
|
| 66 |
+
dropout: 0.1
|
| 67 |
+
memory_bank_size: 4
|
| 68 |
+
scene_bank_size: 2
|
| 69 |
+
belief_bank_size: 2
|
| 70 |
+
num_heads: 4
|
| 71 |
+
max_history_steps: 8
|
| 72 |
+
decoder:
|
| 73 |
+
hidden_dim: 192
|
| 74 |
+
num_heads: 4
|
| 75 |
+
num_layers: 2
|
| 76 |
+
ff_dim: 384
|
| 77 |
+
dropout: 0.1
|
| 78 |
+
chunk_size: 8
|
| 79 |
+
action_dim: 14
|
| 80 |
+
arm_action_dim: 7
|
| 81 |
+
num_candidates: 8
|
| 82 |
+
num_phases: 5
|
| 83 |
+
num_arm_roles: 4
|
| 84 |
+
num_proposal_modes: 6
|
| 85 |
+
planner_top_k: 4
|
| 86 |
+
reveal_head:
|
| 87 |
+
hidden_dim: 192
|
| 88 |
+
num_support_modes: 3
|
| 89 |
+
num_approach_templates: 32
|
| 90 |
+
rollout_horizon: 5
|
| 91 |
+
belief_map_size: 32
|
| 92 |
+
field_size: 16
|
| 93 |
+
num_heads: 4
|
| 94 |
+
predict_belief_map: true
|
| 95 |
+
num_phases: 5
|
| 96 |
+
num_arm_roles: 4
|
| 97 |
+
num_interaction_tokens: 8
|
| 98 |
+
world_model:
|
| 99 |
+
hidden_dim: 192
|
| 100 |
+
action_dim: 14
|
| 101 |
+
num_support_modes: 3
|
| 102 |
+
num_approach_templates: 32
|
| 103 |
+
rollout_horizon: 5
|
| 104 |
+
field_size: 16
|
| 105 |
+
num_heads: 4
|
| 106 |
+
num_phases: 5
|
| 107 |
+
num_arm_roles: 4
|
| 108 |
+
num_interaction_tokens: 8
|
| 109 |
+
belief_map_size: 32
|
| 110 |
+
predict_belief_map: true
|
| 111 |
+
scene_bank_size: 2
|
| 112 |
+
belief_bank_size: 2
|
| 113 |
+
planner:
|
| 114 |
+
hidden_dim: 192
|
| 115 |
+
num_candidates: 8
|
| 116 |
+
action_dim: 14
|
| 117 |
+
num_support_modes: 3
|
| 118 |
+
utility_margin: 0.1
|
| 119 |
+
num_heads: 4
|
| 120 |
+
num_layers: 2
|
| 121 |
+
num_phases: 5
|
| 122 |
+
num_arm_roles: 4
|
| 123 |
+
top_k: 4
|
| 124 |
+
loss_weights:
|
| 125 |
+
action: 1.0
|
| 126 |
+
phase: 0.15
|
| 127 |
+
arm_role: 0.2
|
| 128 |
+
support_mode: 0.15
|
| 129 |
+
corridor: 0.2
|
| 130 |
+
persistence: 0.1
|
| 131 |
+
disturbance: 0.1
|
| 132 |
+
world_model: 0.25
|
| 133 |
+
belief: 0.05
|
| 134 |
+
visibility: 0.05
|
| 135 |
+
clearance: 0.05
|
| 136 |
+
support_stability: 0.05
|
| 137 |
+
reocclusion: 0.05
|
| 138 |
+
occluder_contact: 0.05
|
| 139 |
+
grasp_affordance: 0.05
|
| 140 |
+
planner_success: 0.2
|
| 141 |
+
planner_risk: 0.1
|
| 142 |
+
planner_ranking: 0.1
|
| 143 |
+
proposal_reconstruction: 0.2
|
| 144 |
+
proposal_success: 0.1
|
| 145 |
+
proposal_ranking: 0.1
|
| 146 |
+
proposal_diversity: 0.05
|
| 147 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage2_clip_seed11.yaml
ADDED
|
@@ -0,0 +1,149 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage2_clip_seed11
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 11
|
| 5 |
+
init_checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt
|
| 6 |
+
init_strict: false
|
| 7 |
+
data:
|
| 8 |
+
proxies:
|
| 9 |
+
- foliage_proxy
|
| 10 |
+
- bag_proxy
|
| 11 |
+
- cloth_proxy
|
| 12 |
+
resolution: 224
|
| 13 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 14 |
+
train_episodes_per_proxy: 48
|
| 15 |
+
val_episodes_per_proxy: 16
|
| 16 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_clip224_v6_rgbd_stage2_seed11.pt
|
| 17 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_clip224_v6_rgbd_stage2_seed11.pt
|
| 18 |
+
rebuild_dataset: false
|
| 19 |
+
chunk_horizon: 8
|
| 20 |
+
rollout_horizon: 5
|
| 21 |
+
history_steps: 6
|
| 22 |
+
planner_candidates: 8
|
| 23 |
+
seed: 11
|
| 24 |
+
optim:
|
| 25 |
+
epochs: 4
|
| 26 |
+
batch_size: 2
|
| 27 |
+
num_workers: 4
|
| 28 |
+
lr: 0.0003
|
| 29 |
+
weight_decay: 0.0001
|
| 30 |
+
trainer:
|
| 31 |
+
policy_type: elastic_reveal
|
| 32 |
+
use_bf16: true
|
| 33 |
+
grad_clip_norm: 1.0
|
| 34 |
+
freeze_backbone: true
|
| 35 |
+
gradient_checkpointing: false
|
| 36 |
+
plan_during_train: true
|
| 37 |
+
plan_during_eval: true
|
| 38 |
+
support_mode_conditioning: true
|
| 39 |
+
planner_mode: trainable
|
| 40 |
+
use_depth: false
|
| 41 |
+
use_world_model: true
|
| 42 |
+
use_role_tokens: true
|
| 43 |
+
compute_equivariance_probe: true
|
| 44 |
+
policy:
|
| 45 |
+
backbone:
|
| 46 |
+
model_name: openai/clip-vit-base-patch32
|
| 47 |
+
hidden_dim: 512
|
| 48 |
+
max_text_tokens: 32
|
| 49 |
+
freeze_backbone: true
|
| 50 |
+
gradient_checkpointing: false
|
| 51 |
+
use_dummy_backbone: false
|
| 52 |
+
fusion:
|
| 53 |
+
hidden_dim: 512
|
| 54 |
+
num_cameras: 3
|
| 55 |
+
num_layers: 4
|
| 56 |
+
num_heads: 8
|
| 57 |
+
ff_dim: 2048
|
| 58 |
+
dropout: 0.1
|
| 59 |
+
proprio_dim: 32
|
| 60 |
+
proprio_tokens: 1
|
| 61 |
+
memory:
|
| 62 |
+
hidden_dim: 512
|
| 63 |
+
action_dim: 14
|
| 64 |
+
history_steps: 6
|
| 65 |
+
scene_history_steps: 3
|
| 66 |
+
belief_history_steps: 8
|
| 67 |
+
num_layers: 2
|
| 68 |
+
dropout: 0.1
|
| 69 |
+
memory_bank_size: 4
|
| 70 |
+
scene_bank_size: 2
|
| 71 |
+
belief_bank_size: 2
|
| 72 |
+
num_heads: 8
|
| 73 |
+
max_history_steps: 8
|
| 74 |
+
decoder:
|
| 75 |
+
hidden_dim: 512
|
| 76 |
+
num_heads: 8
|
| 77 |
+
num_layers: 4
|
| 78 |
+
ff_dim: 2048
|
| 79 |
+
dropout: 0.1
|
| 80 |
+
chunk_size: 8
|
| 81 |
+
action_dim: 14
|
| 82 |
+
arm_action_dim: 7
|
| 83 |
+
num_candidates: 8
|
| 84 |
+
num_phases: 5
|
| 85 |
+
num_arm_roles: 4
|
| 86 |
+
num_proposal_modes: 6
|
| 87 |
+
planner_top_k: 4
|
| 88 |
+
reveal_head:
|
| 89 |
+
hidden_dim: 512
|
| 90 |
+
num_support_modes: 3
|
| 91 |
+
num_approach_templates: 32
|
| 92 |
+
rollout_horizon: 5
|
| 93 |
+
belief_map_size: 32
|
| 94 |
+
field_size: 16
|
| 95 |
+
num_heads: 8
|
| 96 |
+
predict_belief_map: true
|
| 97 |
+
num_phases: 5
|
| 98 |
+
num_arm_roles: 4
|
| 99 |
+
num_interaction_tokens: 8
|
| 100 |
+
world_model:
|
| 101 |
+
hidden_dim: 512
|
| 102 |
+
action_dim: 14
|
| 103 |
+
num_support_modes: 3
|
| 104 |
+
num_approach_templates: 32
|
| 105 |
+
rollout_horizon: 5
|
| 106 |
+
field_size: 16
|
| 107 |
+
num_heads: 8
|
| 108 |
+
num_phases: 5
|
| 109 |
+
num_arm_roles: 4
|
| 110 |
+
num_interaction_tokens: 8
|
| 111 |
+
belief_map_size: 32
|
| 112 |
+
predict_belief_map: true
|
| 113 |
+
scene_bank_size: 2
|
| 114 |
+
belief_bank_size: 2
|
| 115 |
+
planner:
|
| 116 |
+
hidden_dim: 512
|
| 117 |
+
num_candidates: 8
|
| 118 |
+
action_dim: 14
|
| 119 |
+
num_support_modes: 3
|
| 120 |
+
utility_margin: 0.1
|
| 121 |
+
num_heads: 8
|
| 122 |
+
num_layers: 2
|
| 123 |
+
num_phases: 5
|
| 124 |
+
num_arm_roles: 4
|
| 125 |
+
top_k: 4
|
| 126 |
+
loss_weights:
|
| 127 |
+
action: 1.0
|
| 128 |
+
phase: 0.1
|
| 129 |
+
arm_role: 0.15
|
| 130 |
+
support_mode: 0.1
|
| 131 |
+
corridor: 0.15
|
| 132 |
+
persistence: 0.05
|
| 133 |
+
disturbance: 0.05
|
| 134 |
+
world_model: 0.25
|
| 135 |
+
belief: 0.05
|
| 136 |
+
visibility: 0.05
|
| 137 |
+
clearance: 0.05
|
| 138 |
+
support_stability: 0.05
|
| 139 |
+
reocclusion: 0.05
|
| 140 |
+
occluder_contact: 0.05
|
| 141 |
+
grasp_affordance: 0.05
|
| 142 |
+
planner_success: 0.25
|
| 143 |
+
planner_risk: 0.1
|
| 144 |
+
planner_ranking: 0.2
|
| 145 |
+
proposal_reconstruction: 0.1
|
| 146 |
+
proposal_success: 0.15
|
| 147 |
+
proposal_ranking: 0.2
|
| 148 |
+
proposal_diversity: 0.05
|
| 149 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage2_clip_seed12.yaml
ADDED
|
@@ -0,0 +1,149 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage2_clip_seed12
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 12
|
| 5 |
+
init_checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt
|
| 6 |
+
init_strict: false
|
| 7 |
+
data:
|
| 8 |
+
proxies:
|
| 9 |
+
- foliage_proxy
|
| 10 |
+
- bag_proxy
|
| 11 |
+
- cloth_proxy
|
| 12 |
+
resolution: 224
|
| 13 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 14 |
+
train_episodes_per_proxy: 48
|
| 15 |
+
val_episodes_per_proxy: 16
|
| 16 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_clip224_v6_rgbd_stage2_seed12.pt
|
| 17 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_clip224_v6_rgbd_stage2_seed12.pt
|
| 18 |
+
rebuild_dataset: false
|
| 19 |
+
chunk_horizon: 8
|
| 20 |
+
rollout_horizon: 5
|
| 21 |
+
history_steps: 6
|
| 22 |
+
planner_candidates: 8
|
| 23 |
+
seed: 12
|
| 24 |
+
optim:
|
| 25 |
+
epochs: 4
|
| 26 |
+
batch_size: 2
|
| 27 |
+
num_workers: 4
|
| 28 |
+
lr: 0.0003
|
| 29 |
+
weight_decay: 0.0001
|
| 30 |
+
trainer:
|
| 31 |
+
policy_type: elastic_reveal
|
| 32 |
+
use_bf16: true
|
| 33 |
+
grad_clip_norm: 1.0
|
| 34 |
+
freeze_backbone: true
|
| 35 |
+
gradient_checkpointing: false
|
| 36 |
+
plan_during_train: true
|
| 37 |
+
plan_during_eval: true
|
| 38 |
+
support_mode_conditioning: true
|
| 39 |
+
planner_mode: trainable
|
| 40 |
+
use_depth: false
|
| 41 |
+
use_world_model: true
|
| 42 |
+
use_role_tokens: true
|
| 43 |
+
compute_equivariance_probe: true
|
| 44 |
+
policy:
|
| 45 |
+
backbone:
|
| 46 |
+
model_name: openai/clip-vit-base-patch32
|
| 47 |
+
hidden_dim: 512
|
| 48 |
+
max_text_tokens: 32
|
| 49 |
+
freeze_backbone: true
|
| 50 |
+
gradient_checkpointing: false
|
| 51 |
+
use_dummy_backbone: false
|
| 52 |
+
fusion:
|
| 53 |
+
hidden_dim: 512
|
| 54 |
+
num_cameras: 3
|
| 55 |
+
num_layers: 4
|
| 56 |
+
num_heads: 8
|
| 57 |
+
ff_dim: 2048
|
| 58 |
+
dropout: 0.1
|
| 59 |
+
proprio_dim: 32
|
| 60 |
+
proprio_tokens: 1
|
| 61 |
+
memory:
|
| 62 |
+
hidden_dim: 512
|
| 63 |
+
action_dim: 14
|
| 64 |
+
history_steps: 6
|
| 65 |
+
scene_history_steps: 3
|
| 66 |
+
belief_history_steps: 8
|
| 67 |
+
num_layers: 2
|
| 68 |
+
dropout: 0.1
|
| 69 |
+
memory_bank_size: 4
|
| 70 |
+
scene_bank_size: 2
|
| 71 |
+
belief_bank_size: 2
|
| 72 |
+
num_heads: 8
|
| 73 |
+
max_history_steps: 8
|
| 74 |
+
decoder:
|
| 75 |
+
hidden_dim: 512
|
| 76 |
+
num_heads: 8
|
| 77 |
+
num_layers: 4
|
| 78 |
+
ff_dim: 2048
|
| 79 |
+
dropout: 0.1
|
| 80 |
+
chunk_size: 8
|
| 81 |
+
action_dim: 14
|
| 82 |
+
arm_action_dim: 7
|
| 83 |
+
num_candidates: 8
|
| 84 |
+
num_phases: 5
|
| 85 |
+
num_arm_roles: 4
|
| 86 |
+
num_proposal_modes: 6
|
| 87 |
+
planner_top_k: 4
|
| 88 |
+
reveal_head:
|
| 89 |
+
hidden_dim: 512
|
| 90 |
+
num_support_modes: 3
|
| 91 |
+
num_approach_templates: 32
|
| 92 |
+
rollout_horizon: 5
|
| 93 |
+
belief_map_size: 32
|
| 94 |
+
field_size: 16
|
| 95 |
+
num_heads: 8
|
| 96 |
+
predict_belief_map: true
|
| 97 |
+
num_phases: 5
|
| 98 |
+
num_arm_roles: 4
|
| 99 |
+
num_interaction_tokens: 8
|
| 100 |
+
world_model:
|
| 101 |
+
hidden_dim: 512
|
| 102 |
+
action_dim: 14
|
| 103 |
+
num_support_modes: 3
|
| 104 |
+
num_approach_templates: 32
|
| 105 |
+
rollout_horizon: 5
|
| 106 |
+
field_size: 16
|
| 107 |
+
num_heads: 8
|
| 108 |
+
num_phases: 5
|
| 109 |
+
num_arm_roles: 4
|
| 110 |
+
num_interaction_tokens: 8
|
| 111 |
+
belief_map_size: 32
|
| 112 |
+
predict_belief_map: true
|
| 113 |
+
scene_bank_size: 2
|
| 114 |
+
belief_bank_size: 2
|
| 115 |
+
planner:
|
| 116 |
+
hidden_dim: 512
|
| 117 |
+
num_candidates: 8
|
| 118 |
+
action_dim: 14
|
| 119 |
+
num_support_modes: 3
|
| 120 |
+
utility_margin: 0.1
|
| 121 |
+
num_heads: 8
|
| 122 |
+
num_layers: 2
|
| 123 |
+
num_phases: 5
|
| 124 |
+
num_arm_roles: 4
|
| 125 |
+
top_k: 4
|
| 126 |
+
loss_weights:
|
| 127 |
+
action: 1.0
|
| 128 |
+
phase: 0.1
|
| 129 |
+
arm_role: 0.15
|
| 130 |
+
support_mode: 0.1
|
| 131 |
+
corridor: 0.15
|
| 132 |
+
persistence: 0.05
|
| 133 |
+
disturbance: 0.05
|
| 134 |
+
world_model: 0.25
|
| 135 |
+
belief: 0.05
|
| 136 |
+
visibility: 0.05
|
| 137 |
+
clearance: 0.05
|
| 138 |
+
support_stability: 0.05
|
| 139 |
+
reocclusion: 0.05
|
| 140 |
+
occluder_contact: 0.05
|
| 141 |
+
grasp_affordance: 0.05
|
| 142 |
+
planner_success: 0.25
|
| 143 |
+
planner_risk: 0.1
|
| 144 |
+
planner_ranking: 0.2
|
| 145 |
+
proposal_reconstruction: 0.1
|
| 146 |
+
proposal_success: 0.15
|
| 147 |
+
proposal_ranking: 0.2
|
| 148 |
+
proposal_diversity: 0.05
|
| 149 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage2_clip_seed13.yaml
ADDED
|
@@ -0,0 +1,149 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage2_clip_seed13
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 13
|
| 5 |
+
init_checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt
|
| 6 |
+
init_strict: false
|
| 7 |
+
data:
|
| 8 |
+
proxies:
|
| 9 |
+
- foliage_proxy
|
| 10 |
+
- bag_proxy
|
| 11 |
+
- cloth_proxy
|
| 12 |
+
resolution: 224
|
| 13 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 14 |
+
train_episodes_per_proxy: 48
|
| 15 |
+
val_episodes_per_proxy: 16
|
| 16 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_clip224_v6_rgbd_stage2_seed13.pt
|
| 17 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_clip224_v6_rgbd_stage2_seed13.pt
|
| 18 |
+
rebuild_dataset: false
|
| 19 |
+
chunk_horizon: 8
|
| 20 |
+
rollout_horizon: 5
|
| 21 |
+
history_steps: 6
|
| 22 |
+
planner_candidates: 8
|
| 23 |
+
seed: 13
|
| 24 |
+
optim:
|
| 25 |
+
epochs: 4
|
| 26 |
+
batch_size: 2
|
| 27 |
+
num_workers: 4
|
| 28 |
+
lr: 0.0003
|
| 29 |
+
weight_decay: 0.0001
|
| 30 |
+
trainer:
|
| 31 |
+
policy_type: elastic_reveal
|
| 32 |
+
use_bf16: true
|
| 33 |
+
grad_clip_norm: 1.0
|
| 34 |
+
freeze_backbone: true
|
| 35 |
+
gradient_checkpointing: false
|
| 36 |
+
plan_during_train: true
|
| 37 |
+
plan_during_eval: true
|
| 38 |
+
support_mode_conditioning: true
|
| 39 |
+
planner_mode: trainable
|
| 40 |
+
use_depth: false
|
| 41 |
+
use_world_model: true
|
| 42 |
+
use_role_tokens: true
|
| 43 |
+
compute_equivariance_probe: true
|
| 44 |
+
policy:
|
| 45 |
+
backbone:
|
| 46 |
+
model_name: openai/clip-vit-base-patch32
|
| 47 |
+
hidden_dim: 512
|
| 48 |
+
max_text_tokens: 32
|
| 49 |
+
freeze_backbone: true
|
| 50 |
+
gradient_checkpointing: false
|
| 51 |
+
use_dummy_backbone: false
|
| 52 |
+
fusion:
|
| 53 |
+
hidden_dim: 512
|
| 54 |
+
num_cameras: 3
|
| 55 |
+
num_layers: 4
|
| 56 |
+
num_heads: 8
|
| 57 |
+
ff_dim: 2048
|
| 58 |
+
dropout: 0.1
|
| 59 |
+
proprio_dim: 32
|
| 60 |
+
proprio_tokens: 1
|
| 61 |
+
memory:
|
| 62 |
+
hidden_dim: 512
|
| 63 |
+
action_dim: 14
|
| 64 |
+
history_steps: 6
|
| 65 |
+
scene_history_steps: 3
|
| 66 |
+
belief_history_steps: 8
|
| 67 |
+
num_layers: 2
|
| 68 |
+
dropout: 0.1
|
| 69 |
+
memory_bank_size: 4
|
| 70 |
+
scene_bank_size: 2
|
| 71 |
+
belief_bank_size: 2
|
| 72 |
+
num_heads: 8
|
| 73 |
+
max_history_steps: 8
|
| 74 |
+
decoder:
|
| 75 |
+
hidden_dim: 512
|
| 76 |
+
num_heads: 8
|
| 77 |
+
num_layers: 4
|
| 78 |
+
ff_dim: 2048
|
| 79 |
+
dropout: 0.1
|
| 80 |
+
chunk_size: 8
|
| 81 |
+
action_dim: 14
|
| 82 |
+
arm_action_dim: 7
|
| 83 |
+
num_candidates: 8
|
| 84 |
+
num_phases: 5
|
| 85 |
+
num_arm_roles: 4
|
| 86 |
+
num_proposal_modes: 6
|
| 87 |
+
planner_top_k: 4
|
| 88 |
+
reveal_head:
|
| 89 |
+
hidden_dim: 512
|
| 90 |
+
num_support_modes: 3
|
| 91 |
+
num_approach_templates: 32
|
| 92 |
+
rollout_horizon: 5
|
| 93 |
+
belief_map_size: 32
|
| 94 |
+
field_size: 16
|
| 95 |
+
num_heads: 8
|
| 96 |
+
predict_belief_map: true
|
| 97 |
+
num_phases: 5
|
| 98 |
+
num_arm_roles: 4
|
| 99 |
+
num_interaction_tokens: 8
|
| 100 |
+
world_model:
|
| 101 |
+
hidden_dim: 512
|
| 102 |
+
action_dim: 14
|
| 103 |
+
num_support_modes: 3
|
| 104 |
+
num_approach_templates: 32
|
| 105 |
+
rollout_horizon: 5
|
| 106 |
+
field_size: 16
|
| 107 |
+
num_heads: 8
|
| 108 |
+
num_phases: 5
|
| 109 |
+
num_arm_roles: 4
|
| 110 |
+
num_interaction_tokens: 8
|
| 111 |
+
belief_map_size: 32
|
| 112 |
+
predict_belief_map: true
|
| 113 |
+
scene_bank_size: 2
|
| 114 |
+
belief_bank_size: 2
|
| 115 |
+
planner:
|
| 116 |
+
hidden_dim: 512
|
| 117 |
+
num_candidates: 8
|
| 118 |
+
action_dim: 14
|
| 119 |
+
num_support_modes: 3
|
| 120 |
+
utility_margin: 0.1
|
| 121 |
+
num_heads: 8
|
| 122 |
+
num_layers: 2
|
| 123 |
+
num_phases: 5
|
| 124 |
+
num_arm_roles: 4
|
| 125 |
+
top_k: 4
|
| 126 |
+
loss_weights:
|
| 127 |
+
action: 1.0
|
| 128 |
+
phase: 0.1
|
| 129 |
+
arm_role: 0.15
|
| 130 |
+
support_mode: 0.1
|
| 131 |
+
corridor: 0.15
|
| 132 |
+
persistence: 0.05
|
| 133 |
+
disturbance: 0.05
|
| 134 |
+
world_model: 0.25
|
| 135 |
+
belief: 0.05
|
| 136 |
+
visibility: 0.05
|
| 137 |
+
clearance: 0.05
|
| 138 |
+
support_stability: 0.05
|
| 139 |
+
reocclusion: 0.05
|
| 140 |
+
occluder_contact: 0.05
|
| 141 |
+
grasp_affordance: 0.05
|
| 142 |
+
planner_success: 0.25
|
| 143 |
+
planner_risk: 0.1
|
| 144 |
+
planner_ranking: 0.2
|
| 145 |
+
proposal_reconstruction: 0.1
|
| 146 |
+
proposal_success: 0.15
|
| 147 |
+
proposal_ranking: 0.2
|
| 148 |
+
proposal_diversity: 0.05
|
| 149 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage2_dummy_seed21.yaml
ADDED
|
@@ -0,0 +1,148 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage2_dummy_seed21
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 21
|
| 5 |
+
defaults: []
|
| 6 |
+
data:
|
| 7 |
+
proxies:
|
| 8 |
+
- foliage_proxy
|
| 9 |
+
- bag_proxy
|
| 10 |
+
- cloth_proxy
|
| 11 |
+
resolution: 96
|
| 12 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 13 |
+
train_episodes_per_proxy: 48
|
| 14 |
+
val_episodes_per_proxy: 16
|
| 15 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_v6_rgbd_stage2_dummy_seed21.pt
|
| 16 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_v6_rgbd_stage2_dummy_seed21.pt
|
| 17 |
+
rebuild_dataset: false
|
| 18 |
+
chunk_horizon: 8
|
| 19 |
+
rollout_horizon: 5
|
| 20 |
+
history_steps: 6
|
| 21 |
+
planner_candidates: 8
|
| 22 |
+
seed: 21
|
| 23 |
+
optim:
|
| 24 |
+
epochs: 4
|
| 25 |
+
batch_size: 16
|
| 26 |
+
num_workers: 4
|
| 27 |
+
lr: 0.001
|
| 28 |
+
weight_decay: 0.0001
|
| 29 |
+
trainer:
|
| 30 |
+
policy_type: elastic_reveal
|
| 31 |
+
use_bf16: false
|
| 32 |
+
grad_clip_norm: 1.0
|
| 33 |
+
freeze_backbone: true
|
| 34 |
+
gradient_checkpointing: false
|
| 35 |
+
plan_during_train: true
|
| 36 |
+
plan_during_eval: true
|
| 37 |
+
support_mode_conditioning: true
|
| 38 |
+
planner_mode: trainable
|
| 39 |
+
use_depth: false
|
| 40 |
+
use_world_model: true
|
| 41 |
+
use_role_tokens: true
|
| 42 |
+
compute_equivariance_probe: true
|
| 43 |
+
policy:
|
| 44 |
+
backbone:
|
| 45 |
+
model_name: openai/clip-vit-base-patch32
|
| 46 |
+
hidden_dim: 192
|
| 47 |
+
max_text_tokens: 32
|
| 48 |
+
freeze_backbone: true
|
| 49 |
+
gradient_checkpointing: false
|
| 50 |
+
use_dummy_backbone: true
|
| 51 |
+
fusion:
|
| 52 |
+
hidden_dim: 192
|
| 53 |
+
num_cameras: 3
|
| 54 |
+
num_layers: 2
|
| 55 |
+
num_heads: 4
|
| 56 |
+
ff_dim: 384
|
| 57 |
+
dropout: 0.1
|
| 58 |
+
proprio_dim: 32
|
| 59 |
+
proprio_tokens: 1
|
| 60 |
+
memory:
|
| 61 |
+
hidden_dim: 192
|
| 62 |
+
action_dim: 14
|
| 63 |
+
history_steps: 6
|
| 64 |
+
scene_history_steps: 3
|
| 65 |
+
belief_history_steps: 8
|
| 66 |
+
num_layers: 2
|
| 67 |
+
dropout: 0.1
|
| 68 |
+
memory_bank_size: 4
|
| 69 |
+
scene_bank_size: 2
|
| 70 |
+
belief_bank_size: 2
|
| 71 |
+
num_heads: 4
|
| 72 |
+
max_history_steps: 8
|
| 73 |
+
decoder:
|
| 74 |
+
hidden_dim: 192
|
| 75 |
+
num_heads: 4
|
| 76 |
+
num_layers: 2
|
| 77 |
+
ff_dim: 384
|
| 78 |
+
dropout: 0.1
|
| 79 |
+
chunk_size: 8
|
| 80 |
+
action_dim: 14
|
| 81 |
+
arm_action_dim: 7
|
| 82 |
+
num_candidates: 8
|
| 83 |
+
num_phases: 5
|
| 84 |
+
num_arm_roles: 4
|
| 85 |
+
num_proposal_modes: 6
|
| 86 |
+
planner_top_k: 4
|
| 87 |
+
reveal_head:
|
| 88 |
+
hidden_dim: 192
|
| 89 |
+
num_support_modes: 3
|
| 90 |
+
num_approach_templates: 32
|
| 91 |
+
rollout_horizon: 5
|
| 92 |
+
belief_map_size: 32
|
| 93 |
+
field_size: 16
|
| 94 |
+
num_heads: 4
|
| 95 |
+
predict_belief_map: true
|
| 96 |
+
num_phases: 5
|
| 97 |
+
num_arm_roles: 4
|
| 98 |
+
num_interaction_tokens: 8
|
| 99 |
+
world_model:
|
| 100 |
+
hidden_dim: 192
|
| 101 |
+
action_dim: 14
|
| 102 |
+
num_support_modes: 3
|
| 103 |
+
num_approach_templates: 32
|
| 104 |
+
rollout_horizon: 5
|
| 105 |
+
field_size: 16
|
| 106 |
+
num_heads: 4
|
| 107 |
+
num_phases: 5
|
| 108 |
+
num_arm_roles: 4
|
| 109 |
+
num_interaction_tokens: 8
|
| 110 |
+
belief_map_size: 32
|
| 111 |
+
predict_belief_map: true
|
| 112 |
+
scene_bank_size: 2
|
| 113 |
+
belief_bank_size: 2
|
| 114 |
+
planner:
|
| 115 |
+
hidden_dim: 192
|
| 116 |
+
num_candidates: 8
|
| 117 |
+
action_dim: 14
|
| 118 |
+
num_support_modes: 3
|
| 119 |
+
utility_margin: 0.1
|
| 120 |
+
num_heads: 4
|
| 121 |
+
num_layers: 2
|
| 122 |
+
num_phases: 5
|
| 123 |
+
num_arm_roles: 4
|
| 124 |
+
top_k: 4
|
| 125 |
+
loss_weights:
|
| 126 |
+
action: 1.0
|
| 127 |
+
phase: 0.15
|
| 128 |
+
arm_role: 0.2
|
| 129 |
+
support_mode: 0.15
|
| 130 |
+
corridor: 0.2
|
| 131 |
+
persistence: 0.1
|
| 132 |
+
disturbance: 0.1
|
| 133 |
+
world_model: 0.3
|
| 134 |
+
belief: 0.05
|
| 135 |
+
visibility: 0.05
|
| 136 |
+
clearance: 0.05
|
| 137 |
+
support_stability: 0.05
|
| 138 |
+
reocclusion: 0.05
|
| 139 |
+
occluder_contact: 0.05
|
| 140 |
+
grasp_affordance: 0.05
|
| 141 |
+
planner_success: 0.2
|
| 142 |
+
planner_risk: 0.1
|
| 143 |
+
planner_ranking: 0.1
|
| 144 |
+
proposal_reconstruction: 0.2
|
| 145 |
+
proposal_success: 0.1
|
| 146 |
+
proposal_ranking: 0.1
|
| 147 |
+
proposal_diversity: 0.05
|
| 148 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage2_dummy_seed22.yaml
ADDED
|
@@ -0,0 +1,148 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage2_dummy_seed22
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 22
|
| 5 |
+
defaults: []
|
| 6 |
+
data:
|
| 7 |
+
proxies:
|
| 8 |
+
- foliage_proxy
|
| 9 |
+
- bag_proxy
|
| 10 |
+
- cloth_proxy
|
| 11 |
+
resolution: 96
|
| 12 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 13 |
+
train_episodes_per_proxy: 48
|
| 14 |
+
val_episodes_per_proxy: 16
|
| 15 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_v6_rgbd_stage2_dummy_seed22.pt
|
| 16 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_v6_rgbd_stage2_dummy_seed22.pt
|
| 17 |
+
rebuild_dataset: false
|
| 18 |
+
chunk_horizon: 8
|
| 19 |
+
rollout_horizon: 5
|
| 20 |
+
history_steps: 6
|
| 21 |
+
planner_candidates: 8
|
| 22 |
+
seed: 22
|
| 23 |
+
optim:
|
| 24 |
+
epochs: 4
|
| 25 |
+
batch_size: 16
|
| 26 |
+
num_workers: 4
|
| 27 |
+
lr: 0.001
|
| 28 |
+
weight_decay: 0.0001
|
| 29 |
+
trainer:
|
| 30 |
+
policy_type: elastic_reveal
|
| 31 |
+
use_bf16: false
|
| 32 |
+
grad_clip_norm: 1.0
|
| 33 |
+
freeze_backbone: true
|
| 34 |
+
gradient_checkpointing: false
|
| 35 |
+
plan_during_train: true
|
| 36 |
+
plan_during_eval: true
|
| 37 |
+
support_mode_conditioning: true
|
| 38 |
+
planner_mode: trainable
|
| 39 |
+
use_depth: false
|
| 40 |
+
use_world_model: true
|
| 41 |
+
use_role_tokens: true
|
| 42 |
+
compute_equivariance_probe: true
|
| 43 |
+
policy:
|
| 44 |
+
backbone:
|
| 45 |
+
model_name: openai/clip-vit-base-patch32
|
| 46 |
+
hidden_dim: 192
|
| 47 |
+
max_text_tokens: 32
|
| 48 |
+
freeze_backbone: true
|
| 49 |
+
gradient_checkpointing: false
|
| 50 |
+
use_dummy_backbone: true
|
| 51 |
+
fusion:
|
| 52 |
+
hidden_dim: 192
|
| 53 |
+
num_cameras: 3
|
| 54 |
+
num_layers: 2
|
| 55 |
+
num_heads: 4
|
| 56 |
+
ff_dim: 384
|
| 57 |
+
dropout: 0.1
|
| 58 |
+
proprio_dim: 32
|
| 59 |
+
proprio_tokens: 1
|
| 60 |
+
memory:
|
| 61 |
+
hidden_dim: 192
|
| 62 |
+
action_dim: 14
|
| 63 |
+
history_steps: 6
|
| 64 |
+
scene_history_steps: 3
|
| 65 |
+
belief_history_steps: 8
|
| 66 |
+
num_layers: 2
|
| 67 |
+
dropout: 0.1
|
| 68 |
+
memory_bank_size: 4
|
| 69 |
+
scene_bank_size: 2
|
| 70 |
+
belief_bank_size: 2
|
| 71 |
+
num_heads: 4
|
| 72 |
+
max_history_steps: 8
|
| 73 |
+
decoder:
|
| 74 |
+
hidden_dim: 192
|
| 75 |
+
num_heads: 4
|
| 76 |
+
num_layers: 2
|
| 77 |
+
ff_dim: 384
|
| 78 |
+
dropout: 0.1
|
| 79 |
+
chunk_size: 8
|
| 80 |
+
action_dim: 14
|
| 81 |
+
arm_action_dim: 7
|
| 82 |
+
num_candidates: 8
|
| 83 |
+
num_phases: 5
|
| 84 |
+
num_arm_roles: 4
|
| 85 |
+
num_proposal_modes: 6
|
| 86 |
+
planner_top_k: 4
|
| 87 |
+
reveal_head:
|
| 88 |
+
hidden_dim: 192
|
| 89 |
+
num_support_modes: 3
|
| 90 |
+
num_approach_templates: 32
|
| 91 |
+
rollout_horizon: 5
|
| 92 |
+
belief_map_size: 32
|
| 93 |
+
field_size: 16
|
| 94 |
+
num_heads: 4
|
| 95 |
+
predict_belief_map: true
|
| 96 |
+
num_phases: 5
|
| 97 |
+
num_arm_roles: 4
|
| 98 |
+
num_interaction_tokens: 8
|
| 99 |
+
world_model:
|
| 100 |
+
hidden_dim: 192
|
| 101 |
+
action_dim: 14
|
| 102 |
+
num_support_modes: 3
|
| 103 |
+
num_approach_templates: 32
|
| 104 |
+
rollout_horizon: 5
|
| 105 |
+
field_size: 16
|
| 106 |
+
num_heads: 4
|
| 107 |
+
num_phases: 5
|
| 108 |
+
num_arm_roles: 4
|
| 109 |
+
num_interaction_tokens: 8
|
| 110 |
+
belief_map_size: 32
|
| 111 |
+
predict_belief_map: true
|
| 112 |
+
scene_bank_size: 2
|
| 113 |
+
belief_bank_size: 2
|
| 114 |
+
planner:
|
| 115 |
+
hidden_dim: 192
|
| 116 |
+
num_candidates: 8
|
| 117 |
+
action_dim: 14
|
| 118 |
+
num_support_modes: 3
|
| 119 |
+
utility_margin: 0.1
|
| 120 |
+
num_heads: 4
|
| 121 |
+
num_layers: 2
|
| 122 |
+
num_phases: 5
|
| 123 |
+
num_arm_roles: 4
|
| 124 |
+
top_k: 4
|
| 125 |
+
loss_weights:
|
| 126 |
+
action: 1.0
|
| 127 |
+
phase: 0.15
|
| 128 |
+
arm_role: 0.2
|
| 129 |
+
support_mode: 0.15
|
| 130 |
+
corridor: 0.2
|
| 131 |
+
persistence: 0.1
|
| 132 |
+
disturbance: 0.1
|
| 133 |
+
world_model: 0.3
|
| 134 |
+
belief: 0.05
|
| 135 |
+
visibility: 0.05
|
| 136 |
+
clearance: 0.05
|
| 137 |
+
support_stability: 0.05
|
| 138 |
+
reocclusion: 0.05
|
| 139 |
+
occluder_contact: 0.05
|
| 140 |
+
grasp_affordance: 0.05
|
| 141 |
+
planner_success: 0.2
|
| 142 |
+
planner_risk: 0.1
|
| 143 |
+
planner_ranking: 0.1
|
| 144 |
+
proposal_reconstruction: 0.2
|
| 145 |
+
proposal_success: 0.1
|
| 146 |
+
proposal_ranking: 0.1
|
| 147 |
+
proposal_diversity: 0.05
|
| 148 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage2_dummy_seed23.yaml
ADDED
|
@@ -0,0 +1,148 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage2_dummy_seed23
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 23
|
| 5 |
+
defaults: []
|
| 6 |
+
data:
|
| 7 |
+
proxies:
|
| 8 |
+
- foliage_proxy
|
| 9 |
+
- bag_proxy
|
| 10 |
+
- cloth_proxy
|
| 11 |
+
resolution: 96
|
| 12 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 13 |
+
train_episodes_per_proxy: 48
|
| 14 |
+
val_episodes_per_proxy: 16
|
| 15 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_v6_rgbd_stage2_dummy_seed23.pt
|
| 16 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_v6_rgbd_stage2_dummy_seed23.pt
|
| 17 |
+
rebuild_dataset: false
|
| 18 |
+
chunk_horizon: 8
|
| 19 |
+
rollout_horizon: 5
|
| 20 |
+
history_steps: 6
|
| 21 |
+
planner_candidates: 8
|
| 22 |
+
seed: 23
|
| 23 |
+
optim:
|
| 24 |
+
epochs: 4
|
| 25 |
+
batch_size: 16
|
| 26 |
+
num_workers: 4
|
| 27 |
+
lr: 0.001
|
| 28 |
+
weight_decay: 0.0001
|
| 29 |
+
trainer:
|
| 30 |
+
policy_type: elastic_reveal
|
| 31 |
+
use_bf16: false
|
| 32 |
+
grad_clip_norm: 1.0
|
| 33 |
+
freeze_backbone: true
|
| 34 |
+
gradient_checkpointing: false
|
| 35 |
+
plan_during_train: true
|
| 36 |
+
plan_during_eval: true
|
| 37 |
+
support_mode_conditioning: true
|
| 38 |
+
planner_mode: trainable
|
| 39 |
+
use_depth: false
|
| 40 |
+
use_world_model: true
|
| 41 |
+
use_role_tokens: true
|
| 42 |
+
compute_equivariance_probe: true
|
| 43 |
+
policy:
|
| 44 |
+
backbone:
|
| 45 |
+
model_name: openai/clip-vit-base-patch32
|
| 46 |
+
hidden_dim: 192
|
| 47 |
+
max_text_tokens: 32
|
| 48 |
+
freeze_backbone: true
|
| 49 |
+
gradient_checkpointing: false
|
| 50 |
+
use_dummy_backbone: true
|
| 51 |
+
fusion:
|
| 52 |
+
hidden_dim: 192
|
| 53 |
+
num_cameras: 3
|
| 54 |
+
num_layers: 2
|
| 55 |
+
num_heads: 4
|
| 56 |
+
ff_dim: 384
|
| 57 |
+
dropout: 0.1
|
| 58 |
+
proprio_dim: 32
|
| 59 |
+
proprio_tokens: 1
|
| 60 |
+
memory:
|
| 61 |
+
hidden_dim: 192
|
| 62 |
+
action_dim: 14
|
| 63 |
+
history_steps: 6
|
| 64 |
+
scene_history_steps: 3
|
| 65 |
+
belief_history_steps: 8
|
| 66 |
+
num_layers: 2
|
| 67 |
+
dropout: 0.1
|
| 68 |
+
memory_bank_size: 4
|
| 69 |
+
scene_bank_size: 2
|
| 70 |
+
belief_bank_size: 2
|
| 71 |
+
num_heads: 4
|
| 72 |
+
max_history_steps: 8
|
| 73 |
+
decoder:
|
| 74 |
+
hidden_dim: 192
|
| 75 |
+
num_heads: 4
|
| 76 |
+
num_layers: 2
|
| 77 |
+
ff_dim: 384
|
| 78 |
+
dropout: 0.1
|
| 79 |
+
chunk_size: 8
|
| 80 |
+
action_dim: 14
|
| 81 |
+
arm_action_dim: 7
|
| 82 |
+
num_candidates: 8
|
| 83 |
+
num_phases: 5
|
| 84 |
+
num_arm_roles: 4
|
| 85 |
+
num_proposal_modes: 6
|
| 86 |
+
planner_top_k: 4
|
| 87 |
+
reveal_head:
|
| 88 |
+
hidden_dim: 192
|
| 89 |
+
num_support_modes: 3
|
| 90 |
+
num_approach_templates: 32
|
| 91 |
+
rollout_horizon: 5
|
| 92 |
+
belief_map_size: 32
|
| 93 |
+
field_size: 16
|
| 94 |
+
num_heads: 4
|
| 95 |
+
predict_belief_map: true
|
| 96 |
+
num_phases: 5
|
| 97 |
+
num_arm_roles: 4
|
| 98 |
+
num_interaction_tokens: 8
|
| 99 |
+
world_model:
|
| 100 |
+
hidden_dim: 192
|
| 101 |
+
action_dim: 14
|
| 102 |
+
num_support_modes: 3
|
| 103 |
+
num_approach_templates: 32
|
| 104 |
+
rollout_horizon: 5
|
| 105 |
+
field_size: 16
|
| 106 |
+
num_heads: 4
|
| 107 |
+
num_phases: 5
|
| 108 |
+
num_arm_roles: 4
|
| 109 |
+
num_interaction_tokens: 8
|
| 110 |
+
belief_map_size: 32
|
| 111 |
+
predict_belief_map: true
|
| 112 |
+
scene_bank_size: 2
|
| 113 |
+
belief_bank_size: 2
|
| 114 |
+
planner:
|
| 115 |
+
hidden_dim: 192
|
| 116 |
+
num_candidates: 8
|
| 117 |
+
action_dim: 14
|
| 118 |
+
num_support_modes: 3
|
| 119 |
+
utility_margin: 0.1
|
| 120 |
+
num_heads: 4
|
| 121 |
+
num_layers: 2
|
| 122 |
+
num_phases: 5
|
| 123 |
+
num_arm_roles: 4
|
| 124 |
+
top_k: 4
|
| 125 |
+
loss_weights:
|
| 126 |
+
action: 1.0
|
| 127 |
+
phase: 0.15
|
| 128 |
+
arm_role: 0.2
|
| 129 |
+
support_mode: 0.15
|
| 130 |
+
corridor: 0.2
|
| 131 |
+
persistence: 0.1
|
| 132 |
+
disturbance: 0.1
|
| 133 |
+
world_model: 0.3
|
| 134 |
+
belief: 0.05
|
| 135 |
+
visibility: 0.05
|
| 136 |
+
clearance: 0.05
|
| 137 |
+
support_stability: 0.05
|
| 138 |
+
reocclusion: 0.05
|
| 139 |
+
occluder_contact: 0.05
|
| 140 |
+
grasp_affordance: 0.05
|
| 141 |
+
planner_success: 0.2
|
| 142 |
+
planner_risk: 0.1
|
| 143 |
+
planner_ranking: 0.1
|
| 144 |
+
proposal_reconstruction: 0.2
|
| 145 |
+
proposal_success: 0.1
|
| 146 |
+
proposal_ranking: 0.1
|
| 147 |
+
proposal_diversity: 0.05
|
| 148 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage3_clip_rgbd_seed17.yaml
ADDED
|
@@ -0,0 +1,149 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage3_clip_rgbd_seed17
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 17
|
| 5 |
+
init_checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt
|
| 6 |
+
init_strict: false
|
| 7 |
+
data:
|
| 8 |
+
proxies:
|
| 9 |
+
- foliage_proxy
|
| 10 |
+
- bag_proxy
|
| 11 |
+
- cloth_proxy
|
| 12 |
+
resolution: 224
|
| 13 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 14 |
+
train_episodes_per_proxy: 48
|
| 15 |
+
val_episodes_per_proxy: 16
|
| 16 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_clip224_v6_rgbd_stage3_seed17.pt
|
| 17 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_clip224_v6_rgbd_stage3_seed17.pt
|
| 18 |
+
rebuild_dataset: false
|
| 19 |
+
chunk_horizon: 8
|
| 20 |
+
rollout_horizon: 5
|
| 21 |
+
history_steps: 6
|
| 22 |
+
planner_candidates: 8
|
| 23 |
+
seed: 17
|
| 24 |
+
optim:
|
| 25 |
+
epochs: 4
|
| 26 |
+
batch_size: 2
|
| 27 |
+
num_workers: 4
|
| 28 |
+
lr: 0.0003
|
| 29 |
+
weight_decay: 0.0001
|
| 30 |
+
trainer:
|
| 31 |
+
policy_type: elastic_reveal
|
| 32 |
+
use_bf16: true
|
| 33 |
+
grad_clip_norm: 1.0
|
| 34 |
+
freeze_backbone: true
|
| 35 |
+
gradient_checkpointing: false
|
| 36 |
+
plan_during_train: true
|
| 37 |
+
plan_during_eval: true
|
| 38 |
+
support_mode_conditioning: true
|
| 39 |
+
planner_mode: trainable
|
| 40 |
+
use_depth: true
|
| 41 |
+
use_world_model: true
|
| 42 |
+
use_role_tokens: true
|
| 43 |
+
compute_equivariance_probe: true
|
| 44 |
+
policy:
|
| 45 |
+
backbone:
|
| 46 |
+
model_name: openai/clip-vit-base-patch32
|
| 47 |
+
hidden_dim: 512
|
| 48 |
+
max_text_tokens: 32
|
| 49 |
+
freeze_backbone: true
|
| 50 |
+
gradient_checkpointing: false
|
| 51 |
+
use_dummy_backbone: false
|
| 52 |
+
fusion:
|
| 53 |
+
hidden_dim: 512
|
| 54 |
+
num_cameras: 3
|
| 55 |
+
num_layers: 4
|
| 56 |
+
num_heads: 8
|
| 57 |
+
ff_dim: 2048
|
| 58 |
+
dropout: 0.1
|
| 59 |
+
proprio_dim: 32
|
| 60 |
+
proprio_tokens: 1
|
| 61 |
+
memory:
|
| 62 |
+
hidden_dim: 512
|
| 63 |
+
action_dim: 14
|
| 64 |
+
history_steps: 6
|
| 65 |
+
scene_history_steps: 3
|
| 66 |
+
belief_history_steps: 8
|
| 67 |
+
num_layers: 2
|
| 68 |
+
dropout: 0.1
|
| 69 |
+
memory_bank_size: 4
|
| 70 |
+
scene_bank_size: 2
|
| 71 |
+
belief_bank_size: 2
|
| 72 |
+
num_heads: 8
|
| 73 |
+
max_history_steps: 8
|
| 74 |
+
decoder:
|
| 75 |
+
hidden_dim: 512
|
| 76 |
+
num_heads: 8
|
| 77 |
+
num_layers: 4
|
| 78 |
+
ff_dim: 2048
|
| 79 |
+
dropout: 0.1
|
| 80 |
+
chunk_size: 8
|
| 81 |
+
action_dim: 14
|
| 82 |
+
arm_action_dim: 7
|
| 83 |
+
num_candidates: 8
|
| 84 |
+
num_phases: 5
|
| 85 |
+
num_arm_roles: 4
|
| 86 |
+
num_proposal_modes: 6
|
| 87 |
+
planner_top_k: 4
|
| 88 |
+
reveal_head:
|
| 89 |
+
hidden_dim: 512
|
| 90 |
+
num_support_modes: 3
|
| 91 |
+
num_approach_templates: 32
|
| 92 |
+
rollout_horizon: 5
|
| 93 |
+
belief_map_size: 32
|
| 94 |
+
field_size: 16
|
| 95 |
+
num_heads: 8
|
| 96 |
+
predict_belief_map: true
|
| 97 |
+
num_phases: 5
|
| 98 |
+
num_arm_roles: 4
|
| 99 |
+
num_interaction_tokens: 8
|
| 100 |
+
world_model:
|
| 101 |
+
hidden_dim: 512
|
| 102 |
+
action_dim: 14
|
| 103 |
+
num_support_modes: 3
|
| 104 |
+
num_approach_templates: 32
|
| 105 |
+
rollout_horizon: 5
|
| 106 |
+
field_size: 16
|
| 107 |
+
num_heads: 8
|
| 108 |
+
num_phases: 5
|
| 109 |
+
num_arm_roles: 4
|
| 110 |
+
num_interaction_tokens: 8
|
| 111 |
+
belief_map_size: 32
|
| 112 |
+
predict_belief_map: true
|
| 113 |
+
scene_bank_size: 2
|
| 114 |
+
belief_bank_size: 2
|
| 115 |
+
planner:
|
| 116 |
+
hidden_dim: 512
|
| 117 |
+
num_candidates: 8
|
| 118 |
+
action_dim: 14
|
| 119 |
+
num_support_modes: 3
|
| 120 |
+
utility_margin: 0.1
|
| 121 |
+
num_heads: 8
|
| 122 |
+
num_layers: 2
|
| 123 |
+
num_phases: 5
|
| 124 |
+
num_arm_roles: 4
|
| 125 |
+
top_k: 4
|
| 126 |
+
loss_weights:
|
| 127 |
+
action: 1.0
|
| 128 |
+
phase: 0.1
|
| 129 |
+
arm_role: 0.15
|
| 130 |
+
support_mode: 0.1
|
| 131 |
+
corridor: 0.15
|
| 132 |
+
persistence: 0.05
|
| 133 |
+
disturbance: 0.05
|
| 134 |
+
world_model: 0.25
|
| 135 |
+
belief: 0.05
|
| 136 |
+
visibility: 0.05
|
| 137 |
+
clearance: 0.05
|
| 138 |
+
support_stability: 0.05
|
| 139 |
+
reocclusion: 0.05
|
| 140 |
+
occluder_contact: 0.05
|
| 141 |
+
grasp_affordance: 0.05
|
| 142 |
+
planner_success: 0.25
|
| 143 |
+
planner_risk: 0.1
|
| 144 |
+
planner_ranking: 0.2
|
| 145 |
+
proposal_reconstruction: 0.1
|
| 146 |
+
proposal_success: 0.15
|
| 147 |
+
proposal_ranking: 0.2
|
| 148 |
+
proposal_diversity: 0.05
|
| 149 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage3_clip_rgbd_seed18.yaml
ADDED
|
@@ -0,0 +1,149 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage3_clip_rgbd_seed18
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 18
|
| 5 |
+
init_checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt
|
| 6 |
+
init_strict: false
|
| 7 |
+
data:
|
| 8 |
+
proxies:
|
| 9 |
+
- foliage_proxy
|
| 10 |
+
- bag_proxy
|
| 11 |
+
- cloth_proxy
|
| 12 |
+
resolution: 224
|
| 13 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 14 |
+
train_episodes_per_proxy: 48
|
| 15 |
+
val_episodes_per_proxy: 16
|
| 16 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_clip224_v6_rgbd_stage3_seed18.pt
|
| 17 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_clip224_v6_rgbd_stage3_seed18.pt
|
| 18 |
+
rebuild_dataset: false
|
| 19 |
+
chunk_horizon: 8
|
| 20 |
+
rollout_horizon: 5
|
| 21 |
+
history_steps: 6
|
| 22 |
+
planner_candidates: 8
|
| 23 |
+
seed: 18
|
| 24 |
+
optim:
|
| 25 |
+
epochs: 4
|
| 26 |
+
batch_size: 2
|
| 27 |
+
num_workers: 4
|
| 28 |
+
lr: 0.0003
|
| 29 |
+
weight_decay: 0.0001
|
| 30 |
+
trainer:
|
| 31 |
+
policy_type: elastic_reveal
|
| 32 |
+
use_bf16: true
|
| 33 |
+
grad_clip_norm: 1.0
|
| 34 |
+
freeze_backbone: true
|
| 35 |
+
gradient_checkpointing: false
|
| 36 |
+
plan_during_train: true
|
| 37 |
+
plan_during_eval: true
|
| 38 |
+
support_mode_conditioning: true
|
| 39 |
+
planner_mode: trainable
|
| 40 |
+
use_depth: true
|
| 41 |
+
use_world_model: true
|
| 42 |
+
use_role_tokens: true
|
| 43 |
+
compute_equivariance_probe: true
|
| 44 |
+
policy:
|
| 45 |
+
backbone:
|
| 46 |
+
model_name: openai/clip-vit-base-patch32
|
| 47 |
+
hidden_dim: 512
|
| 48 |
+
max_text_tokens: 32
|
| 49 |
+
freeze_backbone: true
|
| 50 |
+
gradient_checkpointing: false
|
| 51 |
+
use_dummy_backbone: false
|
| 52 |
+
fusion:
|
| 53 |
+
hidden_dim: 512
|
| 54 |
+
num_cameras: 3
|
| 55 |
+
num_layers: 4
|
| 56 |
+
num_heads: 8
|
| 57 |
+
ff_dim: 2048
|
| 58 |
+
dropout: 0.1
|
| 59 |
+
proprio_dim: 32
|
| 60 |
+
proprio_tokens: 1
|
| 61 |
+
memory:
|
| 62 |
+
hidden_dim: 512
|
| 63 |
+
action_dim: 14
|
| 64 |
+
history_steps: 6
|
| 65 |
+
scene_history_steps: 3
|
| 66 |
+
belief_history_steps: 8
|
| 67 |
+
num_layers: 2
|
| 68 |
+
dropout: 0.1
|
| 69 |
+
memory_bank_size: 4
|
| 70 |
+
scene_bank_size: 2
|
| 71 |
+
belief_bank_size: 2
|
| 72 |
+
num_heads: 8
|
| 73 |
+
max_history_steps: 8
|
| 74 |
+
decoder:
|
| 75 |
+
hidden_dim: 512
|
| 76 |
+
num_heads: 8
|
| 77 |
+
num_layers: 4
|
| 78 |
+
ff_dim: 2048
|
| 79 |
+
dropout: 0.1
|
| 80 |
+
chunk_size: 8
|
| 81 |
+
action_dim: 14
|
| 82 |
+
arm_action_dim: 7
|
| 83 |
+
num_candidates: 8
|
| 84 |
+
num_phases: 5
|
| 85 |
+
num_arm_roles: 4
|
| 86 |
+
num_proposal_modes: 6
|
| 87 |
+
planner_top_k: 4
|
| 88 |
+
reveal_head:
|
| 89 |
+
hidden_dim: 512
|
| 90 |
+
num_support_modes: 3
|
| 91 |
+
num_approach_templates: 32
|
| 92 |
+
rollout_horizon: 5
|
| 93 |
+
belief_map_size: 32
|
| 94 |
+
field_size: 16
|
| 95 |
+
num_heads: 8
|
| 96 |
+
predict_belief_map: true
|
| 97 |
+
num_phases: 5
|
| 98 |
+
num_arm_roles: 4
|
| 99 |
+
num_interaction_tokens: 8
|
| 100 |
+
world_model:
|
| 101 |
+
hidden_dim: 512
|
| 102 |
+
action_dim: 14
|
| 103 |
+
num_support_modes: 3
|
| 104 |
+
num_approach_templates: 32
|
| 105 |
+
rollout_horizon: 5
|
| 106 |
+
field_size: 16
|
| 107 |
+
num_heads: 8
|
| 108 |
+
num_phases: 5
|
| 109 |
+
num_arm_roles: 4
|
| 110 |
+
num_interaction_tokens: 8
|
| 111 |
+
belief_map_size: 32
|
| 112 |
+
predict_belief_map: true
|
| 113 |
+
scene_bank_size: 2
|
| 114 |
+
belief_bank_size: 2
|
| 115 |
+
planner:
|
| 116 |
+
hidden_dim: 512
|
| 117 |
+
num_candidates: 8
|
| 118 |
+
action_dim: 14
|
| 119 |
+
num_support_modes: 3
|
| 120 |
+
utility_margin: 0.1
|
| 121 |
+
num_heads: 8
|
| 122 |
+
num_layers: 2
|
| 123 |
+
num_phases: 5
|
| 124 |
+
num_arm_roles: 4
|
| 125 |
+
top_k: 4
|
| 126 |
+
loss_weights:
|
| 127 |
+
action: 1.0
|
| 128 |
+
phase: 0.1
|
| 129 |
+
arm_role: 0.15
|
| 130 |
+
support_mode: 0.1
|
| 131 |
+
corridor: 0.15
|
| 132 |
+
persistence: 0.05
|
| 133 |
+
disturbance: 0.05
|
| 134 |
+
world_model: 0.25
|
| 135 |
+
belief: 0.05
|
| 136 |
+
visibility: 0.05
|
| 137 |
+
clearance: 0.05
|
| 138 |
+
support_stability: 0.05
|
| 139 |
+
reocclusion: 0.05
|
| 140 |
+
occluder_contact: 0.05
|
| 141 |
+
grasp_affordance: 0.05
|
| 142 |
+
planner_success: 0.25
|
| 143 |
+
planner_risk: 0.1
|
| 144 |
+
planner_ranking: 0.2
|
| 145 |
+
proposal_reconstruction: 0.1
|
| 146 |
+
proposal_success: 0.15
|
| 147 |
+
proposal_ranking: 0.2
|
| 148 |
+
proposal_diversity: 0.05
|
| 149 |
+
role_swap_consistency: 0.05
|
artifacts/generated_configs/proxy_interaction_r3d_stage3_clip_rgbd_seed19.yaml
ADDED
|
@@ -0,0 +1,149 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
experiment_name: proxy_interaction_r3d_stage3_clip_rgbd_seed19
|
| 2 |
+
output_dir: /workspace/VLAarchtests/artifacts/outputs/r3d
|
| 3 |
+
device: cuda
|
| 4 |
+
seed: 19
|
| 5 |
+
init_checkpoint: /workspace/VLAarchtests/artifacts/outputs/reveal_runs/proxy_backbone_only_clip/checkpoint_best.pt
|
| 6 |
+
init_strict: false
|
| 7 |
+
data:
|
| 8 |
+
proxies:
|
| 9 |
+
- foliage_proxy
|
| 10 |
+
- bag_proxy
|
| 11 |
+
- cloth_proxy
|
| 12 |
+
resolution: 224
|
| 13 |
+
dataset_version: reveal_proxy_v6_rgbd_elastic_state
|
| 14 |
+
train_episodes_per_proxy: 48
|
| 15 |
+
val_episodes_per_proxy: 16
|
| 16 |
+
train_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_train_clip224_v6_rgbd_stage3_seed19.pt
|
| 17 |
+
val_dataset_path: /workspace/VLAarchtests/artifacts/data/reveal_proxy/proxy_val_clip224_v6_rgbd_stage3_seed19.pt
|
| 18 |
+
rebuild_dataset: false
|
| 19 |
+
chunk_horizon: 8
|
| 20 |
+
rollout_horizon: 5
|
| 21 |
+
history_steps: 6
|
| 22 |
+
planner_candidates: 8
|
| 23 |
+
seed: 19
|
| 24 |
+
optim:
|
| 25 |
+
epochs: 4
|
| 26 |
+
batch_size: 2
|
| 27 |
+
num_workers: 4
|
| 28 |
+
lr: 0.0003
|
| 29 |
+
weight_decay: 0.0001
|
| 30 |
+
trainer:
|
| 31 |
+
policy_type: elastic_reveal
|
| 32 |
+
use_bf16: true
|
| 33 |
+
grad_clip_norm: 1.0
|
| 34 |
+
freeze_backbone: true
|
| 35 |
+
gradient_checkpointing: false
|
| 36 |
+
plan_during_train: true
|
| 37 |
+
plan_during_eval: true
|
| 38 |
+
support_mode_conditioning: true
|
| 39 |
+
planner_mode: trainable
|
| 40 |
+
use_depth: true
|
| 41 |
+
use_world_model: true
|
| 42 |
+
use_role_tokens: true
|
| 43 |
+
compute_equivariance_probe: true
|
| 44 |
+
policy:
|
| 45 |
+
backbone:
|
| 46 |
+
model_name: openai/clip-vit-base-patch32
|
| 47 |
+
hidden_dim: 512
|
| 48 |
+
max_text_tokens: 32
|
| 49 |
+
freeze_backbone: true
|
| 50 |
+
gradient_checkpointing: false
|
| 51 |
+
use_dummy_backbone: false
|
| 52 |
+
fusion:
|
| 53 |
+
hidden_dim: 512
|
| 54 |
+
num_cameras: 3
|
| 55 |
+
num_layers: 4
|
| 56 |
+
num_heads: 8
|
| 57 |
+
ff_dim: 2048
|
| 58 |
+
dropout: 0.1
|
| 59 |
+
proprio_dim: 32
|
| 60 |
+
proprio_tokens: 1
|
| 61 |
+
memory:
|
| 62 |
+
hidden_dim: 512
|
| 63 |
+
action_dim: 14
|
| 64 |
+
history_steps: 6
|
| 65 |
+
scene_history_steps: 3
|
| 66 |
+
belief_history_steps: 8
|
| 67 |
+
num_layers: 2
|
| 68 |
+
dropout: 0.1
|
| 69 |
+
memory_bank_size: 4
|
| 70 |
+
scene_bank_size: 2
|
| 71 |
+
belief_bank_size: 2
|
| 72 |
+
num_heads: 8
|
| 73 |
+
max_history_steps: 8
|
| 74 |
+
decoder:
|
| 75 |
+
hidden_dim: 512
|
| 76 |
+
num_heads: 8
|
| 77 |
+
num_layers: 4
|
| 78 |
+
ff_dim: 2048
|
| 79 |
+
dropout: 0.1
|
| 80 |
+
chunk_size: 8
|
| 81 |
+
action_dim: 14
|
| 82 |
+
arm_action_dim: 7
|
| 83 |
+
num_candidates: 8
|
| 84 |
+
num_phases: 5
|
| 85 |
+
num_arm_roles: 4
|
| 86 |
+
num_proposal_modes: 6
|
| 87 |
+
planner_top_k: 4
|
| 88 |
+
reveal_head:
|
| 89 |
+
hidden_dim: 512
|
| 90 |
+
num_support_modes: 3
|
| 91 |
+
num_approach_templates: 32
|
| 92 |
+
rollout_horizon: 5
|
| 93 |
+
belief_map_size: 32
|
| 94 |
+
field_size: 16
|
| 95 |
+
num_heads: 8
|
| 96 |
+
predict_belief_map: true
|
| 97 |
+
num_phases: 5
|
| 98 |
+
num_arm_roles: 4
|
| 99 |
+
num_interaction_tokens: 8
|
| 100 |
+
world_model:
|
| 101 |
+
hidden_dim: 512
|
| 102 |
+
action_dim: 14
|
| 103 |
+
num_support_modes: 3
|
| 104 |
+
num_approach_templates: 32
|
| 105 |
+
rollout_horizon: 5
|
| 106 |
+
field_size: 16
|
| 107 |
+
num_heads: 8
|
| 108 |
+
num_phases: 5
|
| 109 |
+
num_arm_roles: 4
|
| 110 |
+
num_interaction_tokens: 8
|
| 111 |
+
belief_map_size: 32
|
| 112 |
+
predict_belief_map: true
|
| 113 |
+
scene_bank_size: 2
|
| 114 |
+
belief_bank_size: 2
|
| 115 |
+
planner:
|
| 116 |
+
hidden_dim: 512
|
| 117 |
+
num_candidates: 8
|
| 118 |
+
action_dim: 14
|
| 119 |
+
num_support_modes: 3
|
| 120 |
+
utility_margin: 0.1
|
| 121 |
+
num_heads: 8
|
| 122 |
+
num_layers: 2
|
| 123 |
+
num_phases: 5
|
| 124 |
+
num_arm_roles: 4
|
| 125 |
+
top_k: 4
|
| 126 |
+
loss_weights:
|
| 127 |
+
action: 1.0
|
| 128 |
+
phase: 0.1
|
| 129 |
+
arm_role: 0.15
|
| 130 |
+
support_mode: 0.1
|
| 131 |
+
corridor: 0.15
|
| 132 |
+
persistence: 0.05
|
| 133 |
+
disturbance: 0.05
|
| 134 |
+
world_model: 0.25
|
| 135 |
+
belief: 0.05
|
| 136 |
+
visibility: 0.05
|
| 137 |
+
clearance: 0.05
|
| 138 |
+
support_stability: 0.05
|
| 139 |
+
reocclusion: 0.05
|
| 140 |
+
occluder_contact: 0.05
|
| 141 |
+
grasp_affordance: 0.05
|
| 142 |
+
planner_success: 0.25
|
| 143 |
+
planner_risk: 0.1
|
| 144 |
+
planner_ranking: 0.2
|
| 145 |
+
proposal_reconstruction: 0.1
|
| 146 |
+
proposal_success: 0.15
|
| 147 |
+
proposal_ranking: 0.2
|
| 148 |
+
proposal_diversity: 0.05
|
| 149 |
+
role_swap_consistency: 0.05
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_dual_push_buttons/command.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
/workspace/envs/rlbench/bin/python -m sim_rlbench.launch_smoke --task bimanual_dual_push_buttons --resolution 224 --headless
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_dual_push_buttons/stderr.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
qt.qpa.xcb: QXcbConnection: XCB error: 148 (Unknown), sequence: 181, resource id: 0, major code: 140 (Unknown), minor code: 20
|
| 2 |
+
WARNING:root:not sure how _robot_shapes are used is used.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_dual_push_buttons/stdout.txt
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"display": ":99",
|
| 3 |
+
"headless": true,
|
| 4 |
+
"task": "BimanualDualPushButtons",
|
| 5 |
+
"description": "push the olive and the orange buttons",
|
| 6 |
+
"front_rgb_shape": [
|
| 7 |
+
224,
|
| 8 |
+
224,
|
| 9 |
+
3
|
| 10 |
+
],
|
| 11 |
+
"wrist_left_rgb_shape": [
|
| 12 |
+
224,
|
| 13 |
+
224,
|
| 14 |
+
3
|
| 15 |
+
],
|
| 16 |
+
"wrist_right_rgb_shape": [
|
| 17 |
+
224,
|
| 18 |
+
224,
|
| 19 |
+
3
|
| 20 |
+
],
|
| 21 |
+
"right_pose_shape": [
|
| 22 |
+
7
|
| 23 |
+
],
|
| 24 |
+
"left_pose_shape": [
|
| 25 |
+
7
|
| 26 |
+
],
|
| 27 |
+
"stepped_mode": "bimanual_noop",
|
| 28 |
+
"action_finite": true,
|
| 29 |
+
"action_dim": 18,
|
| 30 |
+
"reward": 0.0,
|
| 31 |
+
"done": false,
|
| 32 |
+
"front_rgb_shape_after_step": [
|
| 33 |
+
224,
|
| 34 |
+
224,
|
| 35 |
+
3
|
| 36 |
+
]
|
| 37 |
+
}
|
| 38 |
+
[CoppeliaSim:loadinfo] done.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_handover_item/command.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
/workspace/envs/rlbench/bin/python -m sim_rlbench.launch_smoke --task bimanual_handover_item --resolution 224 --headless
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_handover_item/stderr.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
qt.qpa.xcb: QXcbConnection: XCB error: 148 (Unknown), sequence: 181, resource id: 0, major code: 140 (Unknown), minor code: 20
|
| 2 |
+
WARNING:root:not sure how _robot_shapes are used is used.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_handover_item/stdout.txt
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"display": ":99",
|
| 3 |
+
"headless": true,
|
| 4 |
+
"task": "BimanualHandoverItem",
|
| 5 |
+
"description": "bring me the red item",
|
| 6 |
+
"front_rgb_shape": [
|
| 7 |
+
224,
|
| 8 |
+
224,
|
| 9 |
+
3
|
| 10 |
+
],
|
| 11 |
+
"wrist_left_rgb_shape": [
|
| 12 |
+
224,
|
| 13 |
+
224,
|
| 14 |
+
3
|
| 15 |
+
],
|
| 16 |
+
"wrist_right_rgb_shape": [
|
| 17 |
+
224,
|
| 18 |
+
224,
|
| 19 |
+
3
|
| 20 |
+
],
|
| 21 |
+
"right_pose_shape": [
|
| 22 |
+
7
|
| 23 |
+
],
|
| 24 |
+
"left_pose_shape": [
|
| 25 |
+
7
|
| 26 |
+
],
|
| 27 |
+
"stepped_mode": "bimanual_noop",
|
| 28 |
+
"action_finite": true,
|
| 29 |
+
"action_dim": 18,
|
| 30 |
+
"reward": 0.0,
|
| 31 |
+
"done": false,
|
| 32 |
+
"front_rgb_shape_after_step": [
|
| 33 |
+
224,
|
| 34 |
+
224,
|
| 35 |
+
3
|
| 36 |
+
]
|
| 37 |
+
}
|
| 38 |
+
[CoppeliaSim:loadinfo] done.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_handover_item_easy/command.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
/workspace/envs/rlbench/bin/python -m sim_rlbench.launch_smoke --task bimanual_handover_item_easy --resolution 224 --headless
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_handover_item_easy/stderr.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
qt.qpa.xcb: QXcbConnection: XCB error: 148 (Unknown), sequence: 181, resource id: 0, major code: 140 (Unknown), minor code: 20
|
| 2 |
+
WARNING:root:not sure how _robot_shapes are used is used.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_handover_item_easy/stdout.txt
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"display": ":99",
|
| 3 |
+
"headless": true,
|
| 4 |
+
"task": "BimanualHandoverItemEasy",
|
| 5 |
+
"description": "bring me the item",
|
| 6 |
+
"front_rgb_shape": [
|
| 7 |
+
224,
|
| 8 |
+
224,
|
| 9 |
+
3
|
| 10 |
+
],
|
| 11 |
+
"wrist_left_rgb_shape": [
|
| 12 |
+
224,
|
| 13 |
+
224,
|
| 14 |
+
3
|
| 15 |
+
],
|
| 16 |
+
"wrist_right_rgb_shape": [
|
| 17 |
+
224,
|
| 18 |
+
224,
|
| 19 |
+
3
|
| 20 |
+
],
|
| 21 |
+
"right_pose_shape": [
|
| 22 |
+
7
|
| 23 |
+
],
|
| 24 |
+
"left_pose_shape": [
|
| 25 |
+
7
|
| 26 |
+
],
|
| 27 |
+
"stepped_mode": "bimanual_noop",
|
| 28 |
+
"action_finite": true,
|
| 29 |
+
"action_dim": 18,
|
| 30 |
+
"reward": 0.0,
|
| 31 |
+
"done": false,
|
| 32 |
+
"front_rgb_shape_after_step": [
|
| 33 |
+
224,
|
| 34 |
+
224,
|
| 35 |
+
3
|
| 36 |
+
]
|
| 37 |
+
}
|
| 38 |
+
[CoppeliaSim:loadinfo] done.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_lift_ball/command.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
/workspace/envs/rlbench/bin/python -m sim_rlbench.launch_smoke --task bimanual_lift_ball --resolution 224 --headless
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_lift_ball/stderr.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
qt.qpa.xcb: QXcbConnection: XCB error: 148 (Unknown), sequence: 181, resource id: 0, major code: 140 (Unknown), minor code: 20
|
| 2 |
+
WARNING:root:not sure how _robot_shapes are used is used.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_lift_ball/stdout.txt
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"display": ":99",
|
| 3 |
+
"headless": true,
|
| 4 |
+
"task": "BimanualLiftBall",
|
| 5 |
+
"description": "Lift the ball",
|
| 6 |
+
"front_rgb_shape": [
|
| 7 |
+
224,
|
| 8 |
+
224,
|
| 9 |
+
3
|
| 10 |
+
],
|
| 11 |
+
"wrist_left_rgb_shape": [
|
| 12 |
+
224,
|
| 13 |
+
224,
|
| 14 |
+
3
|
| 15 |
+
],
|
| 16 |
+
"wrist_right_rgb_shape": [
|
| 17 |
+
224,
|
| 18 |
+
224,
|
| 19 |
+
3
|
| 20 |
+
],
|
| 21 |
+
"right_pose_shape": [
|
| 22 |
+
7
|
| 23 |
+
],
|
| 24 |
+
"left_pose_shape": [
|
| 25 |
+
7
|
| 26 |
+
],
|
| 27 |
+
"stepped_mode": "bimanual_noop",
|
| 28 |
+
"action_finite": true,
|
| 29 |
+
"action_dim": 18,
|
| 30 |
+
"reward": 0.0,
|
| 31 |
+
"done": false,
|
| 32 |
+
"front_rgb_shape_after_step": [
|
| 33 |
+
224,
|
| 34 |
+
224,
|
| 35 |
+
3
|
| 36 |
+
]
|
| 37 |
+
}
|
| 38 |
+
[CoppeliaSim:loadinfo] done.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_lift_tray/command.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
/workspace/envs/rlbench/bin/python -m sim_rlbench.launch_smoke --task bimanual_lift_tray --resolution 224 --headless
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_lift_tray/stderr.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
qt.qpa.xcb: QXcbConnection: XCB error: 148 (Unknown), sequence: 181, resource id: 0, major code: 140 (Unknown), minor code: 20
|
| 2 |
+
WARNING:root:not sure how _robot_shapes are used is used.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_lift_tray/stdout.txt
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"display": ":99",
|
| 3 |
+
"headless": true,
|
| 4 |
+
"task": "BimanualLiftTray",
|
| 5 |
+
"description": "Lift the tray",
|
| 6 |
+
"front_rgb_shape": [
|
| 7 |
+
224,
|
| 8 |
+
224,
|
| 9 |
+
3
|
| 10 |
+
],
|
| 11 |
+
"wrist_left_rgb_shape": [
|
| 12 |
+
224,
|
| 13 |
+
224,
|
| 14 |
+
3
|
| 15 |
+
],
|
| 16 |
+
"wrist_right_rgb_shape": [
|
| 17 |
+
224,
|
| 18 |
+
224,
|
| 19 |
+
3
|
| 20 |
+
],
|
| 21 |
+
"right_pose_shape": [
|
| 22 |
+
7
|
| 23 |
+
],
|
| 24 |
+
"left_pose_shape": [
|
| 25 |
+
7
|
| 26 |
+
],
|
| 27 |
+
"stepped_mode": "bimanual_noop",
|
| 28 |
+
"action_finite": true,
|
| 29 |
+
"action_dim": 18,
|
| 30 |
+
"reward": 0.0,
|
| 31 |
+
"done": false,
|
| 32 |
+
"front_rgb_shape_after_step": [
|
| 33 |
+
224,
|
| 34 |
+
224,
|
| 35 |
+
3
|
| 36 |
+
]
|
| 37 |
+
}
|
| 38 |
+
[CoppeliaSim:loadinfo] done.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_pick_laptop/command.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
/workspace/envs/rlbench/bin/python -m sim_rlbench.launch_smoke --task bimanual_pick_laptop --resolution 224 --headless
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_pick_laptop/stderr.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
qt.qpa.xcb: QXcbConnection: XCB error: 148 (Unknown), sequence: 181, resource id: 0, major code: 140 (Unknown), minor code: 20
|
| 2 |
+
WARNING:root:not sure how _robot_shapes are used is used.
|
| 3 |
+
WARNING:root:Waypoints are not reachable right=(False, 'waypoint1 - DualPanda') left=(True, '')
|
| 4 |
+
ERROR:root:Error when checking waypoints. Exception is: Error in task bimanual_pick_laptop. Infeasible episode. Can't reach waypoint ((False, 'waypoint1 - DualPanda'), (True, '')).
|
| 5 |
+
WARNING:root:Waypoints are not reachable right=(False, 'waypoint1 - DualPanda') left=(True, '')
|
| 6 |
+
ERROR:root:Error when checking waypoints. Exception is: Error in task bimanual_pick_laptop. Infeasible episode. Can't reach waypoint ((False, 'waypoint1 - DualPanda'), (True, '')).
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_pick_laptop/stdout.txt
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"display": ":99",
|
| 3 |
+
"headless": true,
|
| 4 |
+
"task": "BimanualPickLaptop",
|
| 5 |
+
"description": "pick up the laptop",
|
| 6 |
+
"front_rgb_shape": [
|
| 7 |
+
224,
|
| 8 |
+
224,
|
| 9 |
+
3
|
| 10 |
+
],
|
| 11 |
+
"wrist_left_rgb_shape": [
|
| 12 |
+
224,
|
| 13 |
+
224,
|
| 14 |
+
3
|
| 15 |
+
],
|
| 16 |
+
"wrist_right_rgb_shape": [
|
| 17 |
+
224,
|
| 18 |
+
224,
|
| 19 |
+
3
|
| 20 |
+
],
|
| 21 |
+
"right_pose_shape": [
|
| 22 |
+
7
|
| 23 |
+
],
|
| 24 |
+
"left_pose_shape": [
|
| 25 |
+
7
|
| 26 |
+
],
|
| 27 |
+
"stepped_mode": "bimanual_noop",
|
| 28 |
+
"action_finite": true,
|
| 29 |
+
"action_dim": 18,
|
| 30 |
+
"reward": 0.0,
|
| 31 |
+
"done": false,
|
| 32 |
+
"front_rgb_shape_after_step": [
|
| 33 |
+
224,
|
| 34 |
+
224,
|
| 35 |
+
3
|
| 36 |
+
]
|
| 37 |
+
}
|
| 38 |
+
[CoppeliaSim:loadinfo] done.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_pick_plate/command.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
/workspace/envs/rlbench/bin/python -m sim_rlbench.launch_smoke --task bimanual_pick_plate --resolution 224 --headless
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_pick_plate/stderr.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
qt.qpa.xcb: QXcbConnection: XCB error: 148 (Unknown), sequence: 181, resource id: 0, major code: 140 (Unknown), minor code: 20
|
| 2 |
+
WARNING:root:not sure how _robot_shapes are used is used.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_pick_plate/stdout.txt
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"display": ":99",
|
| 3 |
+
"headless": true,
|
| 4 |
+
"task": "BimanualPickPlate",
|
| 5 |
+
"description": "pick up the plate",
|
| 6 |
+
"front_rgb_shape": [
|
| 7 |
+
224,
|
| 8 |
+
224,
|
| 9 |
+
3
|
| 10 |
+
],
|
| 11 |
+
"wrist_left_rgb_shape": [
|
| 12 |
+
224,
|
| 13 |
+
224,
|
| 14 |
+
3
|
| 15 |
+
],
|
| 16 |
+
"wrist_right_rgb_shape": [
|
| 17 |
+
224,
|
| 18 |
+
224,
|
| 19 |
+
3
|
| 20 |
+
],
|
| 21 |
+
"right_pose_shape": [
|
| 22 |
+
7
|
| 23 |
+
],
|
| 24 |
+
"left_pose_shape": [
|
| 25 |
+
7
|
| 26 |
+
],
|
| 27 |
+
"stepped_mode": "bimanual_noop",
|
| 28 |
+
"action_finite": true,
|
| 29 |
+
"action_dim": 18,
|
| 30 |
+
"reward": 0.0,
|
| 31 |
+
"done": false,
|
| 32 |
+
"front_rgb_shape_after_step": [
|
| 33 |
+
224,
|
| 34 |
+
224,
|
| 35 |
+
3
|
| 36 |
+
]
|
| 37 |
+
}
|
| 38 |
+
[CoppeliaSim:loadinfo] done.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_push_box/command.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
/workspace/envs/rlbench/bin/python -m sim_rlbench.launch_smoke --task bimanual_push_box --resolution 224 --headless
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_push_box/stderr.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
qt.qpa.xcb: QXcbConnection: XCB error: 148 (Unknown), sequence: 181, resource id: 0, major code: 140 (Unknown), minor code: 20
|
| 2 |
+
WARNING:root:not sure how _robot_shapes are used is used.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_push_box/stdout.txt
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"display": ":99",
|
| 3 |
+
"headless": true,
|
| 4 |
+
"task": "BimanualPushBox",
|
| 5 |
+
"description": "push the box to the red area",
|
| 6 |
+
"front_rgb_shape": [
|
| 7 |
+
224,
|
| 8 |
+
224,
|
| 9 |
+
3
|
| 10 |
+
],
|
| 11 |
+
"wrist_left_rgb_shape": [
|
| 12 |
+
224,
|
| 13 |
+
224,
|
| 14 |
+
3
|
| 15 |
+
],
|
| 16 |
+
"wrist_right_rgb_shape": [
|
| 17 |
+
224,
|
| 18 |
+
224,
|
| 19 |
+
3
|
| 20 |
+
],
|
| 21 |
+
"right_pose_shape": [
|
| 22 |
+
7
|
| 23 |
+
],
|
| 24 |
+
"left_pose_shape": [
|
| 25 |
+
7
|
| 26 |
+
],
|
| 27 |
+
"stepped_mode": "bimanual_noop",
|
| 28 |
+
"action_finite": true,
|
| 29 |
+
"action_dim": 18,
|
| 30 |
+
"reward": 0.0,
|
| 31 |
+
"done": false,
|
| 32 |
+
"front_rgb_shape_after_step": [
|
| 33 |
+
224,
|
| 34 |
+
224,
|
| 35 |
+
3
|
| 36 |
+
]
|
| 37 |
+
}
|
| 38 |
+
[CoppeliaSim:loadinfo] done.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_put_bottle_in_fridge/command.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
/workspace/envs/rlbench/bin/python -m sim_rlbench.launch_smoke --task bimanual_put_bottle_in_fridge --resolution 224 --headless
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_put_bottle_in_fridge/stderr.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
qt.qpa.xcb: QXcbConnection: XCB error: 148 (Unknown), sequence: 181, resource id: 0, major code: 140 (Unknown), minor code: 20
|
| 2 |
+
WARNING:root:not sure how _robot_shapes are used is used.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_put_bottle_in_fridge/stdout.txt
ADDED
|
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[ 0.05 -0.27500001 0.75199997]
|
| 2 |
+
{
|
| 3 |
+
"display": ":99",
|
| 4 |
+
"headless": true,
|
| 5 |
+
"task": "BimanualPutBottleInFridge",
|
| 6 |
+
"description": "put bottle in fridge",
|
| 7 |
+
"front_rgb_shape": [
|
| 8 |
+
224,
|
| 9 |
+
224,
|
| 10 |
+
3
|
| 11 |
+
],
|
| 12 |
+
"wrist_left_rgb_shape": [
|
| 13 |
+
224,
|
| 14 |
+
224,
|
| 15 |
+
3
|
| 16 |
+
],
|
| 17 |
+
"wrist_right_rgb_shape": [
|
| 18 |
+
224,
|
| 19 |
+
224,
|
| 20 |
+
3
|
| 21 |
+
],
|
| 22 |
+
"right_pose_shape": [
|
| 23 |
+
7
|
| 24 |
+
],
|
| 25 |
+
"left_pose_shape": [
|
| 26 |
+
7
|
| 27 |
+
],
|
| 28 |
+
"stepped_mode": "bimanual_noop",
|
| 29 |
+
"action_finite": true,
|
| 30 |
+
"action_dim": 18,
|
| 31 |
+
"reward": 0.0,
|
| 32 |
+
"done": false,
|
| 33 |
+
"front_rgb_shape_after_step": [
|
| 34 |
+
224,
|
| 35 |
+
224,
|
| 36 |
+
3
|
| 37 |
+
]
|
| 38 |
+
}
|
| 39 |
+
[CoppeliaSim:loadinfo] done.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_put_item_in_drawer/command.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
/workspace/envs/rlbench/bin/python -m sim_rlbench.launch_smoke --task bimanual_put_item_in_drawer --resolution 224 --headless
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_put_item_in_drawer/stderr.txt
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
qt.qpa.xcb: QXcbConnection: XCB error: 148 (Unknown), sequence: 181, resource id: 0, major code: 140 (Unknown), minor code: 20
|
| 2 |
+
WARNING:root:not sure how _robot_shapes are used is used.
|
| 3 |
+
WARNING:root:Waypoints are not reachable right=(False, 'waypoint4 - DualPanda') left=(False, 'waypoint2 - DualPanda')
|
| 4 |
+
ERROR:root:Error when checking waypoints. Exception is: Error in task bimanual_put_item_in_drawer. Infeasible episode. Can't reach waypoint ((False, 'waypoint4 - DualPanda'), (False, 'waypoint2 - DualPanda')).
|
| 5 |
+
WARNING:root:Waypoints are not reachable right=(False, 'waypoint4 - DualPanda') left=(False, 'waypoint2 - DualPanda')
|
| 6 |
+
ERROR:root:Error when checking waypoints. Exception is: Error in task bimanual_put_item_in_drawer. Infeasible episode. Can't reach waypoint ((False, 'waypoint4 - DualPanda'), (False, 'waypoint2 - DualPanda')).
|
| 7 |
+
WARNING:root:Waypoints are not reachable right=(False, 'waypoint4 - DualPanda') left=(True, '')
|
| 8 |
+
ERROR:root:Error when checking waypoints. Exception is: Error in task bimanual_put_item_in_drawer. Infeasible episode. Can't reach waypoint ((False, 'waypoint4 - DualPanda'), (True, '')).
|
| 9 |
+
WARNING:root:Waypoints are not reachable right=(False, 'waypoint4 - DualPanda') left=(False, 'waypoint2 - DualPanda')
|
| 10 |
+
ERROR:root:Error when checking waypoints. Exception is: Error in task bimanual_put_item_in_drawer. Infeasible episode. Can't reach waypoint ((False, 'waypoint4 - DualPanda'), (False, 'waypoint2 - DualPanda')).
|
| 11 |
+
WARNING:root:Waypoints are not reachable right=(False, 'waypoint4 - DualPanda') left=(True, '')
|
| 12 |
+
ERROR:root:Error when checking waypoints. Exception is: Error in task bimanual_put_item_in_drawer. Infeasible episode. Can't reach waypoint ((False, 'waypoint4 - DualPanda'), (True, '')).
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_put_item_in_drawer/stdout.txt
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"display": ":99",
|
| 3 |
+
"headless": true,
|
| 4 |
+
"task": "BimanualPutItemInDrawer",
|
| 5 |
+
"description": "put the item in the bottom drawer",
|
| 6 |
+
"front_rgb_shape": [
|
| 7 |
+
224,
|
| 8 |
+
224,
|
| 9 |
+
3
|
| 10 |
+
],
|
| 11 |
+
"wrist_left_rgb_shape": [
|
| 12 |
+
224,
|
| 13 |
+
224,
|
| 14 |
+
3
|
| 15 |
+
],
|
| 16 |
+
"wrist_right_rgb_shape": [
|
| 17 |
+
224,
|
| 18 |
+
224,
|
| 19 |
+
3
|
| 20 |
+
],
|
| 21 |
+
"right_pose_shape": [
|
| 22 |
+
7
|
| 23 |
+
],
|
| 24 |
+
"left_pose_shape": [
|
| 25 |
+
7
|
| 26 |
+
],
|
| 27 |
+
"stepped_mode": "bimanual_noop",
|
| 28 |
+
"action_finite": true,
|
| 29 |
+
"action_dim": 18,
|
| 30 |
+
"reward": 0.0,
|
| 31 |
+
"done": false,
|
| 32 |
+
"front_rgb_shape_after_step": [
|
| 33 |
+
224,
|
| 34 |
+
224,
|
| 35 |
+
3
|
| 36 |
+
]
|
| 37 |
+
}
|
| 38 |
+
[CoppeliaSim:loadinfo] done.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_straighten_rope/command.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
/workspace/envs/rlbench/bin/python -m sim_rlbench.launch_smoke --task bimanual_straighten_rope --resolution 224 --headless
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_straighten_rope/stderr.txt
ADDED
|
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
qt.qpa.xcb: QXcbConnection: XCB error: 148 (Unknown), sequence: 181, resource id: 0, major code: 140 (Unknown), minor code: 20
|
| 2 |
+
WARNING:root:not sure how _robot_shapes are used is used.
|
| 3 |
+
WARNING:root:Waypoints are not reachable right=(False, 'waypoint3 - DualPanda') left=(True, '')
|
| 4 |
+
ERROR:root:Error when checking waypoints. Exception is: Error in task bimanual_straighten_rope. Infeasible episode. Can't reach waypoint ((False, 'waypoint3 - DualPanda'), (True, '')).
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_straighten_rope/stdout.txt
ADDED
|
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"display": ":99",
|
| 3 |
+
"headless": true,
|
| 4 |
+
"task": "BimanualStraightenRope",
|
| 5 |
+
"description": "straighten rope",
|
| 6 |
+
"front_rgb_shape": [
|
| 7 |
+
224,
|
| 8 |
+
224,
|
| 9 |
+
3
|
| 10 |
+
],
|
| 11 |
+
"wrist_left_rgb_shape": [
|
| 12 |
+
224,
|
| 13 |
+
224,
|
| 14 |
+
3
|
| 15 |
+
],
|
| 16 |
+
"wrist_right_rgb_shape": [
|
| 17 |
+
224,
|
| 18 |
+
224,
|
| 19 |
+
3
|
| 20 |
+
],
|
| 21 |
+
"right_pose_shape": [
|
| 22 |
+
7
|
| 23 |
+
],
|
| 24 |
+
"left_pose_shape": [
|
| 25 |
+
7
|
| 26 |
+
],
|
| 27 |
+
"stepped_mode": "bimanual_noop",
|
| 28 |
+
"action_finite": true,
|
| 29 |
+
"action_dim": 18,
|
| 30 |
+
"reward": 0.0,
|
| 31 |
+
"done": false,
|
| 32 |
+
"front_rgb_shape_after_step": [
|
| 33 |
+
224,
|
| 34 |
+
224,
|
| 35 |
+
3
|
| 36 |
+
]
|
| 37 |
+
}
|
| 38 |
+
[CoppeliaSim:loadinfo] done.
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_sweep_to_dustpan/command.txt
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
/workspace/envs/rlbench/bin/python -m sim_rlbench.launch_smoke --task bimanual_sweep_to_dustpan --resolution 224 --headless
|
artifacts/outputs/r3d/peract2_13_launch_smoke/bimanual_sweep_to_dustpan/stderr.txt
ADDED
|
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
|
|
|
| 1 |
+
qt.qpa.xcb: QXcbConnection: XCB error: 148 (Unknown), sequence: 181, resource id: 0, major code: 140 (Unknown), minor code: 20
|
| 2 |
+
WARNING:root:not sure how _robot_shapes are used is used.
|