Rutav commited on
Commit
2a894f9
·
verified ·
1 Parent(s): 53d5ddd

Upload folder using huggingface_hub

Browse files
checkpoint-100.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:222fe8d576c9f94d02ae80838368838d51c899200f66d898530df864ee698f99
3
+ size 1086628090
checkpoint-prism-100.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1415a83c870155f3e7544858261aa610c2c4cd0acfa614883d0d66849f835f21
3
+ size 1086624506
events.out.tfevents.1768103766.xzhang-vla-finetune-h100-8gpu-group-worker-dwrdd.3494898.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9500c3b3775d6f015fea813faf14010274b744f1049fa6432baacf897ec915a3
3
+ size 14259198
log.txt ADDED
@@ -0,0 +1,102 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"train_lr": 0.00012442254388666513, "train_loss": 0.3106695828571558, "epoch": 0}
2
+ {"train_lr": 0.00037442254388666657, "train_loss": 0.1765579505204583, "epoch": 1}
3
+ {"train_lr": 0.0004999895847251151, "train_loss": 0.1204350220322297, "epoch": 2}
4
+ {"train_lr": 0.0004999267965555358, "train_loss": 0.10512903698047145, "epoch": 3}
5
+ {"train_lr": 0.000499801090651457, "train_loss": 0.09721263018323434, "epoch": 4}
6
+ {"train_lr": 0.000499612498658695, "train_loss": 0.09171448527308411, "epoch": 5}
7
+ {"train_lr": 0.0004993610680542452, "train_loss": 0.08695411841962446, "epoch": 6}
8
+ {"train_lr": 0.0004990468621344369, "train_loss": 0.08087445833769888, "epoch": 7}
9
+ {"train_lr": 0.000498669959998947, "train_loss": 0.07634419156898135, "epoch": 8}
10
+ {"train_lr": 0.0004982304565308317, "train_loss": 0.07051568671852732, "epoch": 9}
11
+ {"train_lr": 0.0004977284623727689, "train_loss": 0.0674788464112583, "epoch": 10}
12
+ {"train_lr": 0.000497164103899089, "train_loss": 0.0654696337283541, "epoch": 11}
13
+ {"train_lr": 0.0004965375231840242, "train_loss": 0.06279148746162543, "epoch": 12}
14
+ {"train_lr": 0.000495848877965922, "train_loss": 0.060323238908664575, "epoch": 13}
15
+ {"train_lr": 0.000495098341607544, "train_loss": 0.05694042379746439, "epoch": 14}
16
+ {"train_lr": 0.0004942861030523532, "train_loss": 0.05254918934498011, "epoch": 15}
17
+ {"train_lr": 0.0004934123667771247, "train_loss": 0.048871026988278055, "epoch": 16}
18
+ {"train_lr": 0.0004924773527402652, "train_loss": 0.046795259160964865, "epoch": 17}
19
+ {"train_lr": 0.0004914812963265581, "train_loss": 0.04460288662668364, "epoch": 18}
20
+ {"train_lr": 0.0004904244482878885, "train_loss": 0.042538205515167356, "epoch": 19}
21
+ {"train_lr": 0.0004893070746800906, "train_loss": 0.0405509257690194, "epoch": 20}
22
+ {"train_lr": 0.0004881294567959938, "train_loss": 0.039287820584866386, "epoch": 21}
23
+ {"train_lr": 0.0004868918910945998, "train_loss": 0.03803709820202604, "epoch": 22}
24
+ {"train_lr": 0.00048559468912647095, "train_loss": 0.03727623393734321, "epoch": 23}
25
+ {"train_lr": 0.00048423817745526197, "train_loss": 0.03635868519914033, "epoch": 24}
26
+ {"train_lr": 0.00048282269757551324, "train_loss": 0.035470682053193155, "epoch": 25}
27
+ {"train_lr": 0.00048134860582673604, "train_loss": 0.03436020502226452, "epoch": 26}
28
+ {"train_lr": 0.00047981627330363384, "train_loss": 0.03362559669345335, "epoch": 27}
29
+ {"train_lr": 0.0004782260857627244, "train_loss": 0.033024097851675184, "epoch": 28}
30
+ {"train_lr": 0.00047657844352522205, "train_loss": 0.03246270484458953, "epoch": 29}
31
+ {"train_lr": 0.0004748737613762465, "train_loss": 0.03193189644536263, "epoch": 30}
32
+ {"train_lr": 0.0004731124684604214, "train_loss": 0.031190929833294356, "epoch": 31}
33
+ {"train_lr": 0.0004712950081737899, "train_loss": 0.03056241925207776, "epoch": 32}
34
+ {"train_lr": 0.0004694218380523076, "train_loss": 0.029931797038955647, "epoch": 33}
35
+ {"train_lr": 0.00046749342965647715, "train_loss": 0.02938416024297777, "epoch": 34}
36
+ {"train_lr": 0.00046551026845287634, "train_loss": 0.02895656854657426, "epoch": 35}
37
+ {"train_lr": 0.0004634728536916469, "train_loss": 0.02855706407095833, "epoch": 36}
38
+ {"train_lr": 0.00046138169828110727, "train_loss": 0.028285302986864293, "epoch": 37}
39
+ {"train_lr": 0.00045923732865845644, "train_loss": 0.02793090866068992, "epoch": 38}
40
+ {"train_lr": 0.0004570402846572667, "train_loss": 0.02750447166595731, "epoch": 39}
41
+ {"train_lr": 0.0004547911193715973, "train_loss": 0.02719697173304648, "epoch": 40}
42
+ {"train_lr": 0.0004524903990167991, "train_loss": 0.026828367616214727, "epoch": 41}
43
+ {"train_lr": 0.0004501387027869346, "train_loss": 0.02656354377338646, "epoch": 42}
44
+ {"train_lr": 0.0004477366227089122, "train_loss": 0.026073855690526584, "epoch": 43}
45
+ {"train_lr": 0.00044528476349357706, "train_loss": 0.02558653131257146, "epoch": 44}
46
+ {"train_lr": 0.0004427837423833779, "train_loss": 0.025155968964189517, "epoch": 45}
47
+ {"train_lr": 0.0004402341889969815, "train_loss": 0.024923711238267036, "epoch": 46}
48
+ {"train_lr": 0.00043763674517082824, "train_loss": 0.024778983413970626, "epoch": 47}
49
+ {"train_lr": 0.00043499206479752557, "train_loss": 0.02437653219389572, "epoch": 48}
50
+ {"train_lr": 0.0004323008136611902, "train_loss": 0.024127835892176, "epoch": 49}
51
+ {"train_lr": 0.0004295636692699243, "train_loss": 0.024061144793673307, "epoch": 50}
52
+ {"train_lr": 0.0004267813206851613, "train_loss": 0.02371762236895402, "epoch": 51}
53
+ {"train_lr": 0.00042395446834832116, "train_loss": 0.023586711529009177, "epoch": 52}
54
+ {"train_lr": 0.0004210838239043303, "train_loss": 0.02339996546571059, "epoch": 53}
55
+ {"train_lr": 0.000418170110022581, "train_loss": 0.023331272883557557, "epoch": 54}
56
+ {"train_lr": 0.0004152140602149747, "train_loss": 0.022939835333343955, "epoch": 55}
57
+ {"train_lr": 0.0004122164186512228, "train_loss": 0.022742653930062685, "epoch": 56}
58
+ {"train_lr": 0.0004091779399715766, "train_loss": 0.022589488850228434, "epoch": 57}
59
+ {"train_lr": 0.00040609938909678126, "train_loss": 0.02226874454806062, "epoch": 58}
60
+ {"train_lr": 0.0004029815410355584, "train_loss": 0.022061608113099807, "epoch": 59}
61
+ {"train_lr": 0.0003998251806894967, "train_loss": 0.0218637260706577, "epoch": 60}
62
+ {"train_lr": 0.0003966311026554213, "train_loss": 0.021659375753381765, "epoch": 61}
63
+ {"train_lr": 0.00039340011102539246, "train_loss": 0.021473534835900046, "epoch": 62}
64
+ {"train_lr": 0.00039013301918427843, "train_loss": 0.02136045050270073, "epoch": 63}
65
+ {"train_lr": 0.0003868306496049915, "train_loss": 0.021258544771603508, "epoch": 64}
66
+ {"train_lr": 0.00038349383364139636, "train_loss": 0.021133298709823525, "epoch": 65}
67
+ {"train_lr": 0.00038012341131907234, "train_loss": 0.021022808593492766, "epoch": 66}
68
+ {"train_lr": 0.0003767202311238196, "train_loss": 0.02089578813532913, "epoch": 67}
69
+ {"train_lr": 0.00037328514978804834, "train_loss": 0.020739652609188294, "epoch": 68}
70
+ {"train_lr": 0.0003698190320751148, "train_loss": 0.020612976758250082, "epoch": 69}
71
+ {"train_lr": 0.0003663227505616289, "train_loss": 0.020530629719294605, "epoch": 70}
72
+ {"train_lr": 0.0003627971854177555, "train_loss": 0.020418202951371936, "epoch": 71}
73
+ {"train_lr": 0.0003592432241856427, "train_loss": 0.020347804001564475, "epoch": 72}
74
+ {"train_lr": 0.00035566176155605976, "train_loss": 0.020233220371425876, "epoch": 73}
75
+ {"train_lr": 0.00035205369914305997, "train_loss": 0.020152423528576206, "epoch": 74}
76
+ {"train_lr": 0.000348419945257054, "train_loss": 0.020014205569804946, "epoch": 75}
77
+ {"train_lr": 0.0003447614146761572, "train_loss": 0.019932750324309353, "epoch": 76}
78
+ {"train_lr": 0.00034107902841587126, "train_loss": 0.01980366973392981, "epoch": 77}
79
+ {"train_lr": 0.00033737371349725365, "train_loss": 0.019748475697988082, "epoch": 78}
80
+ {"train_lr": 0.00033364640271351683, "train_loss": 0.019675734331181676, "epoch": 79}
81
+ {"train_lr": 0.00032989803439521125, "train_loss": 0.019610411182588324, "epoch": 80}
82
+ {"train_lr": 0.00032612955217403125, "train_loss": 0.019501670381825986, "epoch": 81}
83
+ {"train_lr": 0.0003223419047452072, "train_loss": 0.019465307419461952, "epoch": 82}
84
+ {"train_lr": 0.00031853604562872363, "train_loss": 0.019317056300060628, "epoch": 83}
85
+ {"train_lr": 0.000314712932929276, "train_loss": 0.01924570535176884, "epoch": 84}
86
+ {"train_lr": 0.00031087352909502683, "train_loss": 0.01921790678825727, "epoch": 85}
87
+ {"train_lr": 0.0003070188006753687, "train_loss": 0.0191203878184208, "epoch": 86}
88
+ {"train_lr": 0.0003031497180775688, "train_loss": 0.018995062414310645, "epoch": 87}
89
+ {"train_lr": 0.00029926725532246237, "train_loss": 0.018894653228115295, "epoch": 88}
90
+ {"train_lr": 0.000295372389799301, "train_loss": 0.018844347112270145, "epoch": 89}
91
+ {"train_lr": 0.0002914661020196496, "train_loss": 0.018712236197917165, "epoch": 90}
92
+ {"train_lr": 0.00028754937537056586, "train_loss": 0.018601788093821667, "epoch": 91}
93
+ {"train_lr": 0.00028362319586703824, "train_loss": 0.018510111748926545, "epoch": 92}
94
+ {"train_lr": 0.0002796885519037529, "train_loss": 0.018389944572524148, "epoch": 93}
95
+ {"train_lr": 0.0002757464340062982, "train_loss": 0.01826450743363705, "epoch": 94}
96
+ {"train_lr": 0.0002717978345817676, "train_loss": 0.018135870946037018, "epoch": 95}
97
+ {"train_lr": 0.00026784374766894995, "train_loss": 0.017987648956262522, "epoch": 96}
98
+ {"train_lr": 0.0002638851686880748, "train_loss": 0.017831332910776397, "epoch": 97}
99
+ {"train_lr": 0.0002599230941902473, "train_loss": 0.017715244356683084, "epoch": 98}
100
+ {"train_lr": 0.0002559585216065196, "train_loss": 0.017702003495481893, "epoch": 99}
101
+ {"train_lr": 0.0002519924489968411, "train_loss": 0.017629278209084092, "epoch": 100}
102
+ {"train_lr": 0.0002480258747987811, "train_loss": 0.017556594441993915, "epoch": 101}
results_s0_evals20_tt_window_obs_checkpoint-100.csv ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ n_eval,success_rate,task_name
2
+ 20,0.55,MemFruitInSinkRightFar
3
+ 20,0.6,MemFruitInSinkLeftFar
4
+ 20,0.25,MemPutKBreadInMicrowave
5
+ 20,0.35,MemWashAndReturnRight
6
+ 20,0.25,MemWashAndReturnLeft
7
+ 20,0.6,MemHeatPot
results_s0_evals20_tt_window_obs_checkpoint-50.csv ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ n_eval,success_rate,task_name
2
+ 20,0.4,MemFruitInSinkRightFar
3
+ 20,0.35,MemFruitInSinkLeftFar
4
+ 20,0.45,MemPutKBreadInMicrowave
5
+ 20,0.3,MemWashAndReturnRight
6
+ 20,0.35,MemWashAndReturnLeft
7
+ 20,0.7,MemHeatPot
results_s0_evals20_tt_window_obs_checkpoint-60.csv ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ n_eval,success_rate,task_name
2
+ 20,0.2,MemFruitInSinkRightFar
3
+ 20,0.55,MemFruitInSinkLeftFar
4
+ 20,0.1,MemPutKBreadInMicrowave
5
+ 20,0.35,MemWashAndReturnRight
6
+ 20,0.5,MemWashAndReturnLeft
7
+ 20,0.8,MemHeatPot
results_s0_evals20_tt_window_obs_checkpoint-70.csv ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ n_eval,success_rate,task_name
2
+ 20,0.35,MemFruitInSinkRightFar
3
+ 20,0.5,MemFruitInSinkLeftFar
4
+ 20,0.05,MemPutKBreadInMicrowave
5
+ 20,0.3,MemWashAndReturnRight
6
+ 20,0.35,MemWashAndReturnLeft
7
+ 20,0.7,MemHeatPot
results_s0_evals20_tt_window_obs_checkpoint-80.csv ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ n_eval,success_rate,task_name
2
+ 20,0.4,MemFruitInSinkRightFar
3
+ 20,0.4,MemFruitInSinkLeftFar
4
+ 20,0.2,MemPutKBreadInMicrowave
5
+ 20,0.4,MemWashAndReturnRight
6
+ 20,0.3,MemWashAndReturnLeft
7
+ 20,0.75,MemHeatPot
results_s0_evals20_tt_window_obs_checkpoint-90.csv ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ n_eval,success_rate,task_name
2
+ 20,0.4,MemFruitInSinkRightFar
3
+ 20,0.4,MemFruitInSinkLeftFar
4
+ 20,0.2,MemPutKBreadInMicrowave
5
+ 20,0.2,MemWashAndReturnRight
6
+ 20,0.4,MemWashAndReturnLeft
7
+ 20,0.8,MemHeatPot
run-prism.yaml ADDED
@@ -0,0 +1,122 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ dataset_cfg:
2
+ action_noise: 0.0
3
+ dataset_json:
4
+ - /storage/nfs/xzhang/experiments/nopool_exps/exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress/exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress/task_robocasa_mem_four.json
5
+ dataset_val_json:
6
+ - ''
7
+ load_in_mem: false
8
+ n_examples_only: -1
9
+ non_overlapping:
10
+ - 2
11
+ num_repeat_traj:
12
+ - 256
13
+ proprio_noise: 0.005
14
+ sample_each_state: false
15
+ task_name: ''
16
+ task_names: null
17
+ train_on_exploration: false
18
+ use_dali: true
19
+ dataset_json_contents:
20
+ - action_keys:
21
+ - actions
22
+ dataset_path:
23
+ - memory/MemPutKBreadInMicrowave/2025-07-25-10-40-55/demo_im128_notp.hdf5
24
+ - memory/MemPutKBreadInMicrowave/2025-07-25-13-25-05/demo_im128_notp.hdf5
25
+ - memory/MemPutKBreadInMicrowave/2025-07-25-14-50-59/demo_im128_notp.hdf5
26
+ - memory/MemFruitInSinkLeftFar/2025-07-13-15-44-32/demo_im128_notp.hdf5
27
+ - memory/MemFruitInSinkRightFar/2025-07-15-15-07-57/demo_im128_notp.hdf5
28
+ - memory/MemHeatPot/2025-07-24-22-26-20/demo_im128_notp.hdf5
29
+ - memory/MemHeatPot/2025-07-25-15-56-53/demo_im128_notp.hdf5
30
+ - memory/MemWashAndReturnLeft/2025-07-25-00-12-14/demo_im128_notp.hdf5
31
+ - memory/MemWashAndReturnRight/2025-07-25-00-45-53/demo_im128_notp.hdf5
32
+ group_method: dinov2
33
+ image_keys:
34
+ - obs/robot0_agentview_center_image
35
+ - obs/robot0_eye_in_hand_image
36
+ low_dim_keys: []
37
+ max_traj_len: 1024
38
+ proprio_keys:
39
+ - obs/robot0_joint_pos_cos
40
+ - obs/robot0_gripper_qpos
41
+ device: cuda
42
+ dist_on_itp: false
43
+ dist_url: env://
44
+ load_config: null
45
+ logging_cfg:
46
+ log_dir: /storage/nfs/xzhang/experiments/nopool_exps/exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress/exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress
47
+ log_name: exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress
48
+ output_dir: /storage/nfs/xzhang/experiments/nopool_exps/exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress/exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress
49
+ model_cfg:
50
+ policy_cfg:
51
+ attn_drop: 0.0
52
+ attn_scale_factor: null
53
+ block_attn_ind: null
54
+ block_pattern_start_offset: 0
55
+ compress_full_attn: true
56
+ compressor_latent_len: 1
57
+ decoder_pred_head: mlp
58
+ full_attn_inds: null
59
+ gate_full_attn_layers: true
60
+ gating_type: sigmoid_g1
61
+ lora_rank: 4
62
+ model_version: v2
63
+ phase: pretrain
64
+ pool_block_inds: null
65
+ position_language_embedding: start
66
+ pretrained_path: null
67
+ remove_action: false
68
+ remove_proprio: false
69
+ scratch_llama_config: config/model_config/libero_1x.json
70
+ tt_window_obs: false
71
+ use_block_attention: true
72
+ use_linear_attention: false
73
+ use_lstm: false
74
+ use_mamba: false
75
+ use_transformer_xl: false
76
+ xl_chunk_factor: 32
77
+ xl_mem_len: 32
78
+ vision_encoder_cfg:
79
+ freeze_all: false
80
+ vision_encoder: /storage/nfs/rshah/datasets/robocasa/datasets/crossmae_rtx/cross-mae-rtx-vitb.pth
81
+ vision_lora: false
82
+ vision_lora_rank: 8
83
+ vision_nonpretrained: false
84
+ vision_unfreeze_all: false
85
+ vision_unfreeze_last_n: 0
86
+ optimizer_cfg:
87
+ blr: 0.001
88
+ lr: 0.0005
89
+ min_lr: 0.0
90
+ warmup_epochs: 2.0
91
+ weight_decay: 0.01
92
+ shared_cfg:
93
+ batch_size: 2
94
+ block_finetune: ''
95
+ downsample_obs: 8
96
+ enable_gradient_checkpointing: false
97
+ gripper_img: true
98
+ has_base_action: true
99
+ is_bimanual: false
100
+ k_ptp: 0
101
+ num_cameras: 2
102
+ num_pred_steps: 32
103
+ pad_to_max_length: true
104
+ resume: null
105
+ save_every: 10
106
+ seed: 2
107
+ seq_length: 2048
108
+ split_epoch: 1
109
+ start_epoch: 0
110
+ use_language_conditioning: true
111
+ train: true
112
+ trainer_cfg:
113
+ accum_iter: 32
114
+ break_after_n_epochs: 101
115
+ compile_model: true
116
+ epochs: 200
117
+ num_workers: 72
118
+ pin_memory: true
119
+ val_every: 10
120
+ wandb_project: icrt_reruns
121
+ wandb_watch: true
122
+ world_size: 1
run.yaml ADDED
@@ -0,0 +1,223 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ !!python/object:icrt.util.args.ExperimentConfig
2
+ dataset_cfg: !!python/object:icrt.util.args.DatasetConfig
3
+ action_noise: 0.0
4
+ action_traj_noise: false
5
+ dataset_fraction: 1.0
6
+ dataset_json:
7
+ - /storage/nfs/xzhang/experiments/nopool_exps/exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress/exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress/task_robocasa_mem_four.json
8
+ dataset_val_json:
9
+ - ''
10
+ goal_conditioned: false
11
+ load_in_mem: false
12
+ low_dim_noise: 0.005
13
+ min_subsample_length: 64
14
+ n_examples_only: -1
15
+ non_overlapping:
16
+ - 2
17
+ num_repeat_traj:
18
+ - 256
19
+ num_weighted_steps: 30
20
+ only_k: 10
21
+ proprio_noise: 0.005
22
+ random_patch_masking: false
23
+ rebalance_indices: false
24
+ rebalance_tasks: true
25
+ sample_each_state: false
26
+ shuffle_repeat_traj: true
27
+ shuffle_rnd_prob: 0.0
28
+ sim_score_th: -1.0
29
+ skip_step: false
30
+ sort_by_closeness: false
31
+ sort_by_lang: true
32
+ start_from_beginning: false
33
+ subsample_traj: false
34
+ task_barrier: true
35
+ task_name: ''
36
+ task_names: null
37
+ toy_max_distractors: 1
38
+ toy_max_tasks: 5
39
+ toy_task_id: 1
40
+ toy_train_dataset_size: 1000000
41
+ toy_train_seed: 42
42
+ toy_val_dataset_size: 500000
43
+ toy_val_seed: 84
44
+ train_on_exploration: false
45
+ trim_num: -1
46
+ trim_set: ''
47
+ use_dali: true
48
+ val_only_k: 5
49
+ video_conditioned: false
50
+ vision_aug: true
51
+ weight_by_dataset:
52
+ - 1
53
+ dataset_json_contents:
54
+ - action_keys:
55
+ - actions
56
+ dataset_path:
57
+ - memory/MemPutKBreadInMicrowave/2025-07-25-10-40-55/demo_im128_notp.hdf5
58
+ - memory/MemPutKBreadInMicrowave/2025-07-25-13-25-05/demo_im128_notp.hdf5
59
+ - memory/MemPutKBreadInMicrowave/2025-07-25-14-50-59/demo_im128_notp.hdf5
60
+ - memory/MemFruitInSinkLeftFar/2025-07-13-15-44-32/demo_im128_notp.hdf5
61
+ - memory/MemFruitInSinkRightFar/2025-07-15-15-07-57/demo_im128_notp.hdf5
62
+ - memory/MemHeatPot/2025-07-24-22-26-20/demo_im128_notp.hdf5
63
+ - memory/MemHeatPot/2025-07-25-15-56-53/demo_im128_notp.hdf5
64
+ - memory/MemWashAndReturnLeft/2025-07-25-00-12-14/demo_im128_notp.hdf5
65
+ - memory/MemWashAndReturnRight/2025-07-25-00-45-53/demo_im128_notp.hdf5
66
+ group_method: dinov2
67
+ image_keys:
68
+ - obs/robot0_agentview_center_image
69
+ - obs/robot0_eye_in_hand_image
70
+ low_dim_keys: []
71
+ max_traj_len: 1024
72
+ proprio_keys:
73
+ - obs/robot0_joint_pos_cos
74
+ - obs/robot0_gripper_qpos
75
+ device: cuda
76
+ dist_on_itp: false
77
+ dist_url: env://
78
+ load_config: null
79
+ local_rank: -1
80
+ logging_cfg: !!python/object:icrt.util.args.LoggingConfig
81
+ log_dir: /storage/nfs/xzhang/experiments/nopool_exps/exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress/exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress
82
+ log_name: exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress
83
+ output_dir: /storage/nfs/xzhang/experiments/nopool_exps/exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress/exp_ds8_libero_1x_task_robocasa_mem_four_GBS256_cfgtask_robocasa_mem_four_sl2048_s2_crossmae_block_sigmoid_g1_nopool_compress
84
+ model_cfg: !!python/object:icrt.util.args.ModelConfig
85
+ policy_cfg: !!python/object:icrt.util.args.PolicyConfig
86
+ adapter_mlp_ratio: 4.0
87
+ adapter_num_heads: 8
88
+ add_sink_token_to_full_attn: false
89
+ attn_drop: 0.0
90
+ attn_latent_len: 1
91
+ attn_scale_factor: null
92
+ block_attn_ind: null
93
+ block_pattern_start_offset: 0
94
+ compress_full_attn: true
95
+ compress_include_prev_action: false
96
+ compressor_latent_len: 1
97
+ decoder_cfg_path: config/model_config/action_head.json
98
+ decoder_pred_head: mlp
99
+ full_attn_inds: null
100
+ gate_full_attn_layers: true
101
+ gating_type: sigmoid_g1
102
+ gr00t_add_dit_lora: false
103
+ gr00t_add_full_attn: true
104
+ gr00t_add_lora_to_vision_projector: false
105
+ gr00t_compute_dtype: bfloat16
106
+ gr00t_full_attn_idx:
107
+ - 3
108
+ - 7
109
+ - 11
110
+ - 15
111
+ gr00t_pretrained_model: true
112
+ gr00t_tune_diffusion_model: true
113
+ gr00t_tune_llm: false
114
+ gr00t_tune_projector: true
115
+ gr00t_tune_vision_projector: false
116
+ gr00t_tune_visual: false
117
+ hist_attn_latent_len: 1
118
+ hist_blind_gating: false
119
+ hist_feature_gating: false
120
+ interpolation_factor: null
121
+ llama_ckpt_dir: /home/rutavms/.llama/checkpoints/Llama3.2-1B-Instruct
122
+ load_llama: true
123
+ lora_layer_idxs: null
124
+ lora_rank: 4
125
+ loss_w_action: 1.0
126
+ model_version: v2
127
+ multikv_attn_pool: false
128
+ no_prompt_loss: true
129
+ num_inference_diffusion_steps: null
130
+ num_train_diffusion_steps: null
131
+ phase: pretrain
132
+ pool_block_inds: null
133
+ position_language_embedding: start
134
+ pretrained_path: null
135
+ prop_act_norm: null
136
+ remove_action: false
137
+ remove_proprio: false
138
+ scale_loss: 1.0
139
+ scratch_llama_config: config/model_config/libero_1x.json
140
+ separate_camera_adapter: true
141
+ skip_obs_pooling: true
142
+ step_weight: 1.0
143
+ tt_window_obs: false
144
+ use_block_attention: true
145
+ use_linear_attention: false
146
+ use_lstm: false
147
+ use_mamba: false
148
+ use_reshape_block_attn: false
149
+ use_transformer_xl: false
150
+ use_yarn: null
151
+ vision_projection_layer: false
152
+ xl_chunk_factor: 32
153
+ xl_mem_len: 32
154
+ vision_encoder_cfg: !!python/object:icrt.util.args.VisionEncoderConfig
155
+ bbox_vision_encoder_cfg: config/model_config/bbox_vit_128_16.json
156
+ freeze_all: false
157
+ vision_encoder: /storage/nfs/rshah/datasets/robocasa/datasets/crossmae_rtx/cross-mae-rtx-vitb.pth
158
+ vision_lora: false
159
+ vision_lora_rank: 8
160
+ vision_nonpretrained: false
161
+ vision_unfreeze_all: false
162
+ vision_unfreeze_last_n: 0
163
+ optimizer_cfg: !!python/object:icrt.util.args.OptimizerConfig
164
+ blr: 0.001
165
+ lr: 0.0005
166
+ min_lr: 0.0
167
+ warmup_epochs: 2.0
168
+ weight_decay: 0.01
169
+ shared_cfg: !!python/object:icrt.util.args.SharedConfig
170
+ batch_size: 2
171
+ bbox_noise: 0.015625
172
+ block_finetune: ''
173
+ downsample_obs: 8
174
+ drop_bbox_prob: 0.0
175
+ dropping_prompt_rnd: false
176
+ enable_gradient_checkpointing: false
177
+ gr00t_embodiment_str: single_panda_omron
178
+ gr00t_metadata_path: metadata.json
179
+ gr00t_model_path: nvidia/GR00T-N1.5-3B
180
+ gripper_img: true
181
+ has_base_action: true
182
+ hist_seq_length: 2048
183
+ is_bimanual: false
184
+ k_ptp: 0
185
+ max_bbox_per_img: 15
186
+ no_img: false
187
+ no_img_low_dim: 42
188
+ normalize_io: false
189
+ num_cameras: 2
190
+ num_pred_steps: 32
191
+ num_stages: 1
192
+ only_first_obs: false
193
+ pad_to_max_length: true
194
+ resume: null
195
+ rot_6d: false
196
+ rot_euler: false
197
+ save_every: 10
198
+ seed: 2
199
+ seq_length: 2048
200
+ split_epoch: 1
201
+ start_epoch: 0
202
+ state_center_coords: false
203
+ tokenizer_path: physical-intelligence/fast
204
+ use_bboxes: false
205
+ use_delta_action: false
206
+ use_fast_tokenizer: false
207
+ use_gr00t: false
208
+ use_history: false
209
+ use_language_conditioning: true
210
+ use_toy_vision_dataset: false
211
+ use_vqvae_tokenizer: false
212
+ train: true
213
+ trainer_cfg: !!python/object:icrt.util.args.TrainerConfig
214
+ accum_iter: 32
215
+ break_after_n_epochs: 101
216
+ compile_model: true
217
+ epochs: 200
218
+ num_workers: 72
219
+ pin_memory: true
220
+ val_every: 10
221
+ wandb_project: icrt_reruns
222
+ wandb_watch: true
223
+ world_size: 1
run_id.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ j6hocd88
task_robocasa_mem_four.json ADDED
@@ -0,0 +1,27 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "dataset_path": [
3
+ "memory/MemPutKBreadInMicrowave/2025-07-25-10-40-55/demo_im128_notp.hdf5",
4
+ "memory/MemPutKBreadInMicrowave/2025-07-25-13-25-05/demo_im128_notp.hdf5",
5
+ "memory/MemPutKBreadInMicrowave/2025-07-25-14-50-59/demo_im128_notp.hdf5",
6
+ "memory/MemFruitInSinkLeftFar/2025-07-13-15-44-32/demo_im128_notp.hdf5",
7
+ "memory/MemFruitInSinkRightFar/2025-07-15-15-07-57/demo_im128_notp.hdf5",
8
+ "memory/MemHeatPot/2025-07-24-22-26-20/demo_im128_notp.hdf5",
9
+ "memory/MemHeatPot/2025-07-25-15-56-53/demo_im128_notp.hdf5",
10
+ "memory/MemWashAndReturnLeft/2025-07-25-00-12-14/demo_im128_notp.hdf5",
11
+ "memory/MemWashAndReturnRight/2025-07-25-00-45-53/demo_im128_notp.hdf5"
12
+ ],
13
+ "image_keys": [
14
+ "obs/robot0_agentview_center_image",
15
+ "obs/robot0_eye_in_hand_image"
16
+ ],
17
+ "max_traj_len": 1024,
18
+ "low_dim_keys": [],
19
+ "group_method": "dinov2",
20
+ "proprio_keys": [
21
+ "obs/robot0_joint_pos_cos",
22
+ "obs/robot0_gripper_qpos"
23
+ ],
24
+ "action_keys": [
25
+ "actions"
26
+ ]
27
+ }