File size: 2,680 Bytes
cde0ae5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4db10fe
cde0ae5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
d3f45e8
 
 
cde0ae5
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
{
    "type": "transformer_flow_matching",
    "n_obs_steps": 2,
    "input_features": {
        "observation.state": {
            "type": "STATE",
            "shape": [
                7
            ]
        },
        "observation.box": {
            "type": "STATE",
            "shape": [
                6,
                6
            ]
        },
        "observation.images.gripper": {
            "type": "VISUAL",
            "shape": [
                3,
                400,
                640
            ]
        },
        "observation.images.front": {
            "type": "VISUAL",
            "shape": [
                3,
                400,
                640
            ]
        },
        "observation.images.right": {
            "type": "VISUAL",
            "shape": [
                3,
                400,
                640
            ]
        }
    },
    "output_features": {
        "action": {
            "type": "ACTION",
            "shape": [
                7
            ]
        }
    },
    "device": "cuda",
    "use_amp": false,
    "push_to_hub": true,
    "repo_id": null,
    "private": null,
    "tags": null,
    "license": null,
    "pretrained_path": null,
    "horizon": 64,
    "n_action_steps": 64,
    "normalization_mapping": {
        "VISUAL": "IDENTITY",
        "STATE": "MEAN_STD",
        "ACTION": "MEAN_STD"
    },
    "vision_input_size": 384,
    "num_cameras": 3,
    "num_vlm_layers": 16,
    "detection_classes": [
        "cube",
        "container"
    ],
    "detection_conf": 0.1,
    "cameras_for_vision_state_concat": [
        "observation.images.front",
        "observation.images.gripper",
        "observation.images.right"
    ],
    "state_dim": 7,
    "action_dim": 7,
    "d_model": 512,
    "nhead": 8,
    "num_decoder_layers": 16,
    "dim_feedforward": 2048,
    "num_inference_steps": 10,
    "noise_temporal_correlation": 0.0,
    "action_dim_weights": [
        1.0,
        1.0,
        1.0,
        0.0,
        1.0,
        1.0,
        1.0
    ],
    "pos_decay_lambda": 0.0,
    "future_steps_weight": 0.3,
    "optimizer_lr": 2.8e-05,
    "optimizer_betas": [
        0.95,
        0.999
    ],
    "optimizer_eps": 1e-08,
    "optimizer_weight_decay": 1e-06,
    "scheduler_warmup_steps": 1500,
    "robot_encoder_tokens": 16,
    "robot_encoder_input_size": 224,
    "lora_rank": 16,
    "lora_alpha": 32,
    "lora_dropout": 0.05,
    "lora_target_modules": [
        "q_proj",
        "v_proj"
    ],
    "vision_lora_num_layers": 8,
    "training_step": 119000,
    "training_epoch": 414,
    "current_lr": 8.581771368787766e-06,
    "training_steps_total": 200000
}