File size: 4,760 Bytes
abbb998
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
{
    "type": "sac",
    "n_obs_steps": 1,
    "normalization_mapping": {
        "VISUAL": "MEAN_STD",
        "STATE": "MIN_MAX",
        "ENV": "MIN_MAX",
        "ACTION": "MIN_MAX"
    },
    "input_features": {
        "observation.images.front": {
            "type": "VISUAL",
            "shape": [
                3,
                128,
                128
            ]
        },
        "observation.images.wrist": {
            "type": "VISUAL",
            "shape": [
                3,
                128,
                128
            ]
        },
        "observation.state": {
            "type": "STATE",
            "shape": [
                18
            ]
        }
    },
    "output_features": {
        "action": {
            "type": "ACTION",
            "shape": [
                3
            ]
        }
    },
    "device": "cuda",
    "use_amp": false,
    "push_to_hub": true,
    "repo_id": "yfynb1111/sac",
    "private": null,
    "tags": null,
    "license": null,
    "dataset_stats": {
        "observation.images.front": {
            "mean": [
                0.485,
                0.456,
                0.406
            ],
            "std": [
                0.229,
                0.224,
                0.225
            ]
        },
        "observation.images.wrist": {
            "mean": [
                0.485,
                0.456,
                0.406
            ],
            "std": [
                0.229,
                0.224,
                0.225
            ]
        },
        "observation.state": {
            "min": [
                -0.6897139549255371,
                -1.1421763896942139,
                -0.5745007991790771,
                -2.97829008102417,
                -0.2710767090320587,
                1.3246592283248901,
                -0.04057434946298599,
                -0.21261805295944214,
                -0.4548068344593048,
                -0.6540042757987976,
                -0.3644964098930359,
                -1.1057522296905518,
                -0.40768879652023315,
                -0.2220114767551422,
                0.0,
                0.19176171720027924,
                -0.3013063669204712,
                0.00362197193317115
            ],
            "max": [
                0.5107022523880005,
                0.5516204237937927,
                0.5620884299278259,
                -1.3330878019332886,
                0.32758936285972595,
                3.119610548019409,
                1.8364211320877075,
                0.25358933210372925,
                0.36316126585006714,
                0.14765967428684235,
                0.49947625398635864,
                0.144814133644104,
                0.2820609211921692,
                0.7382049560546875,
                255.0,
                0.6012658476829529,
                0.3005995750427246,
                0.5004003643989563
            ]
        }
    },
    "storage_device": "cpu",
    "vision_encoder_name": "helper2424/resnet10",
    "freeze_vision_encoder": true,
    "image_encoder_hidden_dim": 32,
    "shared_encoder": true,
    "num_discrete_actions": 3,
    "image_embedding_pooling_dim": 8,
    "online_steps": 1000000,
    "online_env_seed": 10000,
    "online_buffer_capacity": 100000,
    "offline_buffer_capacity": 100000,
    "async_prefetch": false,
    "online_step_before_learning": 100,
    "policy_update_freq": 1,
    "discount": 0.97,
    "temperature_init": 0.01,
    "num_critics": 2,
    "num_subsample_critics": null,
    "critic_lr": 0.0003,
    "actor_lr": 0.0003,
    "temperature_lr": 0.0003,
    "critic_target_update_weight": 0.005,
    "utd_ratio": 2,
    "state_encoder_hidden_dim": 256,
    "latent_dim": 64,
    "target_entropy": null,
    "use_backup_entropy": true,
    "grad_clip_norm": 10.0,
    "critic_network_kwargs": {
        "hidden_dims": [
            256,
            256
        ],
        "activate_final": true,
        "final_activation": null
    },
    "actor_network_kwargs": {
        "hidden_dims": [
            256,
            256
        ],
        "activate_final": true
    },
    "policy_kwargs": {
        "use_tanh_squash": true,
        "std_min": 1e-05,
        "std_max": 5.0,
        "init_final": 0.05
    },
    "discrete_critic_network_kwargs": {
        "hidden_dims": [
            256,
            256
        ],
        "activate_final": true,
        "final_activation": null
    },
    "actor_learner_config": {
        "learner_host": "127.0.0.1",
        "learner_port": 50051,
        "policy_parameters_push_frequency": 4,
        "queue_get_timeout": 2
    },
    "concurrency": {
        "actor": "threads",
        "learner": "threads"
    },
    "use_torch_compile": true
}