{
  "_target_": "stable_worldmodel.wm.lewm.LeWM",
  "encoder": {
    "_target_": "stable_pretraining.backbone.utils.vit_hf",
    "size": "tiny",
    "patch_size": 14,
    "image_size": 224,
    "pretrained": false,
    "use_mask_token": false
  },
  "predictor": {
    "_target_": "stable_worldmodel.wm.lewm.module.Predictor",
    "num_frames": 3,
    "input_dim": 192,
    "hidden_dim": 192,
    "output_dim": 192,
    "depth": 6,
    "heads": 16,
    "mlp_dim": 2048,
    "dim_head": 64,
    "dropout": 0.1,
    "emb_dropout": 0.0
  },
  "action_encoder": {
    "_target_": "stable_worldmodel.wm.lewm.module.Embedder",
    "input_dim": 25,
    "emb_dim": 192
  },
  "projector": {
    "_target_": "stable_worldmodel.wm.lewm.module.MLP",
    "input_dim": 192,
    "output_dim": 192,
    "hidden_dim": 2048,
    "norm_fn": {
      "_target_": "torch.nn.BatchNorm1d",
      "_partial_": true
    }
  },
  "pred_proj": {
    "_target_": "stable_worldmodel.wm.lewm.module.MLP",
    "input_dim": 192,
    "output_dim": 192,
    "hidden_dim": 2048,
    "norm_fn": {
      "_target_": "torch.nn.BatchNorm1d",
      "_partial_": true
    }
  }
}