{
  "decoder_args": {
    "attn_bias_for_inference_enabled": false,
    "attn_drop": 0.0,
    "attn_implementation": "flash_attention",
    "decoder_type": "fast3r",
    "depth": 24,
    "drop": 0.0,
    "embed_dim": 1024,
    "enc_embed_dim": 1024,
    "mlp_ratio": 4.0,
    "num_heads": 16,
    "qkv_bias": true,
    "random_image_idx_embedding": true
  },
  "encoder_args": {
    "attn_implementation": "flash_attention",
    "depth": 24,
    "embed_dim": 1024,
    "encoder_type": "croco",
    "img_size": 512,
    "mlp_ratio": 4,
    "num_heads": 16,
    "patch_embed_cls": "PatchEmbedDust3R",
    "patch_size": 16,
    "pos_embed": "RoPE100"
  },
  "head_args": {
    "conf_mode": ["exp", 1, Infinity],
    "depth_mode": ["exp", -Infinity, Infinity],
    "head_type": "dpt",
    "landscape_only": false,
    "output_mode": "pts3d",
    "patch_size": 16,
    "with_local_head": true
  }
}