{
  "model_type": "stellar",
  "library_name": "stellar",
  "code": "https://github.com/microsoft/STELLAR",
  "default": "stellar-b16",
  "models": {
    "stellar-b16": {
      "weights": "stellar-b16.safetensors",
      "category": "main",
      "backbone": "facebook/vit-mae-base",
      "image_size": 224,
      "patch_size": 16,
      "embed_dim": 768,
      "num_sparse_tokens": 16,
      "num_decoder_layers": 6,
      "spatial_temp": 0.06,
      "do_recon": true,
      "do_clustering": true,
      "do_cls": true,
      "num_clusters": 16384,
      "recon_type": "vq"
    },
    "stellar-l16": {
      "weights": "stellar-l16.safetensors",
      "category": "main",
      "backbone": "facebook/vit-mae-large",
      "image_size": 224,
      "patch_size": 16,
      "embed_dim": 1024,
      "num_sparse_tokens": 16,
      "num_decoder_layers": 6,
      "spatial_temp": 0.06,
      "do_recon": true,
      "do_clustering": true,
      "do_cls": true,
      "num_clusters": 16384,
      "recon_type": "vq"
    },
    "stellar-h16": {
      "weights": "stellar-h16.safetensors",
      "category": "main",
      "backbone": "facebook/vit-mae-huge",
      "image_size": 224,
      "patch_size": 14,
      "embed_dim": 1280,
      "num_sparse_tokens": 16,
      "num_decoder_layers": 6,
      "spatial_temp": 0.06,
      "do_recon": true,
      "do_clustering": true,
      "do_cls": true,
      "num_clusters": 16384,
      "recon_type": "vq"
    },
    "stellar-b8": {
      "weights": "stellar-b8.safetensors",
      "category": "ablation",
      "backbone": "facebook/vit-mae-base",
      "image_size": 224,
      "patch_size": 16,
      "embed_dim": 768,
      "num_sparse_tokens": 8,
      "num_decoder_layers": 6,
      "spatial_temp": 0.06,
      "do_recon": true,
      "do_clustering": true,
      "do_cls": true,
      "num_clusters": 16384,
      "recon_type": "vq"
    },
    "stellar-b24": {
      "weights": "stellar-b24.safetensors",
      "category": "ablation",
      "backbone": "facebook/vit-mae-base",
      "image_size": 224,
      "patch_size": 16,
      "embed_dim": 768,
      "num_sparse_tokens": 24,
      "num_decoder_layers": 6,
      "spatial_temp": 0.06,
      "do_recon": true,
      "do_clustering": true,
      "do_cls": true,
      "num_clusters": 16384,
      "recon_type": "vq"
    }
  }
}