diff --git "a/segmentation/summary.md" "b/segmentation/summary.md" --- "a/segmentation/summary.md" +++ "b/segmentation/summary.md" @@ -92,7 +92,7 @@ | completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | TGRS2025 | 12.8608 | 31.3805 | 7.7093 | 0.1029 | 0.2937 | 0.4161 | 0.6536 | 0.2259 | 0.2791 | 0.3006 | | completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | TGRS2025 | 35.8629 | 109.6158 | 7.7557 | 0.3940 | 0.3604 | 0.4820 | 0.6775 | 0.3004 | 0.3162 | 0.3162 | | completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | TGRS2025 | 35.8629 | 109.6158 | 7.0723 | 0.3940 | 0.4032 | 0.5467 | 0.6849 | 0.2880 | 0.1723 | 0.3015 | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | TGRS2025 | - | - | - | - | - | - | - | - | - | - | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | TGRS2025 | 35.8629 | 109.6158 | 8.6225 | 0.3940 | 0.3839 | 0.5238 | 0.6763 | 0.2742 | 0.3085 | 0.3322 | | completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | TGRS2025 | 11.7259 | 23.5509 | 4.9343 | 0.0876 | 0.3958 | 0.5167 | 0.7279 | 0.3298 | 0.3399 | 0.3399 | | completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | TGRS2025 | 11.7259 | 23.5509 | 4.7844 | 0.0876 | 0.3873 | 0.5091 | 0.7195 | 0.3228 | 0.3406 | 0.3406 | | completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | TGRS2025 | 11.7259 | 23.5509 | 5.0644 | 0.0876 | 0.3578 | 0.4943 | 0.6816 | 0.2752 | 0.3286 | 0.3286 | @@ -181,7 +181,7 @@ | completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | TGRS2025 | - | 0.2791 | - | 0.3006 | 0.3987 | 0.7175 | | completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | TGRS2025 | - | 0.3162 | - | 0.3162 | 0.4125 | 0.6766 | | completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | TGRS2025 | - | 0.1723 | - | 0.3015 | 0.4057 | 0.6379 | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | TGRS2025 | - | - | - | - | - | - | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | TGRS2025 | - | 0.3085 | - | 0.3322 | 0.4453 | 0.6725 | | completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | TGRS2025 | - | 0.3399 | - | 0.3399 | 0.4388 | 0.7646 | | completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | TGRS2025 | - | 0.3406 | - | 0.3406 | 0.4403 | 0.7242 | | completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | TGRS2025 | - | 0.3286 | - | 0.3286 | 0.4342 | 0.7247 | @@ -261,35 +261,35 @@ #### Methods related to vision foundation models -| status | model | backbone | loss | val_miou_present | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | -|:----------|:---------|:------------------------------------------|:---------------------------|:-------------------|:-----------|:--------------|:-----------------|:------------------|:---------------|:--------------------|:-----------------|:----------------|:--------|:--------------|:--------------|:--------------|:---------| -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.2226 | 0.1125 | 0.0002 | 0.7274 | 0.0 | 0.554 | 0.1486 | 0.0072 | 0.0317 | 0.7444 | 0.1957 | 0.1421 | 0.2298 | 0.0 | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.2237 | 0.1148 | 0.0051 | 0.7041 | 0.0363 | 0.5632 | 0.1687 | 0.0383 | 0.0432 | 0.7022 | 0.2138 | 0.1147 | 0.2032 | 0.0 | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.2248 | 0.118 | 0.0046 | 0.7562 | 0.0 | 0.6064 | 0.1149 | 0.0065 | 0.0128 | 0.751 | 0.1902 | 0.1303 | 0.2316 | 0.0 | -| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.3104 | 0.1015 | 0.0 | 0.7134 | 0.0 | 0.6247 | 0.6719 | 0.176 | 0.2155 | 0.8072 | 0.2616 | 0.1836 | 0.2759 | 0.0 | -| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.2909 | 0.2431 | 0.0 | 0.6725 | 0.0 | 0.5426 | 0.6788 | 0.0305 | 0.2741 | 0.7007 | 0.2317 | 0.1473 | 0.2604 | 0.0 | -| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.2859 | 0.1339 | 0.0 | 0.7817 | 0.0 | 0.4701 | 0.5686 | 0.0286 | 0.2696 | 0.8318 | 0.1927 | 0.2125 | 0.2271 | 0.0 | -| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.2971 | 0.2083 | 0.0 | 0.7157 | 0.0 | 0.413 | 0.6491 | 0.0182 | 0.3926 | 0.8202 | 0.2039 | 0.2159 | 0.2254 | 0.0 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.2242 | 0.1131 | 0.0 | 0.7295 | 0.0 | 0.4984 | 0.201 | 0.0047 | 0.0861 | 0.7436 | 0.2142 | 0.1024 | 0.222 | 0.0 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.2326 | 0.0406 | 0.0308 | 0.7612 | 0.0293 | 0.4463 | 0.3085 | 0.0314 | 0.099 | 0.7675 | 0.2151 | 0.0861 | 0.2084 | 0.0 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.2288 | 0.0958 | 0.0017 | 0.7499 | 0.0 | 0.4624 | 0.3107 | 0.0161 | 0.0719 | 0.7424 | 0.2096 | 0.1025 | 0.2108 | 0.0 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.2903 | 0.2215 | 0.0 | 0.7101 | 0.0 | 0.6559 | 0.3378 | 0.0272 | 0.3258 | 0.8101 | 0.2173 | 0.2135 | 0.2544 | 0.0 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.2933 | 0.1862 | 0.0943 | 0.7681 | 0.0029 | 0.5044 | 0.4415 | 0.0284 | 0.349 | 0.7837 | 0.2183 | 0.1966 | 0.2391 | 0.0 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.2906 | 0.2497 | 0.0 | 0.7281 | 0.0 | 0.5613 | 0.4376 | 0.0134 | 0.3647 | 0.8286 | 0.1996 | 0.135 | 0.2599 | 0.0 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.2959 | 0.2226 | 0.0 | 0.7836 | 0.0 | 0.662 | 0.3555 | 0.0263 | 0.2885 | 0.8042 | 0.2741 | 0.1385 | 0.2912 | 0.0 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.3333 | 0.2853 | 0.1837 | 0.7512 | 0.0331 | 0.5979 | 0.5701 | 0.0385 | 0.4021 | 0.7482 | 0.2089 | 0.0936 | 0.2682 | 0.152 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.2841 | 0.2804 | 0.0 | 0.8023 | 0.0 | 0.6016 | 0.4233 | 0.0395 | 0.1251 | 0.8108 | 0.2196 | 0.1075 | 0.2833 | 0.0 | -| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.3094 | 0.2442 | 0.0 | 0.6983 | 0.0 | 0.5238 | 0.6614 | 0.0597 | 0.3171 | 0.8411 | 0.2016 | 0.1772 | 0.2974 | 0.0 | -| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.3035 | 0.3435 | 0.0 | 0.6946 | 0.0 | 0.4638 | 0.5973 | 0.0249 | 0.3706 | 0.7669 | 0.2361 | 0.1646 | 0.2833 | 0.0 | -| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.3214 | 0.3047 | 0.0704 | 0.6523 | 0.0775 | 0.3477 | 0.6681 | 0.1588 | 0.3414 | 0.792 | 0.2382 | 0.1579 | 0.2731 | 0.0959 | -| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.3078 | 0.2153 | 0.0 | 0.7418 | 0.0 | 0.5494 | 0.5569 | 0.0984 | 0.2907 | 0.8285 | 0.2431 | 0.1962 | 0.2809 | 0.0 | -| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.3006 | 0.2044 | 0.0 | 0.752 | 0.0 | 0.5884 | 0.5621 | 0.1586 | 0.105 | 0.8109 | 0.2576 | 0.1881 | 0.2809 | 0.0 | -| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.3162 | 0.3153 | 0.0 | 0.6773 | 0.0 | 0.6218 | 0.6591 | 0.0241 | 0.3258 | 0.8354 | 0.1881 | 0.1855 | 0.2779 | 0.0 | -| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.3015 | 0.4533 | 0.0 | 0.7477 | 0.0559 | 0.5386 | 0.0 | 0.0142 | 0.0 | 0.0 | 0.3457 | 0.015 | 0.2415 | 0.0 | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | - | - | - | - | - | - | - | - | - | - | - | - | - | - | -| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.3399 | 0.3305 | 0.0 | 0.8089 | 0.0 | 0.5578 | 0.6052 | 0.0297 | 0.4677 | 0.8301 | 0.305 | 0.188 | 0.2959 | 0.0 | -| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.3406 | 0.2782 | 0.0 | 0.7491 | 0.0 | 0.5993 | 0.7111 | 0.031 | 0.4681 | 0.777 | 0.2665 | 0.2483 | 0.2992 | 0.0 | -| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.3286 | 0.1744 | 0.1238 | 0.776 | 0.0 | 0.5211 | 0.68 | 0.068 | 0.4502 | 0.7576 | 0.2769 | 0.1504 | 0.293 | 0.0 | +| status | model | backbone | loss | val_miou_present | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | +|:----------|:---------|:------------------------------------------|:---------------------------|-------------------:|-----------:|--------------:|-----------------:|------------------:|---------------:|--------------------:|-----------------:|----------------:|--------:|--------------:|--------------:|--------------:|---------:| +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.2226 | 0.1125 | 0.0002 | 0.7274 | 0.0000 | 0.5540 | 0.1486 | 0.0072 | 0.0317 | 0.7444 | 0.1957 | 0.1421 | 0.2298 | 0.0000 | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.2237 | 0.1148 | 0.0051 | 0.7041 | 0.0363 | 0.5632 | 0.1687 | 0.0383 | 0.0432 | 0.7022 | 0.2138 | 0.1147 | 0.2032 | 0.0000 | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.2248 | 0.1180 | 0.0046 | 0.7562 | 0.0000 | 0.6064 | 0.1149 | 0.0065 | 0.0128 | 0.7510 | 0.1902 | 0.1303 | 0.2316 | 0.0000 | +| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.3104 | 0.1015 | 0.0000 | 0.7134 | 0.0000 | 0.6247 | 0.6719 | 0.1760 | 0.2155 | 0.8072 | 0.2616 | 0.1836 | 0.2759 | 0.0000 | +| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.2909 | 0.2431 | 0.0000 | 0.6725 | 0.0000 | 0.5426 | 0.6788 | 0.0305 | 0.2741 | 0.7007 | 0.2317 | 0.1473 | 0.2604 | 0.0000 | +| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.2859 | 0.1339 | 0.0000 | 0.7817 | 0.0000 | 0.4701 | 0.5686 | 0.0286 | 0.2696 | 0.8318 | 0.1927 | 0.2125 | 0.2271 | 0.0000 | +| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.2971 | 0.2083 | 0.0000 | 0.7157 | 0.0000 | 0.4130 | 0.6491 | 0.0182 | 0.3926 | 0.8202 | 0.2039 | 0.2159 | 0.2254 | 0.0000 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.2242 | 0.1131 | 0.0000 | 0.7295 | 0.0000 | 0.4984 | 0.2010 | 0.0047 | 0.0861 | 0.7436 | 0.2142 | 0.1024 | 0.2220 | 0.0000 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.2326 | 0.0406 | 0.0308 | 0.7612 | 0.0293 | 0.4463 | 0.3085 | 0.0314 | 0.0990 | 0.7675 | 0.2151 | 0.0861 | 0.2084 | 0.0000 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.2288 | 0.0958 | 0.0017 | 0.7499 | 0.0000 | 0.4624 | 0.3107 | 0.0161 | 0.0719 | 0.7424 | 0.2096 | 0.1025 | 0.2108 | 0.0000 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.2903 | 0.2215 | 0.0000 | 0.7101 | 0.0000 | 0.6559 | 0.3378 | 0.0272 | 0.3258 | 0.8101 | 0.2173 | 0.2135 | 0.2544 | 0.0000 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.2933 | 0.1862 | 0.0943 | 0.7681 | 0.0029 | 0.5044 | 0.4415 | 0.0284 | 0.3490 | 0.7837 | 0.2183 | 0.1966 | 0.2391 | 0.0000 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.2906 | 0.2497 | 0.0000 | 0.7281 | 0.0000 | 0.5613 | 0.4376 | 0.0134 | 0.3647 | 0.8286 | 0.1996 | 0.1350 | 0.2599 | 0.0000 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.2959 | 0.2226 | 0.0000 | 0.7836 | 0.0000 | 0.6620 | 0.3555 | 0.0263 | 0.2885 | 0.8042 | 0.2741 | 0.1385 | 0.2912 | 0.0000 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.3333 | 0.2853 | 0.1837 | 0.7512 | 0.0331 | 0.5979 | 0.5701 | 0.0385 | 0.4021 | 0.7482 | 0.2089 | 0.0936 | 0.2682 | 0.1520 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.2841 | 0.2804 | 0.0000 | 0.8023 | 0.0000 | 0.6016 | 0.4233 | 0.0395 | 0.1251 | 0.8108 | 0.2196 | 0.1075 | 0.2833 | 0.0000 | +| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.3094 | 0.2442 | 0.0000 | 0.6983 | 0.0000 | 0.5238 | 0.6614 | 0.0597 | 0.3171 | 0.8411 | 0.2016 | 0.1772 | 0.2974 | 0.0000 | +| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.3035 | 0.3435 | 0.0000 | 0.6946 | 0.0000 | 0.4638 | 0.5973 | 0.0249 | 0.3706 | 0.7669 | 0.2361 | 0.1646 | 0.2833 | 0.0000 | +| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.3214 | 0.3047 | 0.0704 | 0.6523 | 0.0775 | 0.3477 | 0.6681 | 0.1588 | 0.3414 | 0.7920 | 0.2382 | 0.1579 | 0.2731 | 0.0959 | +| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.3078 | 0.2153 | 0.0000 | 0.7418 | 0.0000 | 0.5494 | 0.5569 | 0.0984 | 0.2907 | 0.8285 | 0.2431 | 0.1962 | 0.2809 | 0.0000 | +| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.3006 | 0.2044 | 0.0000 | 0.7520 | 0.0000 | 0.5884 | 0.5621 | 0.1586 | 0.1050 | 0.8109 | 0.2576 | 0.1881 | 0.2809 | 0.0000 | +| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.3162 | 0.3153 | 0.0000 | 0.6773 | 0.0000 | 0.6218 | 0.6591 | 0.0241 | 0.3258 | 0.8354 | 0.1881 | 0.1855 | 0.2779 | 0.0000 | +| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.3015 | 0.4533 | 0.0000 | 0.7477 | 0.0559 | 0.5386 | 0.0000 | 0.0142 | 0.0000 | 0.0000 | 0.3457 | 0.0150 | 0.2415 | 0.0000 | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | 0.3322 | 0.3626 | 0.1104 | 0.6821 | 0.0910 | 0.5331 | 0.6413 | 0.0341 | 0.4602 | 0.7903 | 0.1838 | 0.1738 | 0.2421 | 0.0139 | +| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.3399 | 0.3305 | 0.0000 | 0.8089 | 0.0000 | 0.5578 | 0.6052 | 0.0297 | 0.4677 | 0.8301 | 0.3050 | 0.1880 | 0.2959 | 0.0000 | +| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.3406 | 0.2782 | 0.0000 | 0.7491 | 0.0000 | 0.5993 | 0.7111 | 0.0310 | 0.4681 | 0.7770 | 0.2665 | 0.2483 | 0.2992 | 0.0000 | +| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.3286 | 0.1744 | 0.1238 | 0.7760 | 0.0000 | 0.5211 | 0.6800 | 0.0680 | 0.4502 | 0.7576 | 0.2769 | 0.1504 | 0.2930 | 0.0000 | ### Test @@ -364,35 +364,35 @@ #### Methods related to vision foundation models -| status | model | backbone | loss | test_miou_present | Building | Mining raft | Primary Forest | Water bodies | Agricultural crop | Gravel mounds | Type1 regen | Type2 regen | Bare ground | Sluice | -|:----------|:---------|:------------------------------------------|:---------------------------|:--------------------|:-----------|:--------------|:-----------------|:---------------|:--------------------|:----------------|:--------------|:--------------|:--------------|:---------| -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.2485 | 0.2233 | 0.0211 | 0.6664 | 0.521 | 0.0429 | 0.13 | 0.2979 | 0.2299 | 0.353 | 0.0 | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.2538 | 0.1961 | 0.0877 | 0.6578 | 0.4813 | 0.0741 | 0.1949 | 0.327 | 0.2207 | 0.2989 | 0.0 | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.2503 | 0.2408 | 0.0521 | 0.7055 | 0.5072 | 0.0366 | 0.0794 | 0.2916 | 0.2327 | 0.3569 | 0.0 | -| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.2964 | 0.0894 | 0.0 | 0.6257 | 0.6902 | 0.2007 | 0.3997 | 0.3006 | 0.2397 | 0.4174 | 0.0 | -| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.2916 | 0.2048 | 0.0 | 0.662 | 0.6011 | 0.127 | 0.3726 | 0.2936 | 0.2437 | 0.4108 | 0.0 | -| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.2922 | 0.2637 | 0.0 | 0.7463 | 0.5706 | 0.1557 | 0.3117 | 0.271 | 0.2614 | 0.3418 | 0.0 | -| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.3241 | 0.2783 | 0.0 | 0.6849 | 0.6421 | 0.1958 | 0.4495 | 0.2846 | 0.267 | 0.4384 | 0.0 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.2422 | 0.2552 | 0.0441 | 0.6777 | 0.4286 | 0.0149 | 0.2028 | 0.306 | 0.1635 | 0.3288 | 0.0 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.2207 | 0.0778 | 0.0403 | 0.685 | 0.3653 | 0.0532 | 0.2506 | 0.2871 | 0.1351 | 0.3102 | 0.0027 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.2351 | 0.2074 | 0.0479 | 0.696 | 0.3906 | 0.0482 | 0.1869 | 0.2984 | 0.1556 | 0.3204 | 0.0 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.2885 | 0.2944 | 0.0 | 0.6846 | 0.5456 | 0.1633 | 0.2935 | 0.2949 | 0.2355 | 0.3737 | 0.0 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.2875 | 0.123 | 0.0774 | 0.7163 | 0.6069 | 0.1829 | 0.2916 | 0.2798 | 0.2168 | 0.3805 | 0.0 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.298 | 0.267 | 0.0 | 0.7298 | 0.6004 | 0.1825 | 0.3277 | 0.3039 | 0.1975 | 0.3712 | 0.0 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.3263 | 0.3254 | 0.0 | 0.703 | 0.6784 | 0.255 | 0.3121 | 0.3022 | 0.2285 | 0.4579 | 0.0 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.3696 | 0.3694 | 0.1755 | 0.7118 | 0.697 | 0.3144 | 0.4291 | 0.3081 | 0.197 | 0.4374 | 0.0563 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.345 | 0.3239 | 0.0068 | 0.7604 | 0.7255 | 0.2763 | 0.3453 | 0.3057 | 0.232 | 0.4741 | 0.0 | -| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.3702 | 0.3508 | 0.0 | 0.7085 | 0.8338 | 0.2368 | 0.489 | 0.2883 | 0.243 | 0.5519 | 0.0 | -| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.3374 | 0.4018 | 0.0 | 0.6584 | 0.6353 | 0.2203 | 0.4785 | 0.3156 | 0.2347 | 0.4292 | 0.0 | -| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.3745 | 0.3669 | 0.1513 | 0.7198 | 0.7334 | 0.3035 | 0.4118 | 0.3048 | 0.2127 | 0.4463 | 0.0943 | -| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.3154 | 0.272 | 0.0 | 0.6887 | 0.7224 | 0.1825 | 0.3858 | 0.2794 | 0.1958 | 0.4277 | 0.0 | -| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.2937 | 0.2585 | 0.0 | 0.6911 | 0.5584 | 0.2844 | 0.2812 | 0.2907 | 0.2286 | 0.3438 | 0.0 | -| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.3604 | 0.5642 | 0.0 | 0.6667 | 0.6537 | 0.2792 | 0.4624 | 0.3063 | 0.1918 | 0.48 | 0.0 | -| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.4032 | 0.5654 | 0.1813 | 0.6645 | 0.693 | 0.4172 | 0.4393 | 0.3048 | 0.2272 | 0.4512 | 0.0883 | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | - | - | - | - | - | - | - | - | - | - | - | -| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.3958 | 0.4708 | 0.0 | 0.7259 | 0.7281 | 0.4633 | 0.5327 | 0.3453 | 0.2184 | 0.4735 | 0.0 | -| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.3873 | 0.4662 | 0.0 | 0.7098 | 0.7649 | 0.385 | 0.4858 | 0.3149 | 0.2631 | 0.4838 | 0.0 | -| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.3578 | 0.3334 | 0.1955 | 0.6817 | 0.6728 | 0.2858 | 0.4299 | 0.333 | 0.2123 | 0.4335 | 0.0 | +| status | model | backbone | loss | test_miou_present | Building | Mining raft | Primary Forest | Water bodies | Agricultural crop | Gravel mounds | Type1 regen | Type2 regen | Bare ground | Sluice | +|:----------|:---------|:------------------------------------------|:---------------------------|--------------------:|-----------:|--------------:|-----------------:|---------------:|--------------------:|----------------:|--------------:|--------------:|--------------:|---------:| +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.2485 | 0.2233 | 0.0211 | 0.6664 | 0.5210 | 0.0429 | 0.1300 | 0.2979 | 0.2299 | 0.3530 | 0.0000 | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.2538 | 0.1961 | 0.0877 | 0.6578 | 0.4813 | 0.0741 | 0.1949 | 0.3270 | 0.2207 | 0.2989 | 0.0000 | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.2503 | 0.2408 | 0.0521 | 0.7055 | 0.5072 | 0.0366 | 0.0794 | 0.2916 | 0.2327 | 0.3569 | 0.0000 | +| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.2964 | 0.0894 | 0.0000 | 0.6257 | 0.6902 | 0.2007 | 0.3997 | 0.3006 | 0.2397 | 0.4174 | 0.0000 | +| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.2916 | 0.2048 | 0.0000 | 0.6620 | 0.6011 | 0.1270 | 0.3726 | 0.2936 | 0.2437 | 0.4108 | 0.0000 | +| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.2922 | 0.2637 | 0.0000 | 0.7463 | 0.5706 | 0.1557 | 0.3117 | 0.2710 | 0.2614 | 0.3418 | 0.0000 | +| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.3241 | 0.2783 | 0.0000 | 0.6849 | 0.6421 | 0.1958 | 0.4495 | 0.2846 | 0.2670 | 0.4384 | 0.0000 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.2422 | 0.2552 | 0.0441 | 0.6777 | 0.4286 | 0.0149 | 0.2028 | 0.3060 | 0.1635 | 0.3288 | 0.0000 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.2207 | 0.0778 | 0.0403 | 0.6850 | 0.3653 | 0.0532 | 0.2506 | 0.2871 | 0.1351 | 0.3102 | 0.0027 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.2351 | 0.2074 | 0.0479 | 0.6960 | 0.3906 | 0.0482 | 0.1869 | 0.2984 | 0.1556 | 0.3204 | 0.0000 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.2885 | 0.2944 | 0.0000 | 0.6846 | 0.5456 | 0.1633 | 0.2935 | 0.2949 | 0.2355 | 0.3737 | 0.0000 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.2875 | 0.1230 | 0.0774 | 0.7163 | 0.6069 | 0.1829 | 0.2916 | 0.2798 | 0.2168 | 0.3805 | 0.0000 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.2980 | 0.2670 | 0.0000 | 0.7298 | 0.6004 | 0.1825 | 0.3277 | 0.3039 | 0.1975 | 0.3712 | 0.0000 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.3263 | 0.3254 | 0.0000 | 0.7030 | 0.6784 | 0.2550 | 0.3121 | 0.3022 | 0.2285 | 0.4579 | 0.0000 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.3696 | 0.3694 | 0.1755 | 0.7118 | 0.6970 | 0.3144 | 0.4291 | 0.3081 | 0.1970 | 0.4374 | 0.0563 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.3450 | 0.3239 | 0.0068 | 0.7604 | 0.7255 | 0.2763 | 0.3453 | 0.3057 | 0.2320 | 0.4741 | 0.0000 | +| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.3702 | 0.3508 | 0.0000 | 0.7085 | 0.8338 | 0.2368 | 0.4890 | 0.2883 | 0.2430 | 0.5519 | 0.0000 | +| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.3374 | 0.4018 | 0.0000 | 0.6584 | 0.6353 | 0.2203 | 0.4785 | 0.3156 | 0.2347 | 0.4292 | 0.0000 | +| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.3745 | 0.3669 | 0.1513 | 0.7198 | 0.7334 | 0.3035 | 0.4118 | 0.3048 | 0.2127 | 0.4463 | 0.0943 | +| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.3154 | 0.2720 | 0.0000 | 0.6887 | 0.7224 | 0.1825 | 0.3858 | 0.2794 | 0.1958 | 0.4277 | 0.0000 | +| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.2937 | 0.2585 | 0.0000 | 0.6911 | 0.5584 | 0.2844 | 0.2812 | 0.2907 | 0.2286 | 0.3438 | 0.0000 | +| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.3604 | 0.5642 | 0.0000 | 0.6667 | 0.6537 | 0.2792 | 0.4624 | 0.3063 | 0.1918 | 0.4800 | 0.0000 | +| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.4032 | 0.5654 | 0.1813 | 0.6645 | 0.6930 | 0.4172 | 0.4393 | 0.3048 | 0.2272 | 0.4512 | 0.0883 | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | 0.3839 | 0.4388 | 0.2110 | 0.6440 | 0.7298 | 0.3573 | 0.4806 | 0.2910 | 0.1887 | 0.4537 | 0.0440 | +| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.3958 | 0.4708 | 0.0000 | 0.7259 | 0.7281 | 0.4633 | 0.5327 | 0.3453 | 0.2184 | 0.4735 | 0.0000 | +| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.3873 | 0.4662 | 0.0000 | 0.7098 | 0.7649 | 0.3850 | 0.4858 | 0.3149 | 0.2631 | 0.4838 | 0.0000 | +| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.3578 | 0.3334 | 0.1955 | 0.6817 | 0.6728 | 0.2858 | 0.4299 | 0.3330 | 0.2123 | 0.4335 | 0.0000 | @@ -470,35 +470,35 @@ Protocol: image-level labels are derived from predicted and GT segmentation maps #### Methods related to vision foundation models -| status | model | backbone | loss | cp | cr | cf1 | op | or | of1 | map | macro_f1 | micro_f1 | sample_f1 | -|:----------|:---------|:------------------------------------------|:---------------------------|:-------|:-------|:-------|:-------|:-------|:-------|:-------|:-----------|:-----------|:------------| -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.2355 | 0.5864 | 0.3361 | 0.3986 | 0.9369 | 0.5592 | 0.4075 | 0.3792 | 0.5592 | 0.5593 | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.2349 | 0.7073 | 0.3527 | 0.3736 | 0.9328 | 0.5335 | 0.4238 | 0.3532 | 0.5335 | 0.5301 | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.2626 | 0.5864 | 0.3627 | 0.4156 | 0.9272 | 0.5739 | 0.4167 | 0.4089 | 0.5739 | 0.5847 | -| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.5128 | 0.4649 | 0.4877 | 0.7287 | 0.7158 | 0.7222 | 0.4248 | 0.6207 | 0.7222 | 0.7634 | -| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.5511 | 0.4662 | 0.5051 | 0.6861 | 0.7295 | 0.7071 | 0.4231 | 0.6135 | 0.7071 | 0.7282 | -| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.5192 | 0.4578 | 0.4866 | 0.7222 | 0.7416 | 0.7317 | 0.4200 | 0.5871 | 0.7317 | 0.7774 | -| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4133 | 0.5190 | 0.4602 | 0.6086 | 0.7911 | 0.6879 | 0.4381 | 0.5727 | 0.6879 | 0.7149 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.2597 | 0.5792 | 0.3586 | 0.4626 | 0.9134 | 0.6142 | 0.4036 | 0.4507 | 0.6142 | 0.6247 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.2663 | 0.7744 | 0.3963 | 0.4428 | 0.9136 | 0.5965 | 0.4245 | 0.3837 | 0.5965 | 0.6216 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.3021 | 0.6078 | 0.4036 | 0.4850 | 0.9138 | 0.6336 | 0.4190 | 0.4576 | 0.6336 | 0.6419 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.4659 | 0.4935 | 0.4793 | 0.7006 | 0.7490 | 0.7240 | 0.4392 | 0.5926 | 0.7240 | 0.7614 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.4550 | 0.6322 | 0.5292 | 0.6422 | 0.8003 | 0.7126 | 0.4711 | 0.4992 | 0.7126 | 0.7651 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.4567 | 0.5080 | 0.4810 | 0.6559 | 0.7778 | 0.7117 | 0.4388 | 0.5864 | 0.7117 | 0.7417 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.3897 | 0.5442 | 0.4542 | 0.6344 | 0.8250 | 0.7173 | 0.4468 | 0.5610 | 0.7173 | 0.7767 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.4677 | 0.7451 | 0.5747 | 0.6376 | 0.8058 | 0.7119 | 0.5729 | 0.5353 | 0.7119 | 0.7611 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.4602 | 0.5203 | 0.4884 | 0.6902 | 0.8206 | 0.7498 | 0.4528 | 0.6050 | 0.7498 | 0.8055 | -| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.4653 | 0.4923 | 0.4784 | 0.6713 | 0.7035 | 0.6870 | 0.4363 | 0.5903 | 0.6870 | 0.7127 | -| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.3921 | 0.5559 | 0.4598 | 0.5948 | 0.7817 | 0.6755 | 0.4528 | 0.5535 | 0.6755 | 0.7050 | -| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.5323 | 0.6295 | 0.5768 | 0.6660 | 0.7097 | 0.6872 | 0.4991 | 0.5572 | 0.6872 | 0.7127 | -| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.5471 | 0.4611 | 0.5005 | 0.7536 | 0.7242 | 0.7386 | 0.4279 | 0.6304 | 0.7386 | 0.7741 | -| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.4827 | 0.4964 | 0.4894 | 0.7089 | 0.7754 | 0.7407 | 0.4463 | 0.6205 | 0.7407 | 0.7816 | -| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.3721 | 0.5759 | 0.4521 | 0.5735 | 0.8223 | 0.6758 | 0.4717 | 0.5728 | 0.6758 | 0.7050 | -| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.5954 | 0.7652 | 0.6697 | 0.5250 | 0.8421 | 0.6467 | 0.7194 | 0.6368 | 0.6467 | 0.6806 | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | - | - | - | - | - | - | - | - | - | - | -| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.4540 | 0.5659 | 0.5038 | 0.6690 | 0.8680 | 0.7556 | 0.4858 | 0.6341 | 0.7556 | 0.7976 | -| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.3819 | 0.5878 | 0.4630 | 0.5996 | 0.8484 | 0.7026 | 0.4823 | 0.5800 | 0.7026 | 0.7387 | -| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.3739 | 0.6827 | 0.4832 | 0.5765 | 0.8616 | 0.6908 | 0.5260 | 0.5239 | 0.6908 | 0.7424 | +| status | model | backbone | loss | cp | cr | cf1 | op | or | of1 | map | macro_f1 | micro_f1 | sample_f1 | +|:----------|:---------|:------------------------------------------|:---------------------------|-------:|-------:|-------:|-------:|-------:|-------:|-------:|-----------:|-----------:|------------:| +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.2355 | 0.5864 | 0.3361 | 0.3986 | 0.9369 | 0.5592 | 0.4075 | 0.3792 | 0.5592 | 0.5593 | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.2349 | 0.7073 | 0.3527 | 0.3736 | 0.9328 | 0.5335 | 0.4238 | 0.3532 | 0.5335 | 0.5301 | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.2626 | 0.5864 | 0.3627 | 0.4156 | 0.9272 | 0.5739 | 0.4167 | 0.4089 | 0.5739 | 0.5847 | +| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.5128 | 0.4649 | 0.4877 | 0.7287 | 0.7158 | 0.7222 | 0.4248 | 0.6207 | 0.7222 | 0.7634 | +| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.5511 | 0.4662 | 0.5051 | 0.6861 | 0.7295 | 0.7071 | 0.4231 | 0.6135 | 0.7071 | 0.7282 | +| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.5192 | 0.4578 | 0.4866 | 0.7222 | 0.7416 | 0.7317 | 0.42 | 0.5871 | 0.7317 | 0.7774 | +| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4133 | 0.519 | 0.4602 | 0.6086 | 0.7911 | 0.6879 | 0.4381 | 0.5727 | 0.6879 | 0.7149 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.2597 | 0.5792 | 0.3586 | 0.4626 | 0.9134 | 0.6142 | 0.4036 | 0.4507 | 0.6142 | 0.6247 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.2663 | 0.7744 | 0.3963 | 0.4428 | 0.9136 | 0.5965 | 0.4245 | 0.3837 | 0.5965 | 0.6216 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.3021 | 0.6078 | 0.4036 | 0.485 | 0.9138 | 0.6336 | 0.419 | 0.4576 | 0.6336 | 0.6419 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.4659 | 0.4935 | 0.4793 | 0.7006 | 0.749 | 0.724 | 0.4392 | 0.5926 | 0.724 | 0.7614 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.455 | 0.6322 | 0.5292 | 0.6422 | 0.8003 | 0.7126 | 0.4711 | 0.4992 | 0.7126 | 0.7651 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.4567 | 0.508 | 0.481 | 0.6559 | 0.7778 | 0.7117 | 0.4388 | 0.5864 | 0.7117 | 0.7417 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.3897 | 0.5442 | 0.4542 | 0.6344 | 0.825 | 0.7173 | 0.4468 | 0.561 | 0.7173 | 0.7767 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.4677 | 0.7451 | 0.5747 | 0.6376 | 0.8058 | 0.7119 | 0.5729 | 0.5353 | 0.7119 | 0.7611 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.4602 | 0.5203 | 0.4884 | 0.6902 | 0.8206 | 0.7498 | 0.4528 | 0.605 | 0.7498 | 0.8055 | +| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.4653 | 0.4923 | 0.4784 | 0.6713 | 0.7035 | 0.687 | 0.4363 | 0.5903 | 0.687 | 0.7127 | +| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.3921 | 0.5559 | 0.4598 | 0.5948 | 0.7817 | 0.6755 | 0.4528 | 0.5535 | 0.6755 | 0.705 | +| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.5323 | 0.6295 | 0.5768 | 0.666 | 0.7097 | 0.6872 | 0.4991 | 0.5572 | 0.6872 | 0.7127 | +| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.5471 | 0.4611 | 0.5005 | 0.7536 | 0.7242 | 0.7386 | 0.4279 | 0.6304 | 0.7386 | 0.7741 | +| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.4827 | 0.4964 | 0.4894 | 0.7089 | 0.7754 | 0.7407 | 0.4463 | 0.6205 | 0.7407 | 0.7816 | +| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.3721 | 0.5759 | 0.4521 | 0.5735 | 0.8223 | 0.6758 | 0.4717 | 0.5728 | 0.6758 | 0.705 | +| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.5954 | 0.7652 | 0.6697 | 0.525 | 0.8421 | 0.6467 | 0.7194 | 0.6368 | 0.6467 | 0.6806 | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | 0.3894 | 0.7306 | 0.508 | 0.5649 | 0.8231 | 0.67 | 0.5747 | 0.4759 | 0.67 | 0.695 | +| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.454 | 0.5659 | 0.5038 | 0.669 | 0.868 | 0.7556 | 0.4858 | 0.6341 | 0.7556 | 0.7976 | +| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.3819 | 0.5878 | 0.463 | 0.5996 | 0.8484 | 0.7026 | 0.4823 | 0.58 | 0.7026 | 0.7387 | +| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.3739 | 0.6827 | 0.4832 | 0.5765 | 0.8616 | 0.6908 | 0.526 | 0.5239 | 0.6908 | 0.7424 | #### Validation per-class precision @@ -570,35 +570,35 @@ Protocol: image-level labels are derived from predicted and GT segmentation maps ##### Methods related to vision foundation models -| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | -|:----------|:---------|:------------------------------------------|:---------------------------|:-----------|:--------------|:-----------------|:------------------|:---------------|:--------------------|:-----------------|:----------------|:--------|:--------------|:--------------|:--------------|:---------|:-----------| -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.1538 | 0.0909 | 0.8171 | 0.0000 | 0.3927 | 0.1226 | 0.1424 | 0.1163 | 0.2996 | 0.2572 | 0.3201 | 0.3488 | 0.0000 | 0.0000 | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.1293 | 0.0479 | 0.8373 | 0.0165 | 0.3720 | 0.0944 | 0.2645 | 0.1210 | 0.2228 | 0.2512 | 0.3251 | 0.3718 | 0.0000 | 0.0000 | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.3438 | 0.1200 | 0.8300 | 0.0000 | 0.3798 | 0.1432 | 0.1861 | 0.1507 | 0.3156 | 0.2696 | 0.3343 | 0.3402 | 0.0000 | 0.0000 | -| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.4865 | 0.0000 | 0.9335 | 0.0000 | 0.7403 | 0.9701 | 0.5975 | 0.2775 | 0.9854 | 0.5209 | 0.5806 | 0.5744 | 0.0000 | 0.0000 | -| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.5882 | 0.0000 | 0.9004 | 0.0000 | 0.6748 | 0.9533 | 0.7857 | 0.7578 | 0.9568 | 0.4869 | 0.5042 | 0.5562 | 0.0000 | 0.0000 | -| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.5122 | 0.0000 | 0.8997 | 0.0000 | 0.5544 | 0.7933 | 0.8824 | 0.4653 | 0.8673 | 0.6044 | 0.6062 | 0.5645 | 0.0000 | 0.0000 | -| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4464 | 0.0000 | 0.8341 | 0.0000 | 0.4672 | 0.5884 | 0.3820 | 0.5993 | 0.5725 | 0.4643 | 0.5651 | 0.4539 | 0.0000 | 0.0000 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.1855 | 0.0000 | 0.8074 | 0.0000 | 0.4709 | 0.2084 | 0.1457 | 0.1440 | 0.3253 | 0.2782 | 0.4139 | 0.3969 | 0.0000 | 0.0000 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.0533 | 0.0337 | 0.8235 | 0.0141 | 0.5108 | 0.1335 | 0.2759 | 0.1092 | 0.3170 | 0.3233 | 0.4558 | 0.4120 | 0.0000 | 0.0000 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.1197 | 0.1364 | 0.8121 | 0.0000 | 0.5321 | 0.1940 | 0.2849 | 0.1881 | 0.5520 | 0.2884 | 0.4260 | 0.3941 | 0.0000 | 0.0000 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.3945 | 0.0000 | 0.8804 | 0.0000 | 0.7228 | 0.7519 | 0.4815 | 0.2929 | 0.8296 | 0.5785 | 0.5538 | 0.5708 | 0.0000 | 0.0000 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.3609 | 0.2078 | 0.8565 | 0.0077 | 0.5520 | 0.5118 | 0.8571 | 0.2168 | 0.6870 | 0.5066 | 0.6240 | 0.5274 | 0.0000 | 0.0000 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.3392 | 0.0000 | 0.8877 | 0.0000 | 0.6847 | 0.5629 | 0.5897 | 0.4054 | 0.9165 | 0.3673 | 0.6132 | 0.5702 | 0.0000 | 0.0000 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.2336 | 0.0000 | 0.8866 | 0.0000 | 0.6964 | 0.4625 | 0.4417 | 0.2015 | 0.6843 | 0.4617 | 0.5249 | 0.4731 | 0.0000 | 0.0000 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.4286 | 0.2051 | 0.8933 | 0.0674 | 0.6260 | 0.8118 | 0.3783 | 0.3059 | 0.6560 | 0.4563 | 0.5283 | 0.4631 | 0.2593 | 0.0000 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.3439 | 0.0000 | 0.8400 | 0.0000 | 0.6892 | 0.7429 | 0.5618 | 0.3434 | 0.8080 | 0.5104 | 0.6251 | 0.5175 | 0.0000 | 0.0000 | -| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.4044 | 0.0000 | 0.9053 | 0.0000 | 0.5245 | 0.8696 | 0.5680 | 0.1716 | 0.9016 | 0.5726 | 0.5307 | 0.6011 | 0.0000 | 0.0000 | -| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.4823 | 0.0000 | 0.9090 | 0.0000 | 0.5169 | 0.5923 | 0.5138 | 0.1813 | 0.3968 | 0.4271 | 0.5960 | 0.4814 | 0.0000 | 0.0000 | -| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.4602 | 0.3846 | 0.9233 | 0.1724 | 0.4865 | 0.7904 | 0.5919 | 0.3402 | 0.8715 | 0.5404 | 0.5273 | 0.5990 | 0.2326 | 0.0000 | -| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.5147 | 0.0000 | 0.9084 | 0.0000 | 0.7443 | 0.8941 | 0.7111 | 0.5970 | 0.9199 | 0.5982 | 0.5711 | 0.6532 | 0.0000 | 0.0000 | -| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.3789 | 0.0000 | 0.8831 | 0.0000 | 0.6940 | 0.8204 | 0.6583 | 0.3478 | 0.8021 | 0.5506 | 0.5713 | 0.5682 | 0.0000 | 0.0000 | -| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.3146 | 0.0000 | 0.8238 | 0.0000 | 0.4487 | 0.6193 | 0.3878 | 0.3004 | 0.5268 | 0.4755 | 0.4691 | 0.4721 | 0.0000 | 0.0000 | -| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.9630 | 0.0000 | 0.6205 | 0.2857 | 0.4143 | 0.0000 | 0.5618 | 0.0000 | 0.0000 | 0.9186 | 0.5112 | 0.4880 | 0.0000 | 0.0000 | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | - | - | - | - | - | - | - | - | - | - | - | - | - | - | -| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.4114 | 0.0000 | 0.8466 | 0.0000 | 0.5210 | 0.9171 | 0.3784 | 0.3625 | 0.7982 | 0.5515 | 0.6135 | 0.5022 | 0.0000 | 0.0000 | -| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.3671 | 0.0000 | 0.8942 | 0.0000 | 0.5373 | 0.8089 | 0.2328 | 0.3293 | 0.2631 | 0.5029 | 0.5641 | 0.4654 | 0.0000 | 0.0000 | -| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.1257 | 0.2278 | 0.8474 | 0.0000 | 0.5212 | 0.7440 | 0.4138 | 0.1757 | 0.2598 | 0.4653 | 0.5556 | 0.5239 | 0.0000 | 0.0000 | +| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | +|:----------|:---------|:------------------------------------------|:---------------------------|-----------:|--------------:|-----------------:|------------------:|---------------:|--------------------:|-----------------:|----------------:|--------:|--------------:|--------------:|--------------:|---------:|-----------:| +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.1538 | 0.0909 | 0.8171 | 0 | 0.3927 | 0.1226 | 0.1424 | 0.1163 | 0.2996 | 0.2572 | 0.3201 | 0.3488 | 0 | 0 | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.1293 | 0.0479 | 0.8373 | 0.0165 | 0.372 | 0.0944 | 0.2645 | 0.121 | 0.2228 | 0.2512 | 0.3251 | 0.3718 | 0 | 0 | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.3438 | 0.12 | 0.83 | 0 | 0.3798 | 0.1432 | 0.1861 | 0.1507 | 0.3156 | 0.2696 | 0.3343 | 0.3402 | 0 | 0 | +| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.4865 | 0 | 0.9335 | 0 | 0.7403 | 0.9701 | 0.5975 | 0.2775 | 0.9854 | 0.5209 | 0.5806 | 0.5744 | 0 | 0 | +| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.5882 | 0 | 0.9004 | 0 | 0.6748 | 0.9533 | 0.7857 | 0.7578 | 0.9568 | 0.4869 | 0.5042 | 0.5562 | 0 | 0 | +| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.5122 | 0 | 0.8997 | 0 | 0.5544 | 0.7933 | 0.8824 | 0.4653 | 0.8673 | 0.6044 | 0.6062 | 0.5645 | 0 | 0 | +| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4464 | 0 | 0.8341 | 0 | 0.4672 | 0.5884 | 0.382 | 0.5993 | 0.5725 | 0.4643 | 0.5651 | 0.4539 | 0 | 0 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.1855 | 0 | 0.8074 | 0 | 0.4709 | 0.2084 | 0.1457 | 0.144 | 0.3253 | 0.2782 | 0.4139 | 0.3969 | 0 | 0 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.0533 | 0.0337 | 0.8235 | 0.0141 | 0.5108 | 0.1335 | 0.2759 | 0.1092 | 0.317 | 0.3233 | 0.4558 | 0.412 | 0 | 0 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.1197 | 0.1364 | 0.8121 | 0 | 0.5321 | 0.194 | 0.2849 | 0.1881 | 0.552 | 0.2884 | 0.426 | 0.3941 | 0 | 0 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.3945 | 0 | 0.8804 | 0 | 0.7228 | 0.7519 | 0.4815 | 0.2929 | 0.8296 | 0.5785 | 0.5538 | 0.5708 | 0 | 0 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.3609 | 0.2078 | 0.8565 | 0.0077 | 0.552 | 0.5118 | 0.8571 | 0.2168 | 0.687 | 0.5066 | 0.624 | 0.5274 | 0 | 0 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.3392 | 0 | 0.8877 | 0 | 0.6847 | 0.5629 | 0.5897 | 0.4054 | 0.9165 | 0.3673 | 0.6132 | 0.5702 | 0 | 0 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.2336 | 0 | 0.8866 | 0 | 0.6964 | 0.4625 | 0.4417 | 0.2015 | 0.6843 | 0.4617 | 0.5249 | 0.4731 | 0 | 0 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.4286 | 0.2051 | 0.8933 | 0.0674 | 0.626 | 0.8118 | 0.3783 | 0.3059 | 0.656 | 0.4563 | 0.5283 | 0.4631 | 0.2593 | 0 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.3439 | 0 | 0.84 | 0 | 0.6892 | 0.7429 | 0.5618 | 0.3434 | 0.808 | 0.5104 | 0.6251 | 0.5175 | 0 | 0 | +| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.4044 | 0 | 0.9053 | 0 | 0.5245 | 0.8696 | 0.568 | 0.1716 | 0.9016 | 0.5726 | 0.5307 | 0.6011 | 0 | 0 | +| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.4823 | 0 | 0.909 | 0 | 0.5169 | 0.5923 | 0.5138 | 0.1813 | 0.3968 | 0.4271 | 0.596 | 0.4814 | 0 | 0 | +| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.4602 | 0.3846 | 0.9233 | 0.1724 | 0.4865 | 0.7904 | 0.5919 | 0.3402 | 0.8715 | 0.5404 | 0.5273 | 0.599 | 0.2326 | 0 | +| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.5147 | 0 | 0.9084 | 0 | 0.7443 | 0.8941 | 0.7111 | 0.597 | 0.9199 | 0.5982 | 0.5711 | 0.6532 | 0 | 0 | +| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.3789 | 0 | 0.8831 | 0 | 0.694 | 0.8204 | 0.6583 | 0.3478 | 0.8021 | 0.5506 | 0.5713 | 0.5682 | 0 | 0 | +| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.3146 | 0 | 0.8238 | 0 | 0.4487 | 0.6193 | 0.3878 | 0.3004 | 0.5268 | 0.4755 | 0.4691 | 0.4721 | 0 | 0 | +| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.963 | 0 | 0.6205 | 0.2857 | 0.4143 | 0 | 0.5618 | 0 | 0 | 0.9186 | 0.5112 | 0.488 | 0 | 0 | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | 0.4731 | 0.0963 | 0.8188 | 0.037 | 0.3772 | 0.5354 | 0.3649 | 0.2771 | 0.4867 | 0.4954 | 0.5144 | 0.5133 | 0.0729 | 0 | +| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.4114 | 0 | 0.8466 | 0 | 0.521 | 0.9171 | 0.3784 | 0.3625 | 0.7982 | 0.5515 | 0.6135 | 0.5022 | 0 | 0 | +| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.3671 | 0 | 0.8942 | 0 | 0.5373 | 0.8089 | 0.2328 | 0.3293 | 0.2631 | 0.5029 | 0.5641 | 0.4654 | 0 | 0 | +| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.1257 | 0.2278 | 0.8474 | 0 | 0.5212 | 0.744 | 0.4138 | 0.1757 | 0.2598 | 0.4653 | 0.5556 | 0.5239 | 0 | 0 | #### Validation per-class recall @@ -669,35 +669,35 @@ Protocol: image-level labels are derived from predicted and GT segmentation maps ##### Methods related to vision foundation models -| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | -|:----------|:---------|:------------------------------------------|:---------------------------|:-----------|:--------------|:-----------------|:------------------|:---------------|:--------------------|:-----------------|:----------------|:--------|:--------------|:--------------|:--------------|:---------|:-----------| -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.4078 | 0.1111 | 0.9792 | 0.0000 | 0.9518 | 0.8068 | 0.1865 | 0.3493 | 0.9651 | 0.9747 | 0.9582 | 0.9323 | 0.0000 | - | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.3981 | 0.4444 | 0.9697 | 0.6667 | 0.9369 | 0.8893 | 0.5346 | 0.6028 | 0.9669 | 0.9796 | 0.8944 | 0.9117 | 0.0000 | - | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.4272 | 0.1667 | 0.9737 | 0.0000 | 0.9353 | 0.7907 | 0.3558 | 0.1859 | 0.9660 | 0.9532 | 0.9336 | 0.9357 | 0.0000 | - | -| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.3711 | 0.0000 | 0.7680 | 0.0000 | 0.7661 | 0.6331 | 0.2712 | 0.2845 | 0.9099 | 0.7920 | 0.5597 | 0.6878 | 0.0000 | - | -| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.3883 | 0.0000 | 0.7663 | 0.0000 | 0.7913 | 0.6368 | 0.0846 | 0.3437 | 0.8901 | 0.7713 | 0.6388 | 0.7500 | 0.0000 | - | -| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.2039 | 0.0000 | 0.8704 | 0.0000 | 0.8367 | 0.6408 | 0.0577 | 0.5662 | 0.9464 | 0.5337 | 0.6110 | 0.6842 | 0.0000 | - | -| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4854 | 0.0000 | 0.8433 | 0.0000 | 0.8731 | 0.7666 | 0.0654 | 0.4845 | 0.9705 | 0.7081 | 0.7177 | 0.8326 | 0.0000 | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.4951 | 0.0000 | 0.9870 | 0.0000 | 0.9045 | 0.6539 | 0.1538 | 0.6507 | 0.9589 | 0.9557 | 0.8569 | 0.9136 | 0.0000 | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.8155 | 0.8333 | 0.9813 | 0.8889 | 0.8523 | 0.8129 | 0.4558 | 0.7690 | 0.9768 | 0.9645 | 0.8126 | 0.9045 | 0.0000 | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.6311 | 0.1667 | 0.9862 | 0.0000 | 0.8967 | 0.7696 | 0.2788 | 0.5099 | 0.9535 | 0.9643 | 0.8267 | 0.9174 | 0.0000 | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.4175 | 0.0000 | 0.7977 | 0.0000 | 0.8093 | 0.4970 | 0.0750 | 0.7211 | 0.9267 | 0.5982 | 0.7777 | 0.7957 | 0.0000 | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.4660 | 0.8889 | 0.9250 | 0.5556 | 0.8149 | 0.6529 | 0.0692 | 0.7690 | 0.9571 | 0.7334 | 0.6090 | 0.7770 | 0.0000 | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.5631 | 0.0000 | 0.8887 | 0.0000 | 0.7673 | 0.5986 | 0.0442 | 0.6338 | 0.9508 | 0.8495 | 0.5238 | 0.7839 | 0.0000 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.5534 | 0.0000 | 0.9093 | 0.0000 | 0.8420 | 0.5453 | 0.1385 | 0.7634 | 0.9374 | 0.8326 | 0.6804 | 0.8729 | 0.0000 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.6699 | 0.8889 | 0.8701 | 0.6667 | 0.8778 | 0.6640 | 0.2212 | 0.7972 | 0.9750 | 0.8621 | 0.5659 | 0.8505 | 0.7778 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.6311 | 0.0000 | 0.9675 | 0.0000 | 0.8470 | 0.6076 | 0.0962 | 0.4789 | 0.9330 | 0.7923 | 0.5310 | 0.8794 | 0.0000 | - | -| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.5340 | 0.0000 | 0.7313 | 0.0000 | 0.8743 | 0.6710 | 0.1365 | 0.5549 | 0.9580 | 0.5533 | 0.6301 | 0.7565 | 0.0000 | - | -| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.6602 | 0.0000 | 0.8001 | 0.0000 | 0.8414 | 0.7163 | 0.1077 | 0.7606 | 0.9821 | 0.8594 | 0.6236 | 0.8752 | 0.0000 | - | -| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.5049 | 0.2778 | 0.7106 | 0.5556 | 0.8106 | 0.7284 | 0.4212 | 0.6028 | 0.9517 | 0.6963 | 0.5918 | 0.7759 | 0.5556 | - | -| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.3398 | 0.0000 | 0.7923 | 0.0000 | 0.7477 | 0.5946 | 0.1846 | 0.3380 | 0.9446 | 0.6611 | 0.6395 | 0.7527 | 0.0000 | - | -| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.3495 | 0.0000 | 0.8510 | 0.0000 | 0.8345 | 0.5976 | 0.2519 | 0.4507 | 0.9634 | 0.7092 | 0.6887 | 0.7561 | 0.0000 | - | -| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.6505 | 0.0000 | 0.8318 | 0.0000 | 0.9216 | 0.7414 | 0.2558 | 0.6761 | 0.9678 | 0.7487 | 0.8381 | 0.8554 | 0.0000 | - | -| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.8387 | - | 1.0000 | 0.6667 | 0.9363 | - | 0.3106 | - | - | 0.9471 | 0.4405 | 0.9819 | - | - | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | - | - | - | - | - | - | - | - | - | - | - | - | - | - | -| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.6990 | 0.0000 | 0.9640 | 0.0000 | 0.9095 | 0.6680 | 0.1346 | 0.5718 | 0.9508 | 0.8181 | 0.7459 | 0.8950 | 0.0000 | - | -| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.7379 | 0.0000 | 0.8616 | 0.0000 | 0.9170 | 0.7284 | 0.2212 | 0.6197 | 0.9812 | 0.8218 | 0.8461 | 0.9072 | 0.0000 | - | -| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.8835 | 1.0000 | 0.9237 | 0.0000 | 0.8818 | 0.7455 | 0.2308 | 0.7380 | 0.9812 | 0.8852 | 0.7352 | 0.8706 | 0.0000 | - | +| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | +|:----------|:---------|:------------------------------------------|:---------------------------|-----------:|:--------------|-----------------:|------------------:|---------------:|:--------------------|-----------------:|:----------------|:--------|--------------:|--------------:|--------------:|:---------|:-----------| +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.4078 | 0.1111 | 0.9792 | 0 | 0.9518 | 0.8068 | 0.1865 | 0.3493 | 0.9651 | 0.9747 | 0.9582 | 0.9323 | 0.0000 | - | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.3981 | 0.4444 | 0.9697 | 0.6667 | 0.9369 | 0.8893 | 0.5346 | 0.6028 | 0.9669 | 0.9796 | 0.8944 | 0.9117 | 0.0000 | - | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.4272 | 0.1667 | 0.9737 | 0 | 0.9353 | 0.7907 | 0.3558 | 0.1859 | 0.9660 | 0.9532 | 0.9336 | 0.9357 | 0.0000 | - | +| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.3711 | 0.0000 | 0.768 | 0 | 0.7661 | 0.6331 | 0.2712 | 0.2845 | 0.9099 | 0.792 | 0.5597 | 0.6878 | 0.0000 | - | +| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.3883 | 0.0000 | 0.7663 | 0 | 0.7913 | 0.6368 | 0.0846 | 0.3437 | 0.8901 | 0.7713 | 0.6388 | 0.75 | 0.0000 | - | +| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.2039 | 0.0000 | 0.8704 | 0 | 0.8367 | 0.6408 | 0.0577 | 0.5662 | 0.9464 | 0.5337 | 0.611 | 0.6842 | 0.0000 | - | +| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4854 | 0.0000 | 0.8433 | 0 | 0.8731 | 0.7666 | 0.0654 | 0.4845 | 0.9705 | 0.7081 | 0.7177 | 0.8326 | 0.0000 | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.4951 | 0.0000 | 0.987 | 0 | 0.9045 | 0.6539 | 0.1538 | 0.6507 | 0.9589 | 0.9557 | 0.8569 | 0.9136 | 0.0000 | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.8155 | 0.8333 | 0.9813 | 0.8889 | 0.8523 | 0.8129 | 0.4558 | 0.7690 | 0.9768 | 0.9645 | 0.8126 | 0.9045 | 0.0000 | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.6311 | 0.1667 | 0.9862 | 0 | 0.8967 | 0.7696 | 0.2788 | 0.5099 | 0.9535 | 0.9643 | 0.8267 | 0.9174 | 0.0000 | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.4175 | 0.0000 | 0.7977 | 0 | 0.8093 | 0.4970 | 0.075 | 0.7211 | 0.9267 | 0.5982 | 0.7777 | 0.7957 | 0.0000 | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.466 | 0.8889 | 0.925 | 0.5556 | 0.8149 | 0.6529 | 0.0692 | 0.7690 | 0.9571 | 0.7334 | 0.609 | 0.777 | 0.0000 | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.5631 | 0.0000 | 0.8887 | 0 | 0.7673 | 0.5986 | 0.0442 | 0.6338 | 0.9508 | 0.8495 | 0.5238 | 0.7839 | 0.0000 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.5534 | 0.0000 | 0.9093 | 0 | 0.842 | 0.5453 | 0.1385 | 0.7634 | 0.9374 | 0.8326 | 0.6804 | 0.8729 | 0.0000 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.6699 | 0.8889 | 0.8701 | 0.6667 | 0.8778 | 0.6640 | 0.2212 | 0.7972 | 0.9750 | 0.8621 | 0.5659 | 0.8505 | 0.7778 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.6311 | 0.0000 | 0.9675 | 0 | 0.847 | 0.6076 | 0.0962 | 0.4789 | 0.9330 | 0.7923 | 0.531 | 0.8794 | 0.0000 | - | +| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.534 | 0.0000 | 0.7313 | 0 | 0.8743 | 0.6710 | 0.1365 | 0.5549 | 0.9580 | 0.5533 | 0.6301 | 0.7565 | 0.0000 | - | +| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.6602 | 0.0000 | 0.8001 | 0 | 0.8414 | 0.7163 | 0.1077 | 0.7606 | 0.9821 | 0.8594 | 0.6236 | 0.8752 | 0.0000 | - | +| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.5049 | 0.2778 | 0.7106 | 0.5556 | 0.8106 | 0.7284 | 0.4212 | 0.6028 | 0.9517 | 0.6963 | 0.5918 | 0.7759 | 0.5556 | - | +| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.3398 | 0.0000 | 0.7923 | 0 | 0.7477 | 0.5946 | 0.1846 | 0.3380 | 0.9446 | 0.6611 | 0.6395 | 0.7527 | 0.0000 | - | +| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.3495 | 0.0000 | 0.851 | 0 | 0.8345 | 0.5976 | 0.2519 | 0.4507 | 0.9634 | 0.7092 | 0.6887 | 0.7561 | 0.0000 | - | +| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.6505 | 0.0000 | 0.8318 | 0 | 0.9216 | 0.7414 | 0.2558 | 0.6761 | 0.9678 | 0.7487 | 0.8381 | 0.8554 | 0.0000 | - | +| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.8387 | - | 1 | 0.6667 | 0.9363 | - | 0.3106 | - | - | 0.9471 | 0.4405 | 0.9819 | - | - | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | 0.767 | 1.0000 | 0.8516 | 0.4444 | 0.917 | 0.7978 | 0.2962 | 0.6986 | 0.9777 | 0.7683 | 0.7609 | 0.8291 | 0.3889 | - | +| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.699 | 0.0000 | 0.964 | 0 | 0.9095 | 0.6680 | 0.1346 | 0.5718 | 0.9508 | 0.8181 | 0.7459 | 0.895 | 0.0000 | - | +| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.7379 | 0.0000 | 0.8616 | 0 | 0.917 | 0.7284 | 0.2212 | 0.6197 | 0.9812 | 0.8218 | 0.8461 | 0.9072 | 0.0000 | - | +| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.8835 | 1.0000 | 0.9237 | 0 | 0.8818 | 0.7455 | 0.2308 | 0.7380 | 0.9812 | 0.8852 | 0.7352 | 0.8706 | 0.0000 | - | #### Validation per-class f1 @@ -768,35 +768,35 @@ Protocol: image-level labels are derived from predicted and GT segmentation maps ##### Methods related to vision foundation models -| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | -|:----------|:---------|:------------------------------------------|:---------------------------|:-----------|:--------------|:-----------------|:------------------|:---------------|:--------------------|:-----------------|:----------------|:--------|:--------------|:--------------|:--------------|:---------|:-----------| -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.2234 | 0.1000 | 0.8909 | - | 0.5560 | 0.2129 | 0.1615 | 0.1745 | 0.4572 | 0.4070 | 0.4799 | 0.5076 | - | - | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.1952 | 0.0865 | 0.8986 | 0.0323 | 0.5326 | 0.1707 | 0.3539 | 0.2016 | 0.3621 | 0.3998 | 0.4769 | 0.5282 | - | - | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.3810 | 0.1395 | 0.8961 | - | 0.5402 | 0.2425 | 0.2444 | 0.1665 | 0.4758 | 0.4204 | 0.4923 | 0.4990 | - | - | -| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.4211 | - | 0.8427 | - | 0.7530 | 0.7662 | 0.3730 | 0.2809 | 0.9461 | 0.6284 | 0.5700 | 0.6260 | - | - | -| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.4678 | - | 0.8280 | - | 0.7284 | 0.7636 | 0.1528 | 0.4729 | 0.9222 | 0.5969 | 0.5636 | 0.6387 | - | - | -| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.2917 | - | 0.8848 | - | 0.6669 | 0.7090 | 0.1083 | 0.5108 | 0.9051 | 0.5669 | 0.6086 | 0.6186 | - | - | -| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4651 | - | 0.8387 | - | 0.6087 | 0.6658 | 0.1117 | 0.5358 | 0.7202 | 0.5609 | 0.6323 | 0.5875 | - | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.2698 | - | 0.8882 | - | 0.6194 | 0.3161 | 0.1497 | 0.2358 | 0.4857 | 0.4310 | 0.5582 | 0.5534 | - | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.1001 | 0.0648 | 0.8955 | 0.0277 | 0.6388 | 0.2294 | 0.3437 | 0.1913 | 0.4787 | 0.4842 | 0.5840 | 0.5662 | - | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.2012 | 0.1500 | 0.8908 | - | 0.6679 | 0.3098 | 0.2818 | 0.2749 | 0.6992 | 0.4439 | 0.5622 | 0.5514 | - | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.4057 | - | 0.8370 | - | 0.7636 | 0.5984 | 0.1298 | 0.4166 | 0.8755 | 0.5882 | 0.6469 | 0.6648 | - | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.4068 | 0.3368 | 0.8894 | 0.0151 | 0.6582 | 0.5738 | 0.1281 | 0.3383 | 0.7999 | 0.5993 | 0.6164 | 0.6283 | - | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.4234 | - | 0.8882 | - | 0.7237 | 0.5802 | 0.0823 | 0.4945 | 0.9333 | 0.5129 | 0.5650 | 0.6602 | - | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.3285 | - | 0.8978 | - | 0.7623 | 0.5005 | 0.2108 | 0.3188 | 0.7911 | 0.5940 | 0.5926 | 0.6136 | - | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.5227 | 0.3333 | 0.8815 | 0.1224 | 0.7308 | 0.7305 | 0.2791 | 0.4422 | 0.7843 | 0.5967 | 0.5464 | 0.5997 | 0.3889 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.4452 | - | 0.8992 | - | 0.7600 | 0.6685 | 0.1642 | 0.4000 | 0.8660 | 0.6208 | 0.5742 | 0.6515 | - | - | -| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.4603 | - | 0.8091 | - | 0.6557 | 0.7575 | 0.2202 | 0.2621 | 0.9289 | 0.5628 | 0.5761 | 0.6699 | - | - | -| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.5574 | - | 0.8511 | - | 0.6404 | 0.6485 | 0.1781 | 0.2928 | 0.5652 | 0.5707 | 0.6095 | 0.6211 | - | - | -| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.4815 | 0.3226 | 0.8031 | 0.2632 | 0.6080 | 0.7581 | 0.4921 | 0.4350 | 0.9099 | 0.6085 | 0.5577 | 0.6761 | 0.3279 | - | -| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.4094 | - | 0.8464 | - | 0.7460 | 0.7142 | 0.2931 | 0.4317 | 0.9321 | 0.6281 | 0.6034 | 0.6994 | - | - | -| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.3636 | - | 0.8668 | - | 0.7578 | 0.6915 | 0.3644 | 0.3926 | 0.8754 | 0.6199 | 0.6245 | 0.6488 | - | - | -| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.4241 | - | 0.8278 | - | 0.6036 | 0.6749 | 0.3082 | 0.4159 | 0.6822 | 0.5816 | 0.6015 | 0.6084 | - | - | -| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.8966 | - | 0.7658 | 0.4000 | 0.5744 | - | 0.4000 | - | - | 0.9326 | 0.4732 | 0.6520 | - | - | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | - | - | - | - | - | - | - | - | - | - | - | - | - | - | -| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.5180 | - | 0.9015 | - | 0.6625 | 0.7730 | 0.1986 | 0.4437 | 0.8679 | 0.6589 | 0.6733 | 0.6434 | - | - | -| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.4903 | - | 0.8776 | - | 0.6775 | 0.7665 | 0.2268 | 0.4301 | 0.4150 | 0.6240 | 0.6769 | 0.6152 | - | - | -| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.2201 | 0.3711 | 0.8839 | - | 0.6552 | 0.7447 | 0.2963 | 0.2839 | 0.4109 | 0.6099 | 0.6329 | 0.6542 | - | - | +| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | +|:----------|:---------|:------------------------------------------|:---------------------------|-----------:|:--------------|-----------------:|:------------------|---------------:|:--------------------|-----------------:|:----------------|:--------|--------------:|--------------:|--------------:|:---------|:-----------| +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.2234 | 0.1000 | 0.8909 | - | 0.556 | 0.2129 | 0.1615 | 0.1745 | 0.4572 | 0.407 | 0.4799 | 0.5076 | - | - | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.1952 | 0.0865 | 0.8986 | 0.0323 | 0.5326 | 0.1707 | 0.3539 | 0.2016 | 0.3621 | 0.3998 | 0.4769 | 0.5282 | - | - | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.381 | 0.1395 | 0.8961 | - | 0.5402 | 0.2425 | 0.2444 | 0.1665 | 0.4758 | 0.4204 | 0.4923 | 0.499 | - | - | +| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.4211 | - | 0.8427 | - | 0.753 | 0.7662 | 0.373 | 0.2809 | 0.9461 | 0.6284 | 0.57 | 0.626 | - | - | +| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.4678 | - | 0.828 | - | 0.7284 | 0.7636 | 0.1528 | 0.4729 | 0.9222 | 0.5969 | 0.5636 | 0.6387 | - | - | +| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.2917 | - | 0.8848 | - | 0.6669 | 0.7090 | 0.1083 | 0.5108 | 0.9051 | 0.5669 | 0.6086 | 0.6186 | - | - | +| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4651 | - | 0.8387 | - | 0.6087 | 0.6658 | 0.1117 | 0.5358 | 0.7202 | 0.5609 | 0.6323 | 0.5875 | - | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.2698 | - | 0.8882 | - | 0.6194 | 0.3161 | 0.1497 | 0.2358 | 0.4857 | 0.431 | 0.5582 | 0.5534 | - | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.1001 | 0.0648 | 0.8955 | 0.0277 | 0.6388 | 0.2294 | 0.3437 | 0.1913 | 0.4787 | 0.4842 | 0.584 | 0.5662 | - | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.2012 | 0.1500 | 0.8908 | - | 0.6679 | 0.3098 | 0.2818 | 0.2749 | 0.6992 | 0.4439 | 0.5622 | 0.5514 | - | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.4057 | - | 0.837 | - | 0.7636 | 0.5984 | 0.1298 | 0.4166 | 0.8755 | 0.5882 | 0.6469 | 0.6648 | - | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.4068 | 0.3368 | 0.8894 | 0.0151 | 0.6582 | 0.5738 | 0.1281 | 0.3383 | 0.7999 | 0.5993 | 0.6164 | 0.6283 | - | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.4234 | - | 0.8882 | - | 0.7237 | 0.5802 | 0.0823 | 0.4945 | 0.9333 | 0.5129 | 0.565 | 0.6602 | - | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.3285 | - | 0.8978 | - | 0.7623 | 0.5005 | 0.2108 | 0.3188 | 0.7911 | 0.594 | 0.5926 | 0.6136 | - | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.5227 | 0.3333 | 0.8815 | 0.1224 | 0.7308 | 0.7305 | 0.2791 | 0.4422 | 0.7843 | 0.5967 | 0.5464 | 0.5997 | 0.3889 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.4452 | - | 0.8992 | - | 0.76 | 0.6685 | 0.1642 | 0.4000 | 0.8660 | 0.6208 | 0.5742 | 0.6515 | - | - | +| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.4603 | - | 0.8091 | - | 0.6557 | 0.7575 | 0.2202 | 0.2621 | 0.9289 | 0.5628 | 0.5761 | 0.6699 | - | - | +| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.5574 | - | 0.8511 | - | 0.6404 | 0.6485 | 0.1781 | 0.2928 | 0.5652 | 0.5707 | 0.6095 | 0.6211 | - | - | +| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.4815 | 0.3226 | 0.8031 | 0.2632 | 0.608 | 0.7581 | 0.4921 | 0.4350 | 0.9099 | 0.6085 | 0.5577 | 0.6761 | 0.3279 | - | +| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.4094 | - | 0.8464 | - | 0.746 | 0.7142 | 0.2931 | 0.4317 | 0.9321 | 0.6281 | 0.6034 | 0.6994 | - | - | +| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.3636 | - | 0.8668 | - | 0.7578 | 0.6915 | 0.3644 | 0.3926 | 0.8754 | 0.6199 | 0.6245 | 0.6488 | - | - | +| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.4241 | - | 0.8278 | - | 0.6036 | 0.6749 | 0.3082 | 0.4159 | 0.6822 | 0.5816 | 0.6015 | 0.6084 | - | - | +| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.8966 | - | 0.7658 | 0.4000 | 0.5744 | - | 0.4 | - | - | 0.9326 | 0.4732 | 0.652 | - | - | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | 0.5852 | 0.1756 | 0.8348 | 0.0684 | 0.5345 | 0.6408 | 0.327 | 0.3968 | 0.6498 | 0.6024 | 0.6138 | 0.6341 | 0.1228 | - | +| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.518 | - | 0.9015 | - | 0.6625 | 0.7730 | 0.1986 | 0.4437 | 0.8679 | 0.6589 | 0.6733 | 0.6434 | - | - | +| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.4903 | - | 0.8776 | - | 0.6775 | 0.7665 | 0.2268 | 0.4301 | 0.4150 | 0.624 | 0.6769 | 0.6152 | - | - | +| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.2201 | 0.3711 | 0.8839 | - | 0.6552 | 0.7447 | 0.2963 | 0.2839 | 0.4109 | 0.6099 | 0.6329 | 0.6542 | - | - | #### Validation per-class ap @@ -867,35 +867,35 @@ Protocol: image-level labels are derived from predicted and GT segmentation maps ##### Methods related to vision foundation models -| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | -|:----------|:---------|:------------------------------------------|:---------------------------|:-----------|:--------------|:-----------------|:------------------|:---------------|:--------------------|:-----------------|:----------------|:--------|:--------------|:--------------|:--------------|:---------|:-----------| -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.2191 | 0.0096 | 0.9383 | 0.0069 | 0.8205 | 0.5164 | 0.1127 | 0.0951 | 0.9262 | 0.5653 | 0.4610 | 0.6260 | 0.0009 | - | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.1944 | 0.0208 | 0.9429 | 0.3143 | 0.7978 | 0.4582 | 0.2012 | 0.0800 | 0.9001 | 0.5689 | 0.4237 | 0.6063 | 0.0009 | - | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.3224 | 0.0276 | 0.9435 | 0.0069 | 0.8053 | 0.5270 | 0.1235 | 0.0614 | 0.9164 | 0.5613 | 0.4695 | 0.6518 | 0.0009 | - | -| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.2031 | 0.0009 | 0.9465 | 0.0069 | 0.7645 | 0.6529 | 0.2829 | 0.1778 | 0.9155 | 0.5509 | 0.4488 | 0.5705 | 0.0009 | - | -| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.2971 | 0.0009 | 0.9396 | 0.0069 | 0.7492 | 0.6576 | 0.1918 | 0.3237 | 0.8937 | 0.5026 | 0.3845 | 0.5520 | 0.0009 | - | -| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.1807 | 0.0009 | 0.9488 | 0.0069 | 0.6934 | 0.6238 | 0.1810 | 0.3679 | 0.9455 | 0.5203 | 0.4782 | 0.5123 | 0.0009 | - | -| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.2762 | 0.0009 | 0.9334 | 0.0069 | 0.6358 | 0.7504 | 0.1578 | 0.4492 | 0.9548 | 0.5350 | 0.4824 | 0.5119 | 0.0009 | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.2528 | 0.0009 | 0.9470 | 0.0069 | 0.7846 | 0.4317 | 0.1195 | 0.2352 | 0.9104 | 0.5679 | 0.4376 | 0.5516 | 0.0009 | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.0876 | 0.0913 | 0.9573 | 0.1113 | 0.7674 | 0.5730 | 0.2050 | 0.1898 | 0.9350 | 0.6007 | 0.4587 | 0.5404 | 0.0009 | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.1419 | 0.0205 | 0.9528 | 0.0069 | 0.7885 | 0.5741 | 0.1858 | 0.2644 | 0.9339 | 0.5852 | 0.4557 | 0.5367 | 0.0009 | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.2712 | 0.0009 | 0.9355 | 0.0069 | 0.8153 | 0.4620 | 0.1548 | 0.5399 | 0.9088 | 0.5377 | 0.4777 | 0.5982 | 0.0009 | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.2498 | 0.4262 | 0.9530 | 0.0147 | 0.7485 | 0.5467 | 0.1779 | 0.4906 | 0.9318 | 0.5421 | 0.4958 | 0.5461 | 0.0009 | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.2932 | 0.0009 | 0.9518 | 0.0069 | 0.7747 | 0.5594 | 0.1462 | 0.4964 | 0.9502 | 0.4687 | 0.4718 | 0.5829 | 0.0009 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.3176 | 0.0009 | 0.9518 | 0.0069 | 0.8274 | 0.4850 | 0.1898 | 0.4126 | 0.9261 | 0.5760 | 0.4695 | 0.6444 | 0.0009 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.4232 | 0.5554 | 0.9507 | 0.2181 | 0.8112 | 0.6726 | 0.1887 | 0.5730 | 0.9518 | 0.5181 | 0.4015 | 0.6179 | 0.5650 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.3914 | 0.0009 | 0.9553 | 0.0069 | 0.8028 | 0.6032 | 0.1957 | 0.2646 | 0.9265 | 0.5695 | 0.5141 | 0.6546 | 0.0009 | - | -| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.3024 | 0.0009 | 0.9297 | 0.0069 | 0.6820 | 0.6814 | 0.2076 | 0.3745 | 0.9558 | 0.4783 | 0.4177 | 0.6337 | 0.0009 | - | -| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.3990 | 0.0009 | 0.9479 | 0.0069 | 0.6335 | 0.6909 | 0.1685 | 0.4685 | 0.9400 | 0.5327 | 0.4665 | 0.6298 | 0.0009 | - | -| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.3311 | 0.2015 | 0.9259 | 0.1437 | 0.4898 | 0.7242 | 0.3809 | 0.4366 | 0.9460 | 0.5164 | 0.4052 | 0.5957 | 0.3914 | - | -| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.2059 | 0.0009 | 0.9447 | 0.0069 | 0.7510 | 0.5947 | 0.2537 | 0.2804 | 0.9399 | 0.5364 | 0.4639 | 0.5836 | 0.0009 | - | -| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.2503 | 0.0009 | 0.9455 | 0.0069 | 0.8007 | 0.6104 | 0.2966 | 0.3153 | 0.9411 | 0.5561 | 0.4659 | 0.6112 | 0.0009 | - | -| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.3704 | 0.0009 | 0.9285 | 0.0069 | 0.8234 | 0.7275 | 0.2129 | 0.4812 | 0.9546 | 0.5150 | 0.4467 | 0.6631 | 0.0009 | - | -| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.8448 | - | 0.9281 | 0.6017 | 0.8329 | - | 0.3077 | - | - | 0.9305 | 0.4889 | 0.8205 | - | - | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | - | - | - | - | - | - | - | - | - | - | - | - | - | - | -| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.3950 | 0.0009 | 0.9601 | 0.0069 | 0.7797 | 0.6850 | 0.1662 | 0.4741 | 0.9393 | 0.6425 | 0.5790 | 0.6866 | 0.0009 | - | -| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.3487 | 0.0009 | 0.9593 | 0.0069 | 0.7939 | 0.7416 | 0.1531 | 0.5089 | 0.9538 | 0.5833 | 0.5272 | 0.6908 | 0.0009 | - | -| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.4842 | 0.4589 | 0.9581 | 0.0067 | 0.7518 | 0.7517 | 0.2067 | 0.5239 | 0.9575 | 0.5892 | 0.5018 | 0.6461 | 0.0009 | - | +| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | +|:----------|:---------|:------------------------------------------|:---------------------------|-----------:|:--------------|-----------------:|------------------:|---------------:|:--------------------|-----------------:|:----------------|:--------|--------------:|--------------:|--------------:|:---------|:-----------| +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.2191 | 0.0096 | 0.9383 | 0.0069 | 0.8205 | 0.5164 | 0.1127 | 0.0951 | 0.9262 | 0.5653 | 0.461 | 0.626 | 0.0009 | - | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.1944 | 0.0208 | 0.9429 | 0.3143 | 0.7978 | 0.4582 | 0.2012 | 0.0800 | 0.9001 | 0.5689 | 0.4237 | 0.6063 | 0.0009 | - | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.3224 | 0.0276 | 0.9435 | 0.0069 | 0.8053 | 0.5270 | 0.1235 | 0.0614 | 0.9164 | 0.5613 | 0.4695 | 0.6518 | 0.0009 | - | +| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.2031 | 0.0009 | 0.9465 | 0.0069 | 0.7645 | 0.6529 | 0.2829 | 0.1778 | 0.9155 | 0.5509 | 0.4488 | 0.5705 | 0.0009 | - | +| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.2971 | 0.0009 | 0.9396 | 0.0069 | 0.7492 | 0.6576 | 0.1918 | 0.3237 | 0.8937 | 0.5026 | 0.3845 | 0.552 | 0.0009 | - | +| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.1807 | 0.0009 | 0.9488 | 0.0069 | 0.6934 | 0.6238 | 0.181 | 0.3679 | 0.9455 | 0.5203 | 0.4782 | 0.5123 | 0.0009 | - | +| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.2762 | 0.0009 | 0.9334 | 0.0069 | 0.6358 | 0.7504 | 0.1578 | 0.4492 | 0.9548 | 0.535 | 0.4824 | 0.5119 | 0.0009 | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.2528 | 0.0009 | 0.947 | 0.0069 | 0.7846 | 0.4317 | 0.1195 | 0.2352 | 0.9104 | 0.5679 | 0.4376 | 0.5516 | 0.0009 | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.0876 | 0.0913 | 0.9573 | 0.1113 | 0.7674 | 0.5730 | 0.205 | 0.1898 | 0.9350 | 0.6007 | 0.4587 | 0.5404 | 0.0009 | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.1419 | 0.0205 | 0.9528 | 0.0069 | 0.7885 | 0.5741 | 0.1858 | 0.2644 | 0.9339 | 0.5852 | 0.4557 | 0.5367 | 0.0009 | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.2712 | 0.0009 | 0.9355 | 0.0069 | 0.8153 | 0.4620 | 0.1548 | 0.5399 | 0.9088 | 0.5377 | 0.4777 | 0.5982 | 0.0009 | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.2498 | 0.4262 | 0.953 | 0.0147 | 0.7485 | 0.5467 | 0.1779 | 0.4906 | 0.9318 | 0.5421 | 0.4958 | 0.5461 | 0.0009 | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.2932 | 0.0009 | 0.9518 | 0.0069 | 0.7747 | 0.5594 | 0.1462 | 0.4964 | 0.9502 | 0.4687 | 0.4718 | 0.5829 | 0.0009 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.3176 | 0.0009 | 0.9518 | 0.0069 | 0.8274 | 0.4850 | 0.1898 | 0.4126 | 0.9261 | 0.576 | 0.4695 | 0.6444 | 0.0009 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.4232 | 0.5554 | 0.9507 | 0.2181 | 0.8112 | 0.6726 | 0.1887 | 0.5730 | 0.9518 | 0.5181 | 0.4015 | 0.6179 | 0.5650 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.3914 | 0.0009 | 0.9553 | 0.0069 | 0.8028 | 0.6032 | 0.1957 | 0.2646 | 0.9265 | 0.5695 | 0.5141 | 0.6546 | 0.0009 | - | +| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.3024 | 0.0009 | 0.9297 | 0.0069 | 0.682 | 0.6814 | 0.2076 | 0.3745 | 0.9558 | 0.4783 | 0.4177 | 0.6337 | 0.0009 | - | +| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.399 | 0.0009 | 0.9479 | 0.0069 | 0.6335 | 0.6909 | 0.1685 | 0.4685 | 0.9400 | 0.5327 | 0.4665 | 0.6298 | 0.0009 | - | +| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.3311 | 0.2015 | 0.9259 | 0.1437 | 0.4898 | 0.7242 | 0.3809 | 0.4366 | 0.9460 | 0.5164 | 0.4052 | 0.5957 | 0.3914 | - | +| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.2059 | 0.0009 | 0.9447 | 0.0069 | 0.751 | 0.5947 | 0.2537 | 0.2804 | 0.9399 | 0.5364 | 0.4639 | 0.5836 | 0.0009 | - | +| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.2503 | 0.0009 | 0.9455 | 0.0069 | 0.8007 | 0.6104 | 0.2966 | 0.3153 | 0.9411 | 0.5561 | 0.4659 | 0.6112 | 0.0009 | - | +| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.3704 | 0.0009 | 0.9285 | 0.0069 | 0.8234 | 0.7275 | 0.2129 | 0.4812 | 0.9546 | 0.515 | 0.4467 | 0.6631 | 0.0009 | - | +| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.8448 | - | 0.9281 | 0.6017 | 0.8329 | - | 0.3077 | - | - | 0.9305 | 0.4889 | 0.8205 | - | - | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | 0.469 | 0.7479 | 0.9258 | 0.3874 | 0.7718 | 0.7614 | 0.2654 | 0.5617 | 0.9629 | 0.5125 | 0.4578 | 0.6069 | 0.0413 | - | +| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.395 | 0.0009 | 0.9601 | 0.0069 | 0.7797 | 0.6850 | 0.1662 | 0.4741 | 0.9393 | 0.6425 | 0.579 | 0.6866 | 0.0009 | - | +| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.3487 | 0.0009 | 0.9593 | 0.0069 | 0.7939 | 0.7416 | 0.1531 | 0.5089 | 0.9538 | 0.5833 | 0.5272 | 0.6908 | 0.0009 | - | +| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.4842 | 0.4589 | 0.9581 | 0.0067 | 0.7518 | 0.7517 | 0.2067 | 0.5239 | 0.9575 | 0.5892 | 0.5018 | 0.6461 | 0.0009 | - | ### Test @@ -966,35 +966,35 @@ Protocol: image-level labels are derived from predicted and GT segmentation maps #### Methods related to vision foundation models -| status | model | backbone | loss | cp | cr | cf1 | op | or | of1 | map | macro_f1 | micro_f1 | sample_f1 | -|:----------|:---------|:------------------------------------------|:---------------------------|:-------|:-------|:-------|:-------|:-------|:-------|:-------|:-----------|:-----------|:------------| -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.3647 | 0.6824 | 0.4754 | 0.4954 | 0.9257 | 0.6455 | 0.4749 | 0.5098 | 0.6455 | 0.6488 | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.3280 | 0.7370 | 0.4540 | 0.4455 | 0.9243 | 0.6012 | 0.4625 | 0.4226 | 0.6012 | 0.5995 | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.3846 | 0.6560 | 0.4849 | 0.5066 | 0.9178 | 0.6529 | 0.4821 | 0.5258 | 0.6529 | 0.6623 | -| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.5300 | 0.5205 | 0.5252 | 0.7355 | 0.7214 | 0.7284 | 0.4666 | 0.6442 | 0.7284 | 0.7352 | -| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.5355 | 0.5312 | 0.5334 | 0.7243 | 0.7374 | 0.7308 | 0.4615 | 0.6571 | 0.7308 | 0.7269 | -| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.4921 | 0.5071 | 0.4995 | 0.7213 | 0.7331 | 0.7271 | 0.4528 | 0.6172 | 0.7271 | 0.7409 | -| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4799 | 0.5933 | 0.5306 | 0.6829 | 0.7843 | 0.7301 | 0.4944 | 0.6442 | 0.7301 | 0.7384 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.3745 | 0.6554 | 0.4767 | 0.5165 | 0.9060 | 0.6579 | 0.4621 | 0.5117 | 0.6579 | 0.6603 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.3157 | 0.7515 | 0.4446 | 0.4238 | 0.9081 | 0.5779 | 0.4107 | 0.4031 | 0.5779 | 0.5986 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.3508 | 0.6742 | 0.4615 | 0.4933 | 0.9156 | 0.6412 | 0.4541 | 0.4904 | 0.6412 | 0.6411 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.4654 | 0.5394 | 0.4996 | 0.6785 | 0.7464 | 0.7108 | 0.4595 | 0.6116 | 0.7108 | 0.7148 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.4270 | 0.6527 | 0.5163 | 0.6359 | 0.7738 | 0.6981 | 0.4850 | 0.5313 | 0.6981 | 0.7258 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.4484 | 0.5770 | 0.5046 | 0.6897 | 0.7728 | 0.7289 | 0.4640 | 0.6143 | 0.7289 | 0.7440 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.4322 | 0.6280 | 0.5121 | 0.6393 | 0.8147 | 0.7164 | 0.5046 | 0.6171 | 0.7164 | 0.7400 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.4842 | 0.7614 | 0.5920 | 0.6559 | 0.8140 | 0.7264 | 0.5869 | 0.5666 | 0.7264 | 0.7512 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.5499 | 0.6354 | 0.5896 | 0.7046 | 0.8230 | 0.7592 | 0.5454 | 0.6147 | 0.7592 | 0.7843 | -| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.5133 | 0.5665 | 0.5386 | 0.7381 | 0.7526 | 0.7453 | 0.5240 | 0.6678 | 0.7453 | 0.7725 | -| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.4574 | 0.6230 | 0.5275 | 0.6502 | 0.7846 | 0.7111 | 0.5218 | 0.6394 | 0.7111 | 0.7161 | -| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.5660 | 0.6809 | 0.6181 | 0.7081 | 0.7544 | 0.7305 | 0.5983 | 0.6064 | 0.7305 | 0.7553 | -| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.5193 | 0.5399 | 0.5294 | 0.7338 | 0.7367 | 0.7353 | 0.4916 | 0.6593 | 0.7353 | 0.7460 | -| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.4616 | 0.5574 | 0.5050 | 0.6664 | 0.7606 | 0.7104 | 0.4664 | 0.6238 | 0.7104 | 0.7155 | -| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.4261 | 0.6917 | 0.5273 | 0.6085 | 0.8824 | 0.7203 | 0.5617 | 0.6430 | 0.7203 | 0.7340 | -| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.4344 | 0.8610 | 0.5774 | 0.5777 | 0.8897 | 0.7005 | 0.6645 | 0.5444 | 0.7005 | 0.7203 | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | - | - | - | - | - | - | - | - | - | - | -| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.5221 | 0.6390 | 0.5747 | 0.6912 | 0.8521 | 0.7633 | 0.5646 | 0.7105 | 0.7633 | 0.7838 | -| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.4633 | 0.6671 | 0.5468 | 0.6343 | 0.8535 | 0.7278 | 0.5612 | 0.6704 | 0.7278 | 0.7533 | -| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.4444 | 0.7464 | 0.5571 | 0.6075 | 0.8561 | 0.7107 | 0.5828 | 0.5893 | 0.7107 | 0.7314 | +| status | model | backbone | loss | cp | cr | cf1 | op | or | of1 | map | macro_f1 | micro_f1 | sample_f1 | +|:----------|:---------|:------------------------------------------|:---------------------------|-------:|-------:|-------:|-------:|-------:|-------:|-------:|-----------:|-----------:|------------:| +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.3647 | 0.6824 | 0.4754 | 0.4954 | 0.9257 | 0.6455 | 0.4749 | 0.5098 | 0.6455 | 0.6488 | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.328 | 0.737 | 0.454 | 0.4455 | 0.9243 | 0.6012 | 0.4625 | 0.4226 | 0.6012 | 0.5995 | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.3846 | 0.656 | 0.4849 | 0.5066 | 0.9178 | 0.6529 | 0.4821 | 0.5258 | 0.6529 | 0.6623 | +| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.53 | 0.5205 | 0.5252 | 0.7355 | 0.7214 | 0.7284 | 0.4666 | 0.6442 | 0.7284 | 0.7352 | +| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.5355 | 0.5312 | 0.5334 | 0.7243 | 0.7374 | 0.7308 | 0.4615 | 0.6571 | 0.7308 | 0.7269 | +| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.4921 | 0.5071 | 0.4995 | 0.7213 | 0.7331 | 0.7271 | 0.4528 | 0.6172 | 0.7271 | 0.7409 | +| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4799 | 0.5933 | 0.5306 | 0.6829 | 0.7843 | 0.7301 | 0.4944 | 0.6442 | 0.7301 | 0.7384 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.3745 | 0.6554 | 0.4767 | 0.5165 | 0.906 | 0.6579 | 0.4621 | 0.5117 | 0.6579 | 0.6603 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.3157 | 0.7515 | 0.4446 | 0.4238 | 0.9081 | 0.5779 | 0.4107 | 0.4031 | 0.5779 | 0.5986 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.3508 | 0.6742 | 0.4615 | 0.4933 | 0.9156 | 0.6412 | 0.4541 | 0.4904 | 0.6412 | 0.6411 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.4654 | 0.5394 | 0.4996 | 0.6785 | 0.7464 | 0.7108 | 0.4595 | 0.6116 | 0.7108 | 0.7148 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.427 | 0.6527 | 0.5163 | 0.6359 | 0.7738 | 0.6981 | 0.485 | 0.5313 | 0.6981 | 0.7258 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.4484 | 0.577 | 0.5046 | 0.6897 | 0.7728 | 0.7289 | 0.464 | 0.6143 | 0.7289 | 0.744 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.4322 | 0.628 | 0.5121 | 0.6393 | 0.8147 | 0.7164 | 0.5046 | 0.6171 | 0.7164 | 0.74 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.4842 | 0.7614 | 0.592 | 0.6559 | 0.814 | 0.7264 | 0.5869 | 0.5666 | 0.7264 | 0.7512 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.5499 | 0.6354 | 0.5896 | 0.7046 | 0.823 | 0.7592 | 0.5454 | 0.6147 | 0.7592 | 0.7843 | +| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.5133 | 0.5665 | 0.5386 | 0.7381 | 0.7526 | 0.7453 | 0.524 | 0.6678 | 0.7453 | 0.7725 | +| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.4574 | 0.623 | 0.5275 | 0.6502 | 0.7846 | 0.7111 | 0.5218 | 0.6394 | 0.7111 | 0.7161 | +| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.566 | 0.6809 | 0.6181 | 0.7081 | 0.7544 | 0.7305 | 0.5983 | 0.6064 | 0.7305 | 0.7553 | +| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.5193 | 0.5399 | 0.5294 | 0.7338 | 0.7367 | 0.7353 | 0.4916 | 0.6593 | 0.7353 | 0.746 | +| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.4616 | 0.5574 | 0.505 | 0.6664 | 0.7606 | 0.7104 | 0.4664 | 0.6238 | 0.7104 | 0.7155 | +| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.4261 | 0.6917 | 0.5273 | 0.6085 | 0.8824 | 0.7203 | 0.5617 | 0.643 | 0.7203 | 0.734 | +| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.4344 | 0.861 | 0.5774 | 0.5777 | 0.8897 | 0.7005 | 0.6645 | 0.5444 | 0.7005 | 0.7203 | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | 0.4458 | 0.8443 | 0.5835 | 0.586 | 0.8794 | 0.7033 | 0.6557 | 0.5535 | 0.7033 | 0.7236 | +| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.5221 | 0.639 | 0.5747 | 0.6912 | 0.8521 | 0.7633 | 0.5646 | 0.7105 | 0.7633 | 0.7838 | +| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.4633 | 0.6671 | 0.5468 | 0.6343 | 0.8535 | 0.7278 | 0.5612 | 0.6704 | 0.7278 | 0.7533 | +| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.4444 | 0.7464 | 0.5571 | 0.6075 | 0.8561 | 0.7107 | 0.5828 | 0.5893 | 0.7107 | 0.7314 | #### Test per-class precision @@ -1066,35 +1066,35 @@ Protocol: image-level labels are derived from predicted and GT segmentation maps ##### Methods related to vision foundation models -| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | -|:----------|:---------|:------------------------------------------|:---------------------------|:-----------|:--------------|:-----------------|:------------------|:---------------|:--------------------|:-----------------|:----------------|:--------|:--------------|:--------------|:--------------|:---------|:-----------| -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.1642 | 0.2628 | 0.7596 | 0.0000 | 0.6915 | 0.0932 | 0.0000 | 0.3299 | 0.0000 | 0.4504 | 0.3656 | 0.5303 | 0.0000 | 0.0000 | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.1097 | 0.0752 | 0.7819 | 0.0000 | 0.7005 | 0.0484 | 0.0000 | 0.2468 | 0.0000 | 0.3989 | 0.3780 | 0.5331 | 0.0078 | 0.0000 | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.2821 | 0.2330 | 0.7806 | 0.0000 | 0.7276 | 0.0956 | 0.0000 | 0.3904 | 0.0000 | 0.4500 | 0.3719 | 0.5143 | 0.0000 | 0.0000 | -| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.4260 | 0.0000 | 0.8795 | 0.0000 | 0.8971 | 0.3010 | 0.0000 | 0.8786 | 0.0000 | 0.7204 | 0.5090 | 0.6879 | 0.0000 | 0.0000 | -| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.5424 | 0.0000 | 0.8576 | 0.0000 | 0.8970 | 0.3295 | 0.0000 | 0.8533 | 0.0000 | 0.6987 | 0.5005 | 0.6764 | 0.0000 | 0.0000 | -| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.5833 | 0.0000 | 0.8558 | 0.0000 | 0.8432 | 0.2320 | 0.0000 | 0.4288 | 0.0000 | 0.7416 | 0.5724 | 0.6635 | 0.0000 | 0.0000 | -| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.3704 | 0.0000 | 0.8420 | 0.0000 | 0.8471 | 0.1822 | 0.0000 | 0.6568 | 0.0000 | 0.7283 | 0.5458 | 0.6267 | 0.0000 | 0.0000 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.1826 | 0.2879 | 0.7338 | 0.0000 | 0.7313 | 0.1422 | 0.0000 | 0.2540 | 0.0000 | 0.4758 | 0.4148 | 0.5228 | 0.0000 | 0.0000 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.0425 | 0.0387 | 0.7292 | 0.0000 | 0.7062 | 0.0470 | 0.0000 | 0.2082 | 0.0000 | 0.4253 | 0.4150 | 0.5260 | 0.0185 | 0.0000 | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.0918 | 0.2706 | 0.7267 | 0.0000 | 0.7112 | 0.0637 | 0.0000 | 0.3047 | 0.0000 | 0.4282 | 0.4006 | 0.5104 | 0.0000 | 0.0000 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.3894 | 0.0000 | 0.8472 | 0.0000 | 0.8654 | 0.3226 | 0.0000 | 0.3635 | 0.0000 | 0.7393 | 0.4823 | 0.6439 | 0.0000 | 0.0000 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.1896 | 0.1053 | 0.8089 | 0.0000 | 0.8472 | 0.1454 | 0.0000 | 0.2988 | 0.0000 | 0.6884 | 0.5393 | 0.6472 | 0.0000 | 0.0000 | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.2987 | 0.0000 | 0.8236 | 0.0000 | 0.8752 | 0.2180 | 0.0000 | 0.4111 | 0.0000 | 0.6653 | 0.5497 | 0.6423 | 0.0000 | 0.0000 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.3065 | 0.0000 | 0.7871 | 0.0000 | 0.8696 | 0.2297 | 0.0000 | 0.2873 | 0.0000 | 0.6841 | 0.5050 | 0.6531 | 0.0000 | 0.0000 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.3820 | 0.1764 | 0.8387 | 0.0000 | 0.8184 | 0.2743 | 0.0000 | 0.3753 | 0.0000 | 0.6305 | 0.5225 | 0.6682 | 0.1559 | 0.0000 | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.2515 | 0.7647 | 0.7850 | 0.0000 | 0.8595 | 0.4046 | 0.0000 | 0.4709 | 0.0000 | 0.7151 | 0.5746 | 0.6732 | 0.0000 | 0.0000 | -| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.5446 | 0.0000 | 0.8812 | 0.0000 | 0.8828 | 0.3282 | 0.0000 | 0.5233 | 0.0000 | 0.6938 | 0.5248 | 0.7544 | 0.0000 | 0.0000 | -| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.5019 | 0.0000 | 0.8541 | 0.0000 | 0.8905 | 0.2329 | 0.0000 | 0.3482 | 0.0000 | 0.6271 | 0.4995 | 0.6197 | 0.0000 | 0.0000 | -| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.5229 | 0.4379 | 0.8741 | 0.0000 | 0.8896 | 0.3430 | 0.0000 | 0.4421 | 0.0000 | 0.6800 | 0.5329 | 0.7083 | 0.2289 | 0.0000 | -| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.5744 | 0.0000 | 0.8760 | 0.0000 | 0.9030 | 0.2948 | 0.0000 | 0.6229 | 0.0000 | 0.7017 | 0.5000 | 0.7207 | 0.0000 | 0.0000 | -| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.3295 | 0.0000 | 0.8389 | 0.0000 | 0.8222 | 0.3500 | 0.0000 | 0.4527 | 0.0000 | 0.6768 | 0.5114 | 0.6348 | 0.0000 | 0.0000 | -| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.3796 | 0.0000 | 0.7491 | 0.0000 | 0.7905 | 0.1939 | 0.0000 | 0.4111 | 0.0000 | 0.6528 | 0.4595 | 0.6242 | 0.0000 | 0.0000 | -| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.2440 | 0.1799 | 0.7769 | 0.0000 | 0.8181 | 0.2000 | 0.0000 | 0.3526 | 0.0000 | 0.5895 | 0.4553 | 0.5858 | 0.1417 | 0.0000 | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | - | - | - | - | - | - | - | - | - | - | - | - | - | - | -| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.5664 | 0.0000 | 0.7863 | 0.0000 | 0.8405 | 0.6527 | 0.0000 | 0.4908 | 0.0000 | 0.6953 | 0.5353 | 0.6537 | 0.0000 | 0.0000 | -| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.3989 | 0.0000 | 0.8331 | 0.0000 | 0.8574 | 0.3754 | 0.0000 | 0.3989 | 0.0000 | 0.6343 | 0.5154 | 0.6196 | 0.0000 | 0.0000 | -| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.2264 | 0.3356 | 0.8400 | 0.0000 | 0.8748 | 0.1943 | 0.0000 | 0.2942 | 0.0000 | 0.5882 | 0.4869 | 0.6031 | 0.0000 | 0.0000 | +| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | +|:----------|:---------|:------------------------------------------|:---------------------------|-----------:|--------------:|-----------------:|------------------:|---------------:|--------------------:|-----------------:|----------------:|--------:|--------------:|--------------:|--------------:|---------:|-----------:| +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.1642 | 0.2628 | 0.7596 | 0 | 0.6915 | 0.0932 | 0 | 0.3299 | 0 | 0.4504 | 0.3656 | 0.5303 | 0 | 0 | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.1097 | 0.0752 | 0.7819 | 0 | 0.7005 | 0.0484 | 0 | 0.2468 | 0 | 0.3989 | 0.378 | 0.5331 | 0.0078 | 0 | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.2821 | 0.233 | 0.7806 | 0 | 0.7276 | 0.0956 | 0 | 0.3904 | 0 | 0.45 | 0.3719 | 0.5143 | 0 | 0 | +| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.426 | 0 | 0.8795 | 0 | 0.8971 | 0.301 | 0 | 0.8786 | 0 | 0.7204 | 0.509 | 0.6879 | 0 | 0 | +| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.5424 | 0 | 0.8576 | 0 | 0.897 | 0.3295 | 0 | 0.8533 | 0 | 0.6987 | 0.5005 | 0.6764 | 0 | 0 | +| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.5833 | 0 | 0.8558 | 0 | 0.8432 | 0.232 | 0 | 0.4288 | 0 | 0.7416 | 0.5724 | 0.6635 | 0 | 0 | +| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.3704 | 0 | 0.842 | 0 | 0.8471 | 0.1822 | 0 | 0.6568 | 0 | 0.7283 | 0.5458 | 0.6267 | 0 | 0 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.1826 | 0.2879 | 0.7338 | 0 | 0.7313 | 0.1422 | 0 | 0.254 | 0 | 0.4758 | 0.4148 | 0.5228 | 0 | 0 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.0425 | 0.0387 | 0.7292 | 0 | 0.7062 | 0.047 | 0 | 0.2082 | 0 | 0.4253 | 0.415 | 0.526 | 0.0185 | 0 | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.0918 | 0.2706 | 0.7267 | 0 | 0.7112 | 0.0637 | 0 | 0.3047 | 0 | 0.4282 | 0.4006 | 0.5104 | 0 | 0 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.3894 | 0 | 0.8472 | 0 | 0.8654 | 0.3226 | 0 | 0.3635 | 0 | 0.7393 | 0.4823 | 0.6439 | 0 | 0 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.1896 | 0.1053 | 0.8089 | 0 | 0.8472 | 0.1454 | 0 | 0.2988 | 0 | 0.6884 | 0.5393 | 0.6472 | 0 | 0 | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.2987 | 0 | 0.8236 | 0 | 0.8752 | 0.218 | 0 | 0.4111 | 0 | 0.6653 | 0.5497 | 0.6423 | 0 | 0 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.3065 | 0 | 0.7871 | 0 | 0.8696 | 0.2297 | 0 | 0.2873 | 0 | 0.6841 | 0.505 | 0.6531 | 0 | 0 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.382 | 0.1764 | 0.8387 | 0 | 0.8184 | 0.2743 | 0 | 0.3753 | 0 | 0.6305 | 0.5225 | 0.6682 | 0.1559 | 0 | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.2515 | 0.7647 | 0.785 | 0 | 0.8595 | 0.4046 | 0 | 0.4709 | 0 | 0.7151 | 0.5746 | 0.6732 | 0 | 0 | +| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.5446 | 0 | 0.8812 | 0 | 0.8828 | 0.3282 | 0 | 0.5233 | 0 | 0.6938 | 0.5248 | 0.7544 | 0 | 0 | +| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.5019 | 0 | 0.8541 | 0 | 0.8905 | 0.2329 | 0 | 0.3482 | 0 | 0.6271 | 0.4995 | 0.6197 | 0 | 0 | +| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.5229 | 0.4379 | 0.8741 | 0 | 0.8896 | 0.343 | 0 | 0.4421 | 0 | 0.68 | 0.5329 | 0.7083 | 0.2289 | 0 | +| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.5744 | 0 | 0.876 | 0 | 0.903 | 0.2948 | 0 | 0.6229 | 0 | 0.7017 | 0.5 | 0.7207 | 0 | 0 | +| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.3295 | 0 | 0.8389 | 0 | 0.8222 | 0.35 | 0 | 0.4527 | 0 | 0.6768 | 0.5114 | 0.6348 | 0 | 0 | +| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.3796 | 0 | 0.7491 | 0 | 0.7905 | 0.1939 | 0 | 0.4111 | 0 | 0.6528 | 0.4595 | 0.6242 | 0 | 0 | +| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.244 | 0.1799 | 0.7769 | 0 | 0.8181 | 0.2 | 0 | 0.3526 | 0 | 0.5895 | 0.4553 | 0.5858 | 0.1417 | 0 | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | 0.3733 | 0.1513 | 0.7528 | 0 | 0.7911 | 0.1688 | 0 | 0.3331 | 0 | 0.6184 | 0.4654 | 0.6391 | 0.1649 | 0 | +| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.5664 | 0 | 0.7863 | 0 | 0.8405 | 0.6527 | 0 | 0.4908 | 0 | 0.6953 | 0.5353 | 0.6537 | 0 | 0 | +| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.3989 | 0 | 0.8331 | 0 | 0.8574 | 0.3754 | 0 | 0.3989 | 0 | 0.6343 | 0.5154 | 0.6196 | 0 | 0 | +| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.2264 | 0.3356 | 0.84 | 0 | 0.8748 | 0.1943 | 0 | 0.2942 | 0 | 0.5882 | 0.4869 | 0.6031 | 0 | 0 | #### Test per-class recall @@ -1165,35 +1165,35 @@ Protocol: image-level labels are derived from predicted and GT segmentation maps ##### Methods related to vision foundation models -| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | -|:----------|:---------|:------------------------------------------|:---------------------------|:-----------|:--------------|:-----------------|:------------------|:---------------|:--------------------|:-----------------|:----------------|:--------|:--------------|:--------------|:--------------|:---------|:-----------| -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.6865 | 0.2867 | 0.9189 | - | 0.9585 | 0.4664 | - | 0.6606 | - | 0.9328 | 0.9600 | 0.9539 | 0.0000 | - | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.6708 | 0.5315 | 0.9004 | - | 0.9443 | 0.6462 | - | 0.8055 | - | 0.9615 | 0.9401 | 0.9482 | 0.0213 | - | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.6270 | 0.2867 | 0.9137 | - | 0.9473 | 0.3918 | - | 0.5443 | - | 0.9342 | 0.9527 | 0.9622 | 0.0000 | - | -| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.5256 | 0.0000 | 0.6920 | - | 0.8414 | 0.5044 | - | 0.5263 | - | 0.6798 | 0.6253 | 0.8097 | 0.0000 | - | -| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.6614 | 0.0000 | 0.7480 | - | 0.7663 | 0.3816 | - | 0.5300 | - | 0.7055 | 0.6713 | 0.8477 | 0.0000 | - | -| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.4828 | 0.0000 | 0.8219 | - | 0.7975 | 0.2822 | - | 0.7031 | - | 0.5805 | 0.6039 | 0.7995 | 0.0000 | - | -| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.6364 | 0.0000 | 0.8008 | - | 0.8451 | 0.6784 | - | 0.7047 | - | 0.6804 | 0.6922 | 0.8956 | 0.0000 | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.7429 | 0.2657 | 0.9516 | - | 0.8607 | 0.1871 | - | 0.7610 | - | 0.9362 | 0.8880 | 0.9611 | 0.0000 | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.8715 | 0.6923 | 0.9483 | - | 0.8569 | 0.3670 | - | 0.8744 | - | 0.9674 | 0.8400 | 0.9589 | 0.1383 | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.7962 | 0.3217 | 0.9580 | - | 0.8732 | 0.2354 | - | 0.7396 | - | 0.9611 | 0.8887 | 0.9684 | 0.0000 | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.6677 | 0.0000 | 0.7863 | - | 0.7587 | 0.2939 | - | 0.6930 | - | 0.6469 | 0.7110 | 0.8362 | 0.0000 | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.6426 | 0.7832 | 0.8553 | - | 0.8189 | 0.6023 | - | 0.6968 | - | 0.6978 | 0.5801 | 0.8499 | 0.0000 | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.7304 | 0.0000 | 0.8626 | - | 0.7851 | 0.4985 | - | 0.7333 | - | 0.7674 | 0.5350 | 0.8580 | 0.0000 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.7524 | 0.0000 | 0.8379 | - | 0.8443 | 0.6067 | - | 0.8694 | - | 0.7665 | 0.7069 | 0.8961 | 0.0000 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.7962 | 0.8462 | 0.8273 | - | 0.8847 | 0.6608 | - | 0.8492 | - | 0.8435 | 0.6133 | 0.8567 | 0.4362 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.8025 | 0.1818 | 0.9151 | - | 0.8675 | 0.5453 | - | 0.7812 | - | 0.7501 | 0.6202 | 0.8901 | 0.0000 | - | -| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.6897 | 0.0000 | 0.7552 | - | 0.8895 | 0.4708 | - | 0.7871 | - | 0.6587 | 0.5646 | 0.8499 | 0.0000 | - | -| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.8213 | 0.0000 | 0.7625 | - | 0.8136 | 0.5921 | - | 0.8908 | - | 0.8408 | 0.6081 | 0.9010 | 0.0000 | - | -| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.7524 | 0.4685 | 0.7842 | - | 0.8521 | 0.5556 | - | 0.8543 | - | 0.7668 | 0.4680 | 0.8182 | 0.4894 | - | -| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.6050 | 0.0000 | 0.7599 | - | 0.8284 | 0.3991 | - | 0.7430 | - | 0.7294 | 0.5424 | 0.7921 | 0.0000 | - | -| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.6364 | 0.0000 | 0.7913 | - | 0.7884 | 0.4401 | - | 0.6888 | - | 0.7237 | 0.6612 | 0.8445 | 0.0000 | - | -| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.9231 | 0.0000 | 0.8827 | - | 0.9247 | 0.6770 | - | 0.8979 | - | 0.8471 | 0.8181 | 0.9460 | 0.0000 | - | -| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.9561 | 0.7133 | 0.8817 | - | 0.9115 | 0.6915 | - | 0.9030 | - | 0.8808 | 0.8436 | 0.9347 | 0.8936 | - | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | - | - | - | - | - | - | - | - | - | - | - | - | - | - | -| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.8025 | 0.0000 | 0.8812 | - | 0.9131 | 0.5000 | - | 0.8442 | - | 0.8116 | 0.7333 | 0.9041 | 0.0000 | - | -| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.9216 | 0.0000 | 0.8222 | - | 0.9145 | 0.5789 | - | 0.8795 | - | 0.8548 | 0.7759 | 0.9236 | 0.0000 | - | -| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.9467 | 0.6783 | 0.8294 | - | 0.8701 | 0.6213 | - | 0.9147 | - | 0.9227 | 0.7654 | 0.9154 | 0.0000 | - | +| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | +|:----------|:---------|:------------------------------------------|:---------------------------|-----------:|--------------:|-----------------:|:------------------|---------------:|--------------------:|:-----------------|----------------:|:--------|--------------:|--------------:|--------------:|---------:|:-----------| +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.6865 | 0.2867 | 0.9189 | - | 0.9585 | 0.4664 | - | 0.6606 | - | 0.9328 | 0.96 | 0.9539 | 0 | - | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.6708 | 0.5315 | 0.9004 | - | 0.9443 | 0.6462 | - | 0.8055 | - | 0.9615 | 0.9401 | 0.9482 | 0.0213 | - | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.627 | 0.2867 | 0.9137 | - | 0.9473 | 0.3918 | - | 0.5443 | - | 0.9342 | 0.9527 | 0.9622 | 0 | - | +| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.5256 | 0 | 0.692 | - | 0.8414 | 0.5044 | - | 0.5263 | - | 0.6798 | 0.6253 | 0.8097 | 0 | - | +| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.6614 | 0 | 0.748 | - | 0.7663 | 0.3816 | - | 0.53 | - | 0.7055 | 0.6713 | 0.8477 | 0 | - | +| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.4828 | 0 | 0.8219 | - | 0.7975 | 0.2822 | - | 0.7031 | - | 0.5805 | 0.6039 | 0.7995 | 0 | - | +| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.6364 | 0 | 0.8008 | - | 0.8451 | 0.6784 | - | 0.7047 | - | 0.6804 | 0.6922 | 0.8956 | 0 | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.7429 | 0.2657 | 0.9516 | - | 0.8607 | 0.1871 | - | 0.761 | - | 0.9362 | 0.888 | 0.9611 | 0 | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.8715 | 0.6923 | 0.9483 | - | 0.8569 | 0.367 | - | 0.8744 | - | 0.9674 | 0.84 | 0.9589 | 0.1383 | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.7962 | 0.3217 | 0.958 | - | 0.8732 | 0.2354 | - | 0.7396 | - | 0.9611 | 0.8887 | 0.9684 | 0 | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.6677 | 0 | 0.7863 | - | 0.7587 | 0.2939 | - | 0.693 | - | 0.6469 | 0.711 | 0.8362 | 0 | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.6426 | 0.7832 | 0.8553 | - | 0.8189 | 0.6023 | - | 0.6968 | - | 0.6978 | 0.5801 | 0.8499 | 0 | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.7304 | 0 | 0.8626 | - | 0.7851 | 0.4985 | - | 0.7333 | - | 0.7674 | 0.535 | 0.858 | 0 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.7524 | 0 | 0.8379 | - | 0.8443 | 0.6067 | - | 0.8694 | - | 0.7665 | 0.7069 | 0.8961 | 0 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.7962 | 0.8462 | 0.8273 | - | 0.8847 | 0.6608 | - | 0.8492 | - | 0.8435 | 0.6133 | 0.8567 | 0.4362 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.8025 | 0.1818 | 0.9151 | - | 0.8675 | 0.5453 | - | 0.7812 | - | 0.7501 | 0.6202 | 0.8901 | 0 | - | +| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.6897 | 0 | 0.7552 | - | 0.8895 | 0.4708 | - | 0.7871 | - | 0.6587 | 0.5646 | 0.8499 | 0 | - | +| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.8213 | 0 | 0.7625 | - | 0.8136 | 0.5921 | - | 0.8908 | - | 0.8408 | 0.6081 | 0.901 | 0 | - | +| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.7524 | 0.4685 | 0.7842 | - | 0.8521 | 0.5556 | - | 0.8543 | - | 0.7668 | 0.468 | 0.8182 | 0.4894 | - | +| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.605 | 0 | 0.7599 | - | 0.8284 | 0.3991 | - | 0.743 | - | 0.7294 | 0.5424 | 0.7921 | 0 | - | +| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.6364 | 0 | 0.7913 | - | 0.7884 | 0.4401 | - | 0.6888 | - | 0.7237 | 0.6612 | 0.8445 | 0 | - | +| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.9231 | 0 | 0.8827 | - | 0.9247 | 0.677 | - | 0.8979 | - | 0.8471 | 0.8181 | 0.946 | 0 | - | +| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.9561 | 0.7133 | 0.8817 | - | 0.9115 | 0.6915 | - | 0.903 | - | 0.8808 | 0.8436 | 0.9347 | 0.8936 | - | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | 0.9467 | 0.9301 | 0.8703 | - | 0.9288 | 0.7471 | - | 0.9311 | - | 0.866 | 0.7976 | 0.9149 | 0.5106 | - | +| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.8025 | 0 | 0.8812 | - | 0.9131 | 0.5 | - | 0.8442 | - | 0.8116 | 0.7333 | 0.9041 | 0 | - | +| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.9216 | 0 | 0.8222 | - | 0.9145 | 0.5789 | - | 0.8795 | - | 0.8548 | 0.7759 | 0.9236 | 0 | - | +| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.9467 | 0.6783 | 0.8294 | - | 0.8701 | 0.6213 | - | 0.9147 | - | 0.9227 | 0.7654 | 0.9154 | 0 | - | #### Test per-class f1 @@ -1264,35 +1264,35 @@ Protocol: image-level labels are derived from predicted and GT segmentation maps ##### Methods related to vision foundation models -| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | -|:----------|:---------|:------------------------------------------|:---------------------------|:-----------|:--------------|:-----------------|:------------------|:---------------|:--------------------|:-----------------|:----------------|:--------|:--------------|:--------------|:--------------|:---------|:-----------| -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.2650 | 0.2742 | 0.8317 | - | 0.8034 | 0.1554 | - | 0.4401 | - | 0.6075 | 0.5295 | 0.6816 | - | - | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.1885 | 0.1317 | 0.8370 | - | 0.8043 | 0.0900 | - | 0.3779 | - | 0.5638 | 0.5392 | 0.6825 | 0.0114 | - | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.3891 | 0.2571 | 0.8420 | - | 0.8230 | 0.1538 | - | 0.4547 | - | 0.6074 | 0.5350 | 0.6704 | - | - | -| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.4706 | - | 0.7746 | - | 0.8683 | 0.3770 | - | 0.6583 | - | 0.6995 | 0.5612 | 0.7438 | - | - | -| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.5960 | - | 0.7991 | - | 0.8265 | 0.3537 | - | 0.6539 | - | 0.7021 | 0.5735 | 0.7524 | - | - | -| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.5283 | - | 0.8385 | - | 0.8197 | 0.2546 | - | 0.5327 | - | 0.6512 | 0.5877 | 0.7252 | - | - | -| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4683 | - | 0.8209 | - | 0.8461 | 0.2873 | - | 0.6799 | - | 0.7035 | 0.6103 | 0.7374 | - | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.2931 | 0.2764 | 0.8286 | - | 0.7907 | 0.1616 | - | 0.3809 | - | 0.6310 | 0.5655 | 0.6772 | - | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.0811 | 0.0733 | 0.8244 | - | 0.7743 | 0.0833 | - | 0.3363 | - | 0.5908 | 0.5555 | 0.6794 | 0.0327 | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.1646 | 0.2939 | 0.8265 | - | 0.7839 | 0.1003 | - | 0.4316 | - | 0.5924 | 0.5522 | 0.6685 | - | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.4919 | - | 0.8156 | - | 0.8086 | 0.3076 | - | 0.4769 | - | 0.6901 | 0.5747 | 0.7276 | - | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.2929 | 0.1856 | 0.8314 | - | 0.8328 | 0.2342 | - | 0.4182 | - | 0.6931 | 0.5589 | 0.7348 | - | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.4240 | - | 0.8426 | - | 0.8277 | 0.3034 | - | 0.5269 | - | 0.7127 | 0.5422 | 0.7347 | - | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.4356 | - | 0.8117 | - | 0.8568 | 0.3332 | - | 0.4318 | - | 0.7229 | 0.5892 | 0.7556 | - | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.5163 | 0.2919 | 0.8330 | - | 0.8503 | 0.3877 | - | 0.5205 | - | 0.7216 | 0.5643 | 0.7508 | 0.2297 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.3829 | 0.2938 | 0.8451 | - | 0.8635 | 0.4645 | - | 0.5876 | - | 0.7322 | 0.5965 | 0.7666 | - | - | -| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.6086 | - | 0.8133 | - | 0.8861 | 0.3868 | - | 0.6286 | - | 0.6758 | 0.5440 | 0.7993 | - | - | -| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.6231 | - | 0.8057 | - | 0.8503 | 0.3343 | - | 0.5007 | - | 0.7184 | 0.5485 | 0.7344 | - | - | -| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.6170 | 0.4527 | 0.8267 | - | 0.8704 | 0.4241 | - | 0.5826 | - | 0.7208 | 0.4983 | 0.7593 | 0.3119 | - | -| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.5893 | - | 0.8138 | - | 0.8641 | 0.3391 | - | 0.6776 | - | 0.7153 | 0.5203 | 0.7547 | - | - | -| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.4342 | - | 0.8144 | - | 0.8050 | 0.3899 | - | 0.5463 | - | 0.6995 | 0.5767 | 0.7248 | - | - | -| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.5380 | - | 0.8104 | - | 0.8524 | 0.3014 | - | 0.5640 | - | 0.7374 | 0.5885 | 0.7521 | - | - | -| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.3888 | 0.2873 | 0.8260 | - | 0.8623 | 0.3103 | - | 0.5072 | - | 0.7063 | 0.5914 | 0.7202 | 0.2445 | - | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | - | - | - | - | - | - | - | - | - | - | - | - | - | - | -| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.6641 | - | 0.8310 | - | 0.8753 | 0.5662 | - | 0.6208 | - | 0.7490 | 0.6188 | 0.7588 | - | - | -| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.5568 | - | 0.8276 | - | 0.8850 | 0.4554 | - | 0.5489 | - | 0.7282 | 0.6194 | 0.7417 | - | - | -| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.3654 | 0.4491 | 0.8347 | - | 0.8724 | 0.2961 | - | 0.4452 | - | 0.7184 | 0.5952 | 0.7271 | - | - | +| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | +|:----------|:---------|:------------------------------------------|:---------------------------|-----------:|:--------------|-----------------:|:------------------|---------------:|--------------------:|:-----------------|----------------:|:--------|--------------:|--------------:|--------------:|:---------|:-----------| +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.265 | 0.2742 | 0.8317 | - | 0.8034 | 0.1554 | - | 0.4401 | - | 0.6075 | 0.5295 | 0.6816 | - | - | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.1885 | 0.1317 | 0.837 | - | 0.8043 | 0.09 | - | 0.3779 | - | 0.5638 | 0.5392 | 0.6825 | 0.0114 | - | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.3891 | 0.2571 | 0.842 | - | 0.823 | 0.1538 | - | 0.4547 | - | 0.6074 | 0.535 | 0.6704 | - | - | +| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.4706 | - | 0.7746 | - | 0.8683 | 0.377 | - | 0.6583 | - | 0.6995 | 0.5612 | 0.7438 | - | - | +| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.596 | - | 0.7991 | - | 0.8265 | 0.3537 | - | 0.6539 | - | 0.7021 | 0.5735 | 0.7524 | - | - | +| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.5283 | - | 0.8385 | - | 0.8197 | 0.2546 | - | 0.5327 | - | 0.6512 | 0.5877 | 0.7252 | - | - | +| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4683 | - | 0.8209 | - | 0.8461 | 0.2873 | - | 0.6799 | - | 0.7035 | 0.6103 | 0.7374 | - | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.2931 | 0.2764 | 0.8286 | - | 0.7907 | 0.1616 | - | 0.3809 | - | 0.631 | 0.5655 | 0.6772 | - | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.0811 | 0.0733 | 0.8244 | - | 0.7743 | 0.0833 | - | 0.3363 | - | 0.5908 | 0.5555 | 0.6794 | 0.0327 | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.1646 | 0.2939 | 0.8265 | - | 0.7839 | 0.1003 | - | 0.4316 | - | 0.5924 | 0.5522 | 0.6685 | - | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.4919 | - | 0.8156 | - | 0.8086 | 0.3076 | - | 0.4769 | - | 0.6901 | 0.5747 | 0.7276 | - | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.2929 | 0.1856 | 0.8314 | - | 0.8328 | 0.2342 | - | 0.4182 | - | 0.6931 | 0.5589 | 0.7348 | - | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.424 | - | 0.8426 | - | 0.8277 | 0.3034 | - | 0.5269 | - | 0.7127 | 0.5422 | 0.7347 | - | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.4356 | - | 0.8117 | - | 0.8568 | 0.3332 | - | 0.4318 | - | 0.7229 | 0.5892 | 0.7556 | - | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.5163 | 0.2919 | 0.833 | - | 0.8503 | 0.3877 | - | 0.5205 | - | 0.7216 | 0.5643 | 0.7508 | 0.2297 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.3829 | 0.2938 | 0.8451 | - | 0.8635 | 0.4645 | - | 0.5876 | - | 0.7322 | 0.5965 | 0.7666 | - | - | +| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.6086 | - | 0.8133 | - | 0.8861 | 0.3868 | - | 0.6286 | - | 0.6758 | 0.544 | 0.7993 | - | - | +| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.6231 | - | 0.8057 | - | 0.8503 | 0.3343 | - | 0.5007 | - | 0.7184 | 0.5485 | 0.7344 | - | - | +| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.617 | 0.4527 | 0.8267 | - | 0.8704 | 0.4241 | - | 0.5826 | - | 0.7208 | 0.4983 | 0.7593 | 0.3119 | - | +| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.5893 | - | 0.8138 | - | 0.8641 | 0.3391 | - | 0.6776 | - | 0.7153 | 0.5203 | 0.7547 | - | - | +| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.4342 | - | 0.8144 | - | 0.805 | 0.3899 | - | 0.5463 | - | 0.6995 | 0.5767 | 0.7248 | - | - | +| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.538 | - | 0.8104 | - | 0.8524 | 0.3014 | - | 0.564 | - | 0.7374 | 0.5885 | 0.7521 | - | - | +| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.3888 | 0.2873 | 0.826 | - | 0.8623 | 0.3103 | - | 0.5072 | - | 0.7063 | 0.5914 | 0.7202 | 0.2445 | - | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | 0.5355 | 0.2603 | 0.8073 | - | 0.8544 | 0.2753 | - | 0.4907 | - | 0.7216 | 0.5878 | 0.7525 | 0.2494 | - | +| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.6641 | - | 0.831 | - | 0.8753 | 0.5662 | - | 0.6208 | - | 0.749 | 0.6188 | 0.7588 | - | - | +| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.5568 | - | 0.8276 | - | 0.885 | 0.4554 | - | 0.5489 | - | 0.7282 | 0.6194 | 0.7417 | - | - | +| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.3654 | 0.4491 | 0.8347 | - | 0.8724 | 0.2961 | - | 0.4452 | - | 0.7184 | 0.5952 | 0.7271 | - | - | #### Test per-class ap @@ -1363,34 +1363,34 @@ Protocol: image-level labels are derived from predicted and GT segmentation maps ##### Methods related to vision foundation models -| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | -|:----------|:---------|:------------------------------------------|:---------------------------|:-----------|:--------------|:-----------------|:------------------|:---------------|:--------------------|:-----------------|:----------------|:--------|:--------------|:--------------|:--------------|:---------|:-----------| -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.4167 | 0.1321 | 0.8749 | - | 0.9146 | 0.1273 | - | 0.5248 | - | 0.7358 | 0.4594 | 0.5535 | 0.0100 | - | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.3655 | 0.1955 | 0.8802 | - | 0.8954 | 0.1129 | - | 0.4819 | - | 0.7210 | 0.4390 | 0.5242 | 0.0095 | - | -| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.4746 | 0.1810 | 0.8791 | - | 0.9106 | 0.1158 | - | 0.4782 | - | 0.7145 | 0.4888 | 0.5688 | 0.0100 | - | -| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.2258 | 0.0189 | 0.7980 | - | 0.9012 | 0.3196 | - | 0.6350 | - | 0.6556 | 0.4541 | 0.6473 | 0.0100 | - | -| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.4057 | 0.0189 | 0.8107 | - | 0.8679 | 0.1417 | - | 0.6313 | - | 0.6680 | 0.4534 | 0.6074 | 0.0100 | - | -| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.3986 | 0.0189 | 0.8033 | - | 0.8646 | 0.1710 | - | 0.5149 | - | 0.6742 | 0.5325 | 0.5399 | 0.0100 | - | -| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4161 | 0.0189 | 0.8251 | - | 0.8991 | 0.2690 | - | 0.6813 | - | 0.7122 | 0.4914 | 0.6211 | 0.0100 | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.4801 | 0.1719 | 0.8524 | - | 0.8667 | 0.0801 | - | 0.5118 | - | 0.7099 | 0.4239 | 0.5145 | 0.0100 | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.1094 | 0.1042 | 0.8711 | - | 0.8678 | 0.0610 | - | 0.4988 | - | 0.6710 | 0.4103 | 0.5014 | 0.0118 | - | -| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.3368 | 0.2089 | 0.8769 | - | 0.8726 | 0.0737 | - | 0.5452 | - | 0.6877 | 0.4242 | 0.5045 | 0.0100 | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.4621 | 0.0189 | 0.8062 | - | 0.8480 | 0.2161 | - | 0.5420 | - | 0.6930 | 0.4542 | 0.5449 | 0.0100 | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.2097 | 0.3964 | 0.8205 | - | 0.8782 | 0.3169 | - | 0.4935 | - | 0.6721 | 0.4716 | 0.5810 | 0.0100 | - | -| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.3830 | 0.0189 | 0.8162 | - | 0.8574 | 0.2637 | - | 0.5548 | - | 0.6786 | 0.4799 | 0.5779 | 0.0100 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.5349 | 0.0189 | 0.8133 | - | 0.9040 | 0.3774 | - | 0.5414 | - | 0.7021 | 0.4758 | 0.6680 | 0.0100 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.6478 | 0.4530 | 0.8247 | - | 0.9060 | 0.4637 | - | 0.6663 | - | 0.6742 | 0.4601 | 0.6346 | 0.1382 | - | -| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.4918 | 0.1961 | 0.8341 | - | 0.9069 | 0.3793 | - | 0.6757 | - | 0.7176 | 0.5535 | 0.6892 | 0.0100 | - | -| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.5604 | 0.0189 | 0.8095 | - | 0.9243 | 0.2812 | - | 0.7034 | - | 0.6390 | 0.4708 | 0.8223 | 0.0100 | - | -| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.7206 | 0.0189 | 0.8215 | - | 0.8942 | 0.3063 | - | 0.7198 | - | 0.6778 | 0.4354 | 0.6132 | 0.0100 | - | -| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.6534 | 0.3786 | 0.8071 | - | 0.9099 | 0.3939 | - | 0.7260 | - | 0.6695 | 0.4531 | 0.6719 | 0.3191 | - | -| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.4507 | 0.0189 | 0.8040 | - | 0.8935 | 0.2952 | - | 0.7062 | - | 0.6423 | 0.4369 | 0.6587 | 0.0100 | - | -| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.4024 | 0.0185 | 0.8114 | - | 0.8520 | 0.2933 | - | 0.6000 | - | 0.6710 | 0.4585 | 0.5470 | 0.0100 | - | -| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.7823 | 0.0194 | 0.8482 | - | 0.9273 | 0.4235 | - | 0.7551 | - | 0.7357 | 0.4317 | 0.6840 | 0.0102 | - | -| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.8213 | 0.5013 | 0.8504 | - | 0.9285 | 0.5011 | - | 0.7783 | - | 0.7158 | 0.4493 | 0.6483 | 0.4510 | - | -| running | SESSRS | MANet (weighted) | t1/t2 search + postprocess | - | - | - | - | - | - | - | - | - | - | - | - | - | - | -| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.7391 | 0.0189 | 0.8217 | - | 0.9338 | 0.4927 | - | 0.7362 | - | 0.7263 | 0.4957 | 0.6716 | 0.0100 | - | -| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.7689 | 0.0189 | 0.8402 | - | 0.9317 | 0.4354 | - | 0.6956 | - | 0.6916 | 0.5005 | 0.7197 | 0.0100 | - | -| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.7647 | 0.4332 | 0.8399 | - | 0.9235 | 0.3672 | - | 0.7290 | - | 0.6839 | 0.4542 | 0.6225 | 0.0100 | - | +| status | model | backbone | loss | Building | Mining raft | Primary Forest | Heavy machinery | Water bodies | Agricultural crop | Compact mounds | Gravel mounds | Grass | Type1 regen | Type2 regen | Bare ground | Sluice | Vehicles | +|:----------|:---------|:------------------------------------------|:---------------------------|-----------:|--------------:|-----------------:|:------------------|---------------:|--------------------:|:-----------------|----------------:|:--------|--------------:|--------------:|--------------:|---------:|:-----------| +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | ce+dice | 0.4167 | 0.1321 | 0.8749 | - | 0.9146 | 0.1273 | - | 0.5248 | - | 0.7358 | 0.4594 | 0.5535 | 0.01 | - | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | weighted_ce+dice | 0.3655 | 0.1955 | 0.8802 | - | 0.8954 | 0.1129 | - | 0.4819 | - | 0.721 | 0.439 | 0.5242 | 0.0095 | - | +| completed | HQ-SAM | ViT-B + HQ decoder (full finetune, msfpn) | focal+dice | 0.4746 | 0.181 | 0.8791 | - | 0.9106 | 0.1158 | - | 0.4782 | - | 0.7145 | 0.4888 | 0.5688 | 0.01 | - | +| completed | SAM_RS | ABCNet + SAM priors | seg+bdy+obj (native) | 0.2258 | 0.0189 | 0.798 | - | 0.9012 | 0.3196 | - | 0.635 | - | 0.6556 | 0.4541 | 0.6473 | 0.01 | - | +| completed | SAM_RS | CMTFNet + SAM priors | seg+bdy+obj (native) | 0.4057 | 0.0189 | 0.8107 | - | 0.8679 | 0.1417 | - | 0.6313 | - | 0.668 | 0.4534 | 0.6074 | 0.01 | - | +| completed | SAM_RS | FTUNetFormer + SAM priors | seg+bdy+obj (native) | 0.3986 | 0.0189 | 0.8033 | - | 0.8646 | 0.171 | - | 0.5149 | - | 0.6742 | 0.5325 | 0.5399 | 0.01 | - | +| completed | SAM_RS | UNetFormer + SAM priors | seg+bdy+obj (native) | 0.4161 | 0.0189 | 0.8251 | - | 0.8991 | 0.269 | - | 0.6813 | - | 0.7122 | 0.4914 | 0.6211 | 0.01 | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | ce+dice | 0.4801 | 0.1719 | 0.8524 | - | 0.8667 | 0.0801 | - | 0.5118 | - | 0.7099 | 0.4239 | 0.5145 | 0.01 | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | weighted_ce+dice | 0.1094 | 0.1042 | 0.8711 | - | 0.8678 | 0.061 | - | 0.4988 | - | 0.671 | 0.4103 | 0.5014 | 0.0118 | - | +| completed | SAM2.1 | Hiera-B+ (frozen backbone, msfpn) | focal+dice | 0.3368 | 0.2089 | 0.8769 | - | 0.8726 | 0.0737 | - | 0.5452 | - | 0.6877 | 0.4242 | 0.5045 | 0.01 | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | ce+dice | 0.4621 | 0.0189 | 0.8062 | - | 0.848 | 0.2161 | - | 0.542 | - | 0.693 | 0.4542 | 0.5449 | 0.01 | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | weighted_ce+dice | 0.2097 | 0.3964 | 0.8205 | - | 0.8782 | 0.3169 | - | 0.4935 | - | 0.6721 | 0.4716 | 0.581 | 0.01 | - | +| completed | SAM2.1 | Hiera-B+ (full finetune, msfpn) | focal+dice | 0.383 | 0.0189 | 0.8162 | - | 0.8574 | 0.2637 | - | 0.5548 | - | 0.6786 | 0.4799 | 0.5779 | 0.01 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | ce+dice | 0.5349 | 0.0189 | 0.8133 | - | 0.904 | 0.3774 | - | 0.5414 | - | 0.7021 | 0.4758 | 0.668 | 0.01 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | weighted_ce+dice | 0.6478 | 0.453 | 0.8247 | - | 0.906 | 0.4637 | - | 0.6663 | - | 0.6742 | 0.4601 | 0.6346 | 0.1382 | - | +| completed | RSAM-Seg | SAM-ViT-B (frozen encoder) | focal+dice | 0.4918 | 0.1961 | 0.8341 | - | 0.9069 | 0.3793 | - | 0.6757 | - | 0.7176 | 0.5535 | 0.6892 | 0.01 | - | +| completed | SESSRS | A2FPN (ce+dice) | t1/t2 search + postprocess | 0.5604 | 0.0189 | 0.8095 | - | 0.9243 | 0.2812 | - | 0.7034 | - | 0.639 | 0.4708 | 0.8223 | 0.01 | - | +| completed | SESSRS | A2FPN (focal) | t1/t2 search + postprocess | 0.7206 | 0.0189 | 0.8215 | - | 0.8942 | 0.3063 | - | 0.7198 | - | 0.6778 | 0.4354 | 0.6132 | 0.01 | - | +| completed | SESSRS | A2FPN (weighted) | t1/t2 search + postprocess | 0.6534 | 0.3786 | 0.8071 | - | 0.9099 | 0.3939 | - | 0.726 | - | 0.6695 | 0.4531 | 0.6719 | 0.3191 | - | +| completed | SESSRS | ABCNet (ce+dice+aux) | t1/t2 search + postprocess | 0.4507 | 0.0189 | 0.804 | - | 0.8935 | 0.2952 | - | 0.7062 | - | 0.6423 | 0.4369 | 0.6587 | 0.01 | - | +| completed | SESSRS | BANet (ce+dice) | t1/t2 search + postprocess | 0.4024 | 0.0185 | 0.8114 | - | 0.852 | 0.2933 | - | 0.6 | - | 0.671 | 0.4585 | 0.547 | 0.01 | - | +| completed | SESSRS | MANet (ce+dice) | t1/t2 search + postprocess | 0.7823 | 0.0194 | 0.8482 | - | 0.9273 | 0.4235 | - | 0.7551 | - | 0.7357 | 0.4317 | 0.684 | 0.0102 | - | +| completed | SESSRS | MANet (focal) | t1/t2 search + postprocess | 0.8213 | 0.5013 | 0.8504 | - | 0.9285 | 0.5011 | - | 0.7783 | - | 0.7158 | 0.4493 | 0.6483 | 0.451 | - | +| completed | SESSRS | MANet (weighted) | t1/t2 search + postprocess | 0.8665 | 0.6566 | 0.844 | - | 0.9322 | 0.4919 | - | 0.7666 | - | 0.6882 | 0.4221 | 0.6778 | 0.2113 | - | +| completed | SESSRS | UNetFormer (ce+dice) | t1/t2 search + postprocess | 0.7391 | 0.0189 | 0.8217 | - | 0.9338 | 0.4927 | - | 0.7362 | - | 0.7263 | 0.4957 | 0.6716 | 0.01 | - | +| completed | SESSRS | UNetFormer (focal) | t1/t2 search + postprocess | 0.7689 | 0.0189 | 0.8402 | - | 0.9317 | 0.4354 | - | 0.6956 | - | 0.6916 | 0.5005 | 0.7197 | 0.01 | - | +| completed | SESSRS | UNetFormer (weighted) | t1/t2 search + postprocess | 0.7647 | 0.4332 | 0.8399 | - | 0.9235 | 0.3672 | - | 0.729 | - | 0.6839 | 0.4542 | 0.6225 | 0.01 | - |