end mmdet for now
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- mmdet/cascade_mask_swin_base_3x_coco_sample_1_bs_16_lora/20250614_124757.log.json +0 -0
- mmdet/cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona/20250610_212914.log.json +0 -0
- mmdet/pretrained_model/swin_base_mona_random_0.5.pth +3 -0
- mmdet/pretrained_model/swin_base_mona_taylor_0.5.pth +3 -0
- mmdet/pretrained_model/swin_base_mona_wanda_act_60000_0.5.pth +3 -0
- mmdet/pretrained_model/swin_base_mona_wanda_act_60000_0.875.pth +3 -0
- mmdet/pretrained_model/swin_base_mona_wanda_act_60000_0.875_llama_moe_7.pth +3 -0
- mmdet/pretrained_model/swin_base_patch4_window7_224_22k.pth +3 -0
- mmdet/results/prune_log/mona/taylor_importance.json +3 -0
- mmdet/results/prune_log/mona/wanda_12000.json +3 -0
- mmdet/results/prune_log/mona/wanda_6000.json +3 -0
- mmdet/results/prune_log/mona/wanda_60000.json +3 -0
- mmdet/results/prune_log/mona/wanda_act_60000.json +3 -0
- mmdet/results/train/llama_moe_4_16_1e-4/20250620_161720.log +585 -0
- mmdet/results/train/llama_moe_4_16_1e-4/20250620_161720.log.json +3 -0
- mmdet/results/train/llama_moe_4_16_1e-4/cascade_mask_swin_base_3x_coco_sample_1_bs_16_llama_moe.py +438 -0
- mmdet/{cascade_mask_swin_base_3x_coco_sample_1_bs_16_lora → results/train/lora}/20250614_124757.log +0 -0
- mmdet/results/train/lora/20250614_124757.log.json +3 -0
- mmdet/{cascade_mask_swin_base_3x_coco_sample_1_bs_16_lora → results/train/lora}/cascade_mask_swin_base_3x_coco_sample_1_bs_16_lora.py +0 -0
- mmdet/results/train/lora/epoch_1.pth +3 -0
- mmdet/{cascade_mask_swin_base_3x_coco_sample_1_bs_16_lora → results/train/lora}/epoch_36.pth +0 -0
- mmdet/results/train/lora/latest.pth +1 -0
- mmdet/{cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona → results/train/mona}/20250610_212914.log +0 -0
- mmdet/results/train/mona/20250610_212914.log.json +3 -0
- mmdet/{cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona → results/train/mona}/cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona.py +0 -0
- mmdet/results/train/mona/epoch_1.pth +3 -0
- mmdet/{cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona → results/train/mona}/epoch_36.pth +0 -0
- mmdet/results/train/mona/latest.pth +1 -0
- mmdet/results/train/mona_llama_moe_2_8_1e-4/20250624_193305.log +0 -0
- mmdet/results/train/mona_llama_moe_2_8_1e-4/20250624_193305.log.json +3 -0
- mmdet/results/train/mona_llama_moe_2_8_1e-4/cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona_llama_moe.py +438 -0
- mmdet/results/train/mona_llama_moe_2_8_1e-4/epoch_1.pth +3 -0
- mmdet/results/train/mona_llama_moe_2_8_1e-4/epoch_36.pth +3 -0
- mmdet/results/train/mona_llama_moe_2_8_1e-4/latest.pth +1 -0
- mmdet/results/train/mona_llama_moe_5_8_1e-4/20250702_125523.log +613 -0
- mmdet/results/train/mona_llama_moe_5_8_1e-4/20250702_125523.log.json +3 -0
- mmdet/results/train/mona_llama_moe_5_8_1e-4/cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona_llama_moe.py +438 -0
- mmdet/results/train/mona_llama_moe_distill_4_16_1e-4/20250620_180057.log +0 -0
- mmdet/results/train/mona_llama_moe_distill_4_16_1e-4/20250620_180057.log.json +3 -0
- mmdet/results/train/mona_llama_moe_distill_4_16_1e-4/cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona_llama_moe_distill.py +438 -0
- mmdet/results/train/mona_llama_moe_distill_4_16_1e-4/epoch_1.pth +3 -0
- mmdet/results/train/mona_llama_moe_distill_4_16_1e-4/latest.pth +1 -0
- mmdet/results/train/mona_moe_4_16_1e-4_balance/20250619_111115.log +0 -0
- mmdet/results/train/mona_moe_4_16_1e-4_balance/20250619_111115.log.json +3 -0
- mmdet/results/train/mona_moe_4_16_1e-4_balance/cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona_moe.py +438 -0
- mmdet/results/train/mona_moe_4_16_1e-4_balance/epoch_1.pth +3 -0
- mmdet/{checkpoints/swin_base_mona_moe_4_16_epoch_4.pth → results/train/mona_moe_4_16_1e-4_balance/epoch_2.pth} +1 -1
- mmdet/results/train/mona_moe_4_16_1e-4_balance/latest.pth +1 -0
- mmdet/results/train/mona_moe_4_16_1e-4_gate/20250618_110426.log +0 -0
- mmdet/results/train/mona_moe_4_16_1e-4_gate/20250618_110426.log.json +3 -0
mmdet/cascade_mask_swin_base_3x_coco_sample_1_bs_16_lora/20250614_124757.log.json
DELETED
|
The diff for this file is too large to render.
See raw diff
|
|
|
mmdet/cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona/20250610_212914.log.json
DELETED
|
The diff for this file is too large to render.
See raw diff
|
|
|
mmdet/pretrained_model/swin_base_mona_random_0.5.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1b0c2e1fff5fdf347a6f123083168813038cf5dea2c7d4c608e7bb3292272fca
|
| 3 |
+
size 483804422
|
mmdet/pretrained_model/swin_base_mona_taylor_0.5.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:57e513866a763f3d4b28a56a991d4d573c8062ee62ece1d938ddd68b2f964a3d
|
| 3 |
+
size 483804422
|
mmdet/pretrained_model/swin_base_mona_wanda_act_60000_0.5.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5d48fa5fa66f359e145b79924d92631d011dfc01d9d1caf8018947fc853bfcc1
|
| 3 |
+
size 483815897
|
mmdet/pretrained_model/swin_base_mona_wanda_act_60000_0.875.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e13ce27ca763d38ada08eabe3f4cb41e396cfda24b9c1315352689bbaf358b58
|
| 3 |
+
size 399991183
|
mmdet/pretrained_model/swin_base_mona_wanda_act_60000_0.875_llama_moe_7.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86219e85cac6ea91fa5e8ca4512de5ad80877ec8909abb63134a35d61898a8ce
|
| 3 |
+
size 595631763
|
mmdet/pretrained_model/swin_base_patch4_window7_224_22k.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:15a79f43baab4503128490da8fe75817a9ceb696aef9ae66ba455f9a251dafb5
|
| 3 |
+
size 438213867
|
mmdet/results/prune_log/mona/taylor_importance.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc1630befd7add277a1716a00dfee3dfa709947d4af137a5b7c0ca172b2e34ac
|
| 3 |
+
size 552510
|
mmdet/results/prune_log/mona/wanda_12000.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f88d06c85374cc94f0b70a2eb710bd97fb0095a2fe347935d0e551598c065f43
|
| 3 |
+
size 552510
|
mmdet/results/prune_log/mona/wanda_6000.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2d9c298c529a7d4278df9d8637b44101d829c380f6b43ba9148cb740db5aaaa5
|
| 3 |
+
size 552510
|
mmdet/results/prune_log/mona/wanda_60000.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea849bed5a063a2702238c5e71bfc82b5944eb31bd266f2f433ef228eb4ec8eb
|
| 3 |
+
size 552510
|
mmdet/results/prune_log/mona/wanda_act_60000.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:61c2629fde77ad5f952260155bb9d7dba036046be315ffddfc6301a8f8eecde9
|
| 3 |
+
size 552510
|
mmdet/results/train/llama_moe_4_16_1e-4/20250620_161720.log
ADDED
|
@@ -0,0 +1,585 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
2025-06-20 16:17:20,333 - mmdet - INFO - Environment info:
|
| 2 |
+
------------------------------------------------------------
|
| 3 |
+
sys.platform: linux
|
| 4 |
+
Python: 3.8.20 (default, Oct 3 2024, 15:24:27) [GCC 11.2.0]
|
| 5 |
+
CUDA available: True
|
| 6 |
+
GPU 0,1,2,3,4,5,6,7: NVIDIA GeForce RTX 4090
|
| 7 |
+
CUDA_HOME: /root/autodl-tmp/cuda/cuda-11.7
|
| 8 |
+
NVCC: Cuda compilation tools, release 11.7, V11.7.64
|
| 9 |
+
GCC: gcc (Ubuntu 9.4.0-1ubuntu1~20.04.1) 9.4.0
|
| 10 |
+
PyTorch: 1.13.1+cu117
|
| 11 |
+
PyTorch compiling details: PyTorch built with:
|
| 12 |
+
- GCC 9.3
|
| 13 |
+
- C++ Version: 201402
|
| 14 |
+
- Intel(R) Math Kernel Library Version 2020.0.0 Product Build 20191122 for Intel(R) 64 architecture applications
|
| 15 |
+
- Intel(R) MKL-DNN v2.6.0 (Git Hash 52b5f107dd9cf10910aaa19cb47f3abf9b349815)
|
| 16 |
+
- OpenMP 201511 (a.k.a. OpenMP 4.5)
|
| 17 |
+
- LAPACK is enabled (usually provided by MKL)
|
| 18 |
+
- NNPACK is enabled
|
| 19 |
+
- CPU capability usage: AVX2
|
| 20 |
+
- CUDA Runtime 11.7
|
| 21 |
+
- NVCC architecture flags: -gencode;arch=compute_37,code=sm_37;-gencode;arch=compute_50,code=sm_50;-gencode;arch=compute_60,code=sm_60;-gencode;arch=compute_70,code=sm_70;-gencode;arch=compute_75,code=sm_75;-gencode;arch=compute_80,code=sm_80;-gencode;arch=compute_86,code=sm_86
|
| 22 |
+
- CuDNN 8.5
|
| 23 |
+
- Magma 2.6.1
|
| 24 |
+
- Build settings: BLAS_INFO=mkl, BUILD_TYPE=Release, CUDA_VERSION=11.7, CUDNN_VERSION=8.5.0, CXX_COMPILER=/opt/rh/devtoolset-9/root/usr/bin/c++, CXX_FLAGS= -fabi-version=11 -Wno-deprecated -fvisibility-inlines-hidden -DUSE_PTHREADPOOL -fopenmp -DNDEBUG -DUSE_KINETO -DUSE_FBGEMM -DUSE_QNNPACK -DUSE_PYTORCH_QNNPACK -DUSE_XNNPACK -DSYMBOLICATE_MOBILE_DEBUG_HANDLE -DEDGE_PROFILER_USE_KINETO -O2 -fPIC -Wno-narrowing -Wall -Wextra -Werror=return-type -Werror=non-virtual-dtor -Wno-missing-field-initializers -Wno-type-limits -Wno-array-bounds -Wno-unknown-pragmas -Wunused-local-typedefs -Wno-unused-parameter -Wno-unused-function -Wno-unused-result -Wno-strict-overflow -Wno-strict-aliasing -Wno-error=deprecated-declarations -Wno-stringop-overflow -Wno-psabi -Wno-error=pedantic -Wno-error=redundant-decls -Wno-error=old-style-cast -fdiagnostics-color=always -faligned-new -Wno-unused-but-set-variable -Wno-maybe-uninitialized -fno-math-errno -fno-trapping-math -Werror=format -Werror=cast-function-type -Wno-stringop-overflow, LAPACK_INFO=mkl, PERF_WITH_AVX=1, PERF_WITH_AVX2=1, PERF_WITH_AVX512=1, TORCH_VERSION=1.13.1, USE_CUDA=ON, USE_CUDNN=ON, USE_EXCEPTION_PTR=1, USE_GFLAGS=OFF, USE_GLOG=OFF, USE_MKL=ON, USE_MKLDNN=ON, USE_MPI=OFF, USE_NCCL=ON, USE_NNPACK=ON, USE_OPENMP=ON, USE_ROCM=OFF,
|
| 25 |
+
|
| 26 |
+
TorchVision: 0.14.1+cu117
|
| 27 |
+
OpenCV: 4.11.0
|
| 28 |
+
MMCV: 1.7.2
|
| 29 |
+
MMCV Compiler: GCC 9.3
|
| 30 |
+
MMCV CUDA Compiler: 11.7
|
| 31 |
+
MMDetection: 2.11.0+b6242b2
|
| 32 |
+
------------------------------------------------------------
|
| 33 |
+
|
| 34 |
+
2025-06-20 16:17:23,940 - mmdet - INFO - Distributed training: True
|
| 35 |
+
2025-06-20 16:17:27,149 - mmdet - INFO - Config:
|
| 36 |
+
model = dict(
|
| 37 |
+
type='CascadeRCNN_loss',
|
| 38 |
+
pretrained=None,
|
| 39 |
+
backbone=dict(
|
| 40 |
+
type='SwinTransformer_llama_moe',
|
| 41 |
+
embed_dim=128,
|
| 42 |
+
depths=[2, 2, 18, 2],
|
| 43 |
+
num_heads=[4, 8, 16, 32],
|
| 44 |
+
window_size=7,
|
| 45 |
+
mlp_ratio=4.0,
|
| 46 |
+
qkv_bias=True,
|
| 47 |
+
qk_scale=None,
|
| 48 |
+
drop_rate=0.0,
|
| 49 |
+
attn_drop_rate=0.0,
|
| 50 |
+
drop_path_rate=0.3,
|
| 51 |
+
ape=False,
|
| 52 |
+
patch_norm=True,
|
| 53 |
+
out_indices=(0, 1, 2, 3),
|
| 54 |
+
use_checkpoint=False),
|
| 55 |
+
neck=dict(
|
| 56 |
+
type='FPN',
|
| 57 |
+
in_channels=[128, 256, 512, 1024],
|
| 58 |
+
out_channels=256,
|
| 59 |
+
num_outs=5),
|
| 60 |
+
rpn_head=dict(
|
| 61 |
+
type='RPNHead',
|
| 62 |
+
in_channels=256,
|
| 63 |
+
feat_channels=256,
|
| 64 |
+
anchor_generator=dict(
|
| 65 |
+
type='AnchorGenerator',
|
| 66 |
+
scales=[8],
|
| 67 |
+
ratios=[0.5, 1.0, 2.0],
|
| 68 |
+
strides=[4, 8, 16, 32, 64]),
|
| 69 |
+
bbox_coder=dict(
|
| 70 |
+
type='DeltaXYWHBBoxCoder',
|
| 71 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 72 |
+
target_stds=[1.0, 1.0, 1.0, 1.0]),
|
| 73 |
+
loss_cls=dict(
|
| 74 |
+
type='CrossEntropyLoss', use_sigmoid=True, loss_weight=1.0),
|
| 75 |
+
loss_bbox=dict(
|
| 76 |
+
type='SmoothL1Loss', beta=0.1111111111111111, loss_weight=1.0)),
|
| 77 |
+
roi_head=dict(
|
| 78 |
+
type='CascadeRoIHead',
|
| 79 |
+
num_stages=3,
|
| 80 |
+
stage_loss_weights=[1, 0.5, 0.25],
|
| 81 |
+
bbox_roi_extractor=dict(
|
| 82 |
+
type='SingleRoIExtractor',
|
| 83 |
+
roi_layer=dict(type='RoIAlign', output_size=7, sampling_ratio=0),
|
| 84 |
+
out_channels=256,
|
| 85 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 86 |
+
bbox_head=[
|
| 87 |
+
dict(
|
| 88 |
+
type='ConvFCBBoxHead',
|
| 89 |
+
num_shared_convs=4,
|
| 90 |
+
num_shared_fcs=1,
|
| 91 |
+
in_channels=256,
|
| 92 |
+
conv_out_channels=256,
|
| 93 |
+
fc_out_channels=1024,
|
| 94 |
+
roi_feat_size=7,
|
| 95 |
+
num_classes=80,
|
| 96 |
+
bbox_coder=dict(
|
| 97 |
+
type='DeltaXYWHBBoxCoder',
|
| 98 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 99 |
+
target_stds=[0.1, 0.1, 0.2, 0.2]),
|
| 100 |
+
reg_class_agnostic=False,
|
| 101 |
+
reg_decoded_bbox=True,
|
| 102 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 103 |
+
loss_cls=dict(
|
| 104 |
+
type='CrossEntropyLoss',
|
| 105 |
+
use_sigmoid=False,
|
| 106 |
+
loss_weight=1.0),
|
| 107 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 108 |
+
dict(
|
| 109 |
+
type='ConvFCBBoxHead',
|
| 110 |
+
num_shared_convs=4,
|
| 111 |
+
num_shared_fcs=1,
|
| 112 |
+
in_channels=256,
|
| 113 |
+
conv_out_channels=256,
|
| 114 |
+
fc_out_channels=1024,
|
| 115 |
+
roi_feat_size=7,
|
| 116 |
+
num_classes=80,
|
| 117 |
+
bbox_coder=dict(
|
| 118 |
+
type='DeltaXYWHBBoxCoder',
|
| 119 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 120 |
+
target_stds=[0.05, 0.05, 0.1, 0.1]),
|
| 121 |
+
reg_class_agnostic=False,
|
| 122 |
+
reg_decoded_bbox=True,
|
| 123 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 124 |
+
loss_cls=dict(
|
| 125 |
+
type='CrossEntropyLoss',
|
| 126 |
+
use_sigmoid=False,
|
| 127 |
+
loss_weight=1.0),
|
| 128 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 129 |
+
dict(
|
| 130 |
+
type='ConvFCBBoxHead',
|
| 131 |
+
num_shared_convs=4,
|
| 132 |
+
num_shared_fcs=1,
|
| 133 |
+
in_channels=256,
|
| 134 |
+
conv_out_channels=256,
|
| 135 |
+
fc_out_channels=1024,
|
| 136 |
+
roi_feat_size=7,
|
| 137 |
+
num_classes=80,
|
| 138 |
+
bbox_coder=dict(
|
| 139 |
+
type='DeltaXYWHBBoxCoder',
|
| 140 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 141 |
+
target_stds=[0.033, 0.033, 0.067, 0.067]),
|
| 142 |
+
reg_class_agnostic=False,
|
| 143 |
+
reg_decoded_bbox=True,
|
| 144 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 145 |
+
loss_cls=dict(
|
| 146 |
+
type='CrossEntropyLoss',
|
| 147 |
+
use_sigmoid=False,
|
| 148 |
+
loss_weight=1.0),
|
| 149 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0))
|
| 150 |
+
],
|
| 151 |
+
mask_roi_extractor=dict(
|
| 152 |
+
type='SingleRoIExtractor',
|
| 153 |
+
roi_layer=dict(type='RoIAlign', output_size=14, sampling_ratio=0),
|
| 154 |
+
out_channels=256,
|
| 155 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 156 |
+
mask_head=dict(
|
| 157 |
+
type='FCNMaskHead',
|
| 158 |
+
num_convs=4,
|
| 159 |
+
in_channels=256,
|
| 160 |
+
conv_out_channels=256,
|
| 161 |
+
num_classes=80,
|
| 162 |
+
loss_mask=dict(
|
| 163 |
+
type='CrossEntropyLoss', use_mask=True, loss_weight=1.0))),
|
| 164 |
+
train_cfg=dict(
|
| 165 |
+
rpn=dict(
|
| 166 |
+
assigner=dict(
|
| 167 |
+
type='MaxIoUAssigner',
|
| 168 |
+
pos_iou_thr=0.7,
|
| 169 |
+
neg_iou_thr=0.3,
|
| 170 |
+
min_pos_iou=0.3,
|
| 171 |
+
match_low_quality=True,
|
| 172 |
+
ignore_iof_thr=-1),
|
| 173 |
+
sampler=dict(
|
| 174 |
+
type='RandomSampler',
|
| 175 |
+
num=256,
|
| 176 |
+
pos_fraction=0.5,
|
| 177 |
+
neg_pos_ub=-1,
|
| 178 |
+
add_gt_as_proposals=False),
|
| 179 |
+
allowed_border=0,
|
| 180 |
+
pos_weight=-1,
|
| 181 |
+
debug=False),
|
| 182 |
+
rpn_proposal=dict(
|
| 183 |
+
nms_across_levels=False,
|
| 184 |
+
nms_pre=2000,
|
| 185 |
+
nms_post=2000,
|
| 186 |
+
max_per_img=2000,
|
| 187 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 188 |
+
min_bbox_size=0),
|
| 189 |
+
rcnn=[
|
| 190 |
+
dict(
|
| 191 |
+
assigner=dict(
|
| 192 |
+
type='MaxIoUAssigner',
|
| 193 |
+
pos_iou_thr=0.5,
|
| 194 |
+
neg_iou_thr=0.5,
|
| 195 |
+
min_pos_iou=0.5,
|
| 196 |
+
match_low_quality=False,
|
| 197 |
+
ignore_iof_thr=-1),
|
| 198 |
+
sampler=dict(
|
| 199 |
+
type='RandomSampler',
|
| 200 |
+
num=512,
|
| 201 |
+
pos_fraction=0.25,
|
| 202 |
+
neg_pos_ub=-1,
|
| 203 |
+
add_gt_as_proposals=True),
|
| 204 |
+
mask_size=28,
|
| 205 |
+
pos_weight=-1,
|
| 206 |
+
debug=False),
|
| 207 |
+
dict(
|
| 208 |
+
assigner=dict(
|
| 209 |
+
type='MaxIoUAssigner',
|
| 210 |
+
pos_iou_thr=0.6,
|
| 211 |
+
neg_iou_thr=0.6,
|
| 212 |
+
min_pos_iou=0.6,
|
| 213 |
+
match_low_quality=False,
|
| 214 |
+
ignore_iof_thr=-1),
|
| 215 |
+
sampler=dict(
|
| 216 |
+
type='RandomSampler',
|
| 217 |
+
num=512,
|
| 218 |
+
pos_fraction=0.25,
|
| 219 |
+
neg_pos_ub=-1,
|
| 220 |
+
add_gt_as_proposals=True),
|
| 221 |
+
mask_size=28,
|
| 222 |
+
pos_weight=-1,
|
| 223 |
+
debug=False),
|
| 224 |
+
dict(
|
| 225 |
+
assigner=dict(
|
| 226 |
+
type='MaxIoUAssigner',
|
| 227 |
+
pos_iou_thr=0.7,
|
| 228 |
+
neg_iou_thr=0.7,
|
| 229 |
+
min_pos_iou=0.7,
|
| 230 |
+
match_low_quality=False,
|
| 231 |
+
ignore_iof_thr=-1),
|
| 232 |
+
sampler=dict(
|
| 233 |
+
type='RandomSampler',
|
| 234 |
+
num=512,
|
| 235 |
+
pos_fraction=0.25,
|
| 236 |
+
neg_pos_ub=-1,
|
| 237 |
+
add_gt_as_proposals=True),
|
| 238 |
+
mask_size=28,
|
| 239 |
+
pos_weight=-1,
|
| 240 |
+
debug=False)
|
| 241 |
+
]),
|
| 242 |
+
test_cfg=dict(
|
| 243 |
+
rpn=dict(
|
| 244 |
+
nms_across_levels=False,
|
| 245 |
+
nms_pre=1000,
|
| 246 |
+
nms_post=1000,
|
| 247 |
+
max_per_img=1000,
|
| 248 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 249 |
+
min_bbox_size=0),
|
| 250 |
+
rcnn=dict(
|
| 251 |
+
score_thr=0.05,
|
| 252 |
+
nms=dict(type='nms', iou_threshold=0.5),
|
| 253 |
+
max_per_img=100,
|
| 254 |
+
mask_thr_binary=0.5)))
|
| 255 |
+
dataset_type = 'CocoDataset'
|
| 256 |
+
data_root = '/root/autodl-tmp/COCO2017/'
|
| 257 |
+
img_norm_cfg = dict(
|
| 258 |
+
mean=[123.675, 116.28, 103.53], std=[58.395, 57.12, 57.375], to_rgb=True)
|
| 259 |
+
train_pipeline = [
|
| 260 |
+
dict(type='LoadImageFromFile'),
|
| 261 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 262 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 263 |
+
dict(
|
| 264 |
+
type='AutoAugment',
|
| 265 |
+
policies=[[{
|
| 266 |
+
'type':
|
| 267 |
+
'Resize',
|
| 268 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333), (576, 1333),
|
| 269 |
+
(608, 1333), (640, 1333), (672, 1333), (704, 1333),
|
| 270 |
+
(736, 1333), (768, 1333), (800, 1333)],
|
| 271 |
+
'multiscale_mode':
|
| 272 |
+
'value',
|
| 273 |
+
'keep_ratio':
|
| 274 |
+
True
|
| 275 |
+
}],
|
| 276 |
+
[{
|
| 277 |
+
'type': 'Resize',
|
| 278 |
+
'img_scale': [(400, 1333), (500, 1333), (600, 1333)],
|
| 279 |
+
'multiscale_mode': 'value',
|
| 280 |
+
'keep_ratio': True
|
| 281 |
+
}, {
|
| 282 |
+
'type': 'RandomCrop',
|
| 283 |
+
'crop_type': 'absolute_range',
|
| 284 |
+
'crop_size': (384, 600),
|
| 285 |
+
'allow_negative_crop': True
|
| 286 |
+
}, {
|
| 287 |
+
'type':
|
| 288 |
+
'Resize',
|
| 289 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 290 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 291 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 292 |
+
(768, 1333), (800, 1333)],
|
| 293 |
+
'multiscale_mode':
|
| 294 |
+
'value',
|
| 295 |
+
'override':
|
| 296 |
+
True,
|
| 297 |
+
'keep_ratio':
|
| 298 |
+
True
|
| 299 |
+
}]]),
|
| 300 |
+
dict(
|
| 301 |
+
type='Normalize',
|
| 302 |
+
mean=[123.675, 116.28, 103.53],
|
| 303 |
+
std=[58.395, 57.12, 57.375],
|
| 304 |
+
to_rgb=True),
|
| 305 |
+
dict(type='Pad', size_divisor=32),
|
| 306 |
+
dict(type='DefaultFormatBundle'),
|
| 307 |
+
dict(type='Collect', keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 308 |
+
]
|
| 309 |
+
test_pipeline = [
|
| 310 |
+
dict(type='LoadImageFromFile'),
|
| 311 |
+
dict(
|
| 312 |
+
type='MultiScaleFlipAug',
|
| 313 |
+
img_scale=(1333, 800),
|
| 314 |
+
flip=False,
|
| 315 |
+
transforms=[
|
| 316 |
+
dict(type='Resize', keep_ratio=True),
|
| 317 |
+
dict(type='RandomFlip'),
|
| 318 |
+
dict(
|
| 319 |
+
type='Normalize',
|
| 320 |
+
mean=[123.675, 116.28, 103.53],
|
| 321 |
+
std=[58.395, 57.12, 57.375],
|
| 322 |
+
to_rgb=True),
|
| 323 |
+
dict(type='Pad', size_divisor=32),
|
| 324 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 325 |
+
dict(type='Collect', keys=['img'])
|
| 326 |
+
])
|
| 327 |
+
]
|
| 328 |
+
data = dict(
|
| 329 |
+
samples_per_gpu=2,
|
| 330 |
+
workers_per_gpu=4,
|
| 331 |
+
train=dict(
|
| 332 |
+
type='CocoDataset',
|
| 333 |
+
ann_file=
|
| 334 |
+
'/root/autodl-tmp/COCO2017/annotations/instances_train2017.json',
|
| 335 |
+
img_prefix='/root/autodl-tmp/COCO2017/train2017/',
|
| 336 |
+
pipeline=[
|
| 337 |
+
dict(type='LoadImageFromFile'),
|
| 338 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 339 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 340 |
+
dict(
|
| 341 |
+
type='AutoAugment',
|
| 342 |
+
policies=[[{
|
| 343 |
+
'type':
|
| 344 |
+
'Resize',
|
| 345 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 346 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 347 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 348 |
+
(768, 1333), (800, 1333)],
|
| 349 |
+
'multiscale_mode':
|
| 350 |
+
'value',
|
| 351 |
+
'keep_ratio':
|
| 352 |
+
True
|
| 353 |
+
}],
|
| 354 |
+
[{
|
| 355 |
+
'type': 'Resize',
|
| 356 |
+
'img_scale': [(400, 1333), (500, 1333),
|
| 357 |
+
(600, 1333)],
|
| 358 |
+
'multiscale_mode': 'value',
|
| 359 |
+
'keep_ratio': True
|
| 360 |
+
}, {
|
| 361 |
+
'type': 'RandomCrop',
|
| 362 |
+
'crop_type': 'absolute_range',
|
| 363 |
+
'crop_size': (384, 600),
|
| 364 |
+
'allow_negative_crop': True
|
| 365 |
+
}, {
|
| 366 |
+
'type':
|
| 367 |
+
'Resize',
|
| 368 |
+
'img_scale': [(480, 1333), (512, 1333),
|
| 369 |
+
(544, 1333), (576, 1333),
|
| 370 |
+
(608, 1333), (640, 1333),
|
| 371 |
+
(672, 1333), (704, 1333),
|
| 372 |
+
(736, 1333), (768, 1333),
|
| 373 |
+
(800, 1333)],
|
| 374 |
+
'multiscale_mode':
|
| 375 |
+
'value',
|
| 376 |
+
'override':
|
| 377 |
+
True,
|
| 378 |
+
'keep_ratio':
|
| 379 |
+
True
|
| 380 |
+
}]]),
|
| 381 |
+
dict(
|
| 382 |
+
type='Normalize',
|
| 383 |
+
mean=[123.675, 116.28, 103.53],
|
| 384 |
+
std=[58.395, 57.12, 57.375],
|
| 385 |
+
to_rgb=True),
|
| 386 |
+
dict(type='Pad', size_divisor=32),
|
| 387 |
+
dict(type='DefaultFormatBundle'),
|
| 388 |
+
dict(
|
| 389 |
+
type='Collect',
|
| 390 |
+
keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 391 |
+
]),
|
| 392 |
+
val=dict(
|
| 393 |
+
type='CocoDataset',
|
| 394 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 395 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 396 |
+
pipeline=[
|
| 397 |
+
dict(type='LoadImageFromFile'),
|
| 398 |
+
dict(
|
| 399 |
+
type='MultiScaleFlipAug',
|
| 400 |
+
img_scale=(1333, 800),
|
| 401 |
+
flip=False,
|
| 402 |
+
transforms=[
|
| 403 |
+
dict(type='Resize', keep_ratio=True),
|
| 404 |
+
dict(type='RandomFlip'),
|
| 405 |
+
dict(
|
| 406 |
+
type='Normalize',
|
| 407 |
+
mean=[123.675, 116.28, 103.53],
|
| 408 |
+
std=[58.395, 57.12, 57.375],
|
| 409 |
+
to_rgb=True),
|
| 410 |
+
dict(type='Pad', size_divisor=32),
|
| 411 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 412 |
+
dict(type='Collect', keys=['img'])
|
| 413 |
+
])
|
| 414 |
+
]),
|
| 415 |
+
test=dict(
|
| 416 |
+
type='CocoDataset',
|
| 417 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 418 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 419 |
+
pipeline=[
|
| 420 |
+
dict(type='LoadImageFromFile'),
|
| 421 |
+
dict(
|
| 422 |
+
type='MultiScaleFlipAug',
|
| 423 |
+
img_scale=(1333, 800),
|
| 424 |
+
flip=False,
|
| 425 |
+
transforms=[
|
| 426 |
+
dict(type='Resize', keep_ratio=True),
|
| 427 |
+
dict(type='RandomFlip'),
|
| 428 |
+
dict(
|
| 429 |
+
type='Normalize',
|
| 430 |
+
mean=[123.675, 116.28, 103.53],
|
| 431 |
+
std=[58.395, 57.12, 57.375],
|
| 432 |
+
to_rgb=True),
|
| 433 |
+
dict(type='Pad', size_divisor=32),
|
| 434 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 435 |
+
dict(type='Collect', keys=['img'])
|
| 436 |
+
])
|
| 437 |
+
]))
|
| 438 |
+
evaluation = dict(metric=['bbox', 'segm'], gpu_collect=True)
|
| 439 |
+
optimizer = dict(
|
| 440 |
+
type='AdamW',
|
| 441 |
+
lr=0.0001,
|
| 442 |
+
betas=(0.9, 0.999),
|
| 443 |
+
weight_decay=0.05,
|
| 444 |
+
paramwise_cfg=dict(
|
| 445 |
+
custom_keys=dict(
|
| 446 |
+
absolute_pos_embed=dict(decay_mult=0.0),
|
| 447 |
+
relative_position_bias_table=dict(decay_mult=0.0),
|
| 448 |
+
norm=dict(decay_mult=0.0))))
|
| 449 |
+
optimizer_config = dict(
|
| 450 |
+
grad_clip=None,
|
| 451 |
+
type='DistOptimizerHook',
|
| 452 |
+
update_interval=1,
|
| 453 |
+
coalesce=True,
|
| 454 |
+
bucket_size_mb=-1,
|
| 455 |
+
use_fp16=True)
|
| 456 |
+
lr_config = dict(
|
| 457 |
+
policy='step',
|
| 458 |
+
warmup='linear',
|
| 459 |
+
warmup_iters=500,
|
| 460 |
+
warmup_ratio=0.001,
|
| 461 |
+
step=[27, 33])
|
| 462 |
+
runner = dict(type='EpochBasedRunnerAmp', max_epochs=36)
|
| 463 |
+
checkpoint_config = dict(interval=1)
|
| 464 |
+
log_config = dict(interval=50, hooks=[dict(type='TextLoggerHook')])
|
| 465 |
+
custom_hooks = [dict(type='NumClassCheckHook')]
|
| 466 |
+
dist_params = dict(backend='nccl')
|
| 467 |
+
log_level = 'INFO'
|
| 468 |
+
load_from = '/root/autodl-tmp/caihaojie/mona/Swin-Transformer-Object-Detection/pretrained_model/swin_base_llama_moe_16.pth'
|
| 469 |
+
resume_from = None
|
| 470 |
+
workflow = [('train', 1)]
|
| 471 |
+
fp16 = None
|
| 472 |
+
work_dir = './results/train/llama_moe_4_16_1e-4/'
|
| 473 |
+
gpu_ids = range(0, 8)
|
| 474 |
+
|
| 475 |
+
2025-06-20 16:18:09,321 - mmdet - INFO - load checkpoint from local path: /root/autodl-tmp/caihaojie/mona/Swin-Transformer-Object-Detection/pretrained_model/swin_base_llama_moe_16.pth
|
| 476 |
+
2025-06-20 16:18:09,704 - mmdet - WARNING - The model and loaded state dict do not match exactly
|
| 477 |
+
|
| 478 |
+
unexpected key in source state_dict: backbone.norm.weight, backbone.norm.bias, backbone.head.weight, backbone.head.bias, backbone.layers.0.blocks.1.attn_mask, backbone.layers.1.blocks.1.attn_mask, backbone.layers.2.blocks.1.attn_mask, backbone.layers.2.blocks.3.attn_mask, backbone.layers.2.blocks.5.attn_mask, backbone.layers.2.blocks.7.attn_mask, backbone.layers.2.blocks.9.attn_mask, backbone.layers.2.blocks.11.attn_mask, backbone.layers.2.blocks.13.attn_mask, backbone.layers.2.blocks.15.attn_mask, backbone.layers.2.blocks.17.attn_mask
|
| 479 |
+
|
| 480 |
+
missing keys in source state_dict: backbone.layers.0.blocks.0.mlp.fc1.gate.gate_network.0.weight, backbone.layers.0.blocks.0.mlp.fc1.gate.gate_network.2.weight, backbone.layers.0.blocks.0.mlp.fc1.gate.weight_noise.weight, backbone.layers.0.blocks.0.mlp.fc1.calculator.experts.weight_gate, backbone.layers.0.blocks.0.mlp.fc1.calculator.experts.bias_gate, backbone.layers.0.blocks.1.mlp.fc1.gate.gate_network.0.weight, backbone.layers.0.blocks.1.mlp.fc1.gate.gate_network.2.weight, backbone.layers.0.blocks.1.mlp.fc1.gate.weight_noise.weight, backbone.layers.0.blocks.1.mlp.fc1.calculator.experts.weight_gate, backbone.layers.0.blocks.1.mlp.fc1.calculator.experts.bias_gate, backbone.layers.1.blocks.0.mlp.fc1.gate.gate_network.0.weight, backbone.layers.1.blocks.0.mlp.fc1.gate.gate_network.2.weight, backbone.layers.1.blocks.0.mlp.fc1.gate.weight_noise.weight, backbone.layers.1.blocks.0.mlp.fc1.calculator.experts.weight_gate, backbone.layers.1.blocks.0.mlp.fc1.calculator.experts.bias_gate, backbone.layers.1.blocks.1.mlp.fc1.gate.gate_network.0.weight, backbone.layers.1.blocks.1.mlp.fc1.gate.gate_network.2.weight, backbone.layers.1.blocks.1.mlp.fc1.gate.weight_noise.weight, backbone.layers.1.blocks.1.mlp.fc1.calculator.experts.weight_gate, backbone.layers.1.blocks.1.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.0.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.0.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.0.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.0.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.0.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.1.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.1.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.1.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.1.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.1.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.2.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.2.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.2.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.2.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.2.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.3.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.3.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.3.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.3.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.3.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.4.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.4.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.4.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.4.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.4.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.5.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.5.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.5.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.5.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.5.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.6.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.6.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.6.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.6.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.6.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.7.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.7.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.7.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.7.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.7.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.8.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.8.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.8.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.8.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.8.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.9.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.9.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.9.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.9.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.9.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.10.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.10.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.10.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.10.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.10.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.11.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.11.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.11.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.11.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.11.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.12.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.12.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.12.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.12.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.12.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.13.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.13.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.13.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.13.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.13.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.14.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.14.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.14.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.14.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.14.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.15.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.15.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.15.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.15.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.15.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.16.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.16.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.16.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.16.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.16.mlp.fc1.calculator.experts.bias_gate, backbone.layers.2.blocks.17.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.17.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.17.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.17.mlp.fc1.calculator.experts.weight_gate, backbone.layers.2.blocks.17.mlp.fc1.calculator.experts.bias_gate, backbone.layers.3.blocks.0.mlp.fc1.gate.gate_network.0.weight, backbone.layers.3.blocks.0.mlp.fc1.gate.gate_network.2.weight, backbone.layers.3.blocks.0.mlp.fc1.gate.weight_noise.weight, backbone.layers.3.blocks.0.mlp.fc1.calculator.experts.weight_gate, backbone.layers.3.blocks.0.mlp.fc1.calculator.experts.bias_gate, backbone.layers.3.blocks.1.mlp.fc1.gate.gate_network.0.weight, backbone.layers.3.blocks.1.mlp.fc1.gate.gate_network.2.weight, backbone.layers.3.blocks.1.mlp.fc1.gate.weight_noise.weight, backbone.layers.3.blocks.1.mlp.fc1.calculator.experts.weight_gate, backbone.layers.3.blocks.1.mlp.fc1.calculator.experts.bias_gate, backbone.norm0.weight, backbone.norm0.bias, backbone.norm1.weight, backbone.norm1.bias, backbone.norm2.weight, backbone.norm2.bias, backbone.norm3.weight, backbone.norm3.bias, neck.lateral_convs.0.conv.weight, neck.lateral_convs.0.conv.bias, neck.lateral_convs.1.conv.weight, neck.lateral_convs.1.conv.bias, neck.lateral_convs.2.conv.weight, neck.lateral_convs.2.conv.bias, neck.lateral_convs.3.conv.weight, neck.lateral_convs.3.conv.bias, neck.fpn_convs.0.conv.weight, neck.fpn_convs.0.conv.bias, neck.fpn_convs.1.conv.weight, neck.fpn_convs.1.conv.bias, neck.fpn_convs.2.conv.weight, neck.fpn_convs.2.conv.bias, neck.fpn_convs.3.conv.weight, neck.fpn_convs.3.conv.bias, rpn_head.rpn_conv.weight, rpn_head.rpn_conv.bias, rpn_head.rpn_cls.weight, rpn_head.rpn_cls.bias, rpn_head.rpn_reg.weight, rpn_head.rpn_reg.bias, roi_head.bbox_head.0.fc_cls.weight, roi_head.bbox_head.0.fc_cls.bias, roi_head.bbox_head.0.fc_reg.weight, roi_head.bbox_head.0.fc_reg.bias, roi_head.bbox_head.0.shared_convs.0.conv.weight, roi_head.bbox_head.0.shared_convs.0.bn.weight, roi_head.bbox_head.0.shared_convs.0.bn.bias, roi_head.bbox_head.0.shared_convs.0.bn.running_mean, roi_head.bbox_head.0.shared_convs.0.bn.running_var, roi_head.bbox_head.0.shared_convs.1.conv.weight, roi_head.bbox_head.0.shared_convs.1.bn.weight, roi_head.bbox_head.0.shared_convs.1.bn.bias, roi_head.bbox_head.0.shared_convs.1.bn.running_mean, roi_head.bbox_head.0.shared_convs.1.bn.running_var, roi_head.bbox_head.0.shared_convs.2.conv.weight, roi_head.bbox_head.0.shared_convs.2.bn.weight, roi_head.bbox_head.0.shared_convs.2.bn.bias, roi_head.bbox_head.0.shared_convs.2.bn.running_mean, roi_head.bbox_head.0.shared_convs.2.bn.running_var, roi_head.bbox_head.0.shared_convs.3.conv.weight, roi_head.bbox_head.0.shared_convs.3.bn.weight, roi_head.bbox_head.0.shared_convs.3.bn.bias, roi_head.bbox_head.0.shared_convs.3.bn.running_mean, roi_head.bbox_head.0.shared_convs.3.bn.running_var, roi_head.bbox_head.0.shared_fcs.0.weight, roi_head.bbox_head.0.shared_fcs.0.bias, roi_head.bbox_head.1.fc_cls.weight, roi_head.bbox_head.1.fc_cls.bias, roi_head.bbox_head.1.fc_reg.weight, roi_head.bbox_head.1.fc_reg.bias, roi_head.bbox_head.1.shared_convs.0.conv.weight, roi_head.bbox_head.1.shared_convs.0.bn.weight, roi_head.bbox_head.1.shared_convs.0.bn.bias, roi_head.bbox_head.1.shared_convs.0.bn.running_mean, roi_head.bbox_head.1.shared_convs.0.bn.running_var, roi_head.bbox_head.1.shared_convs.1.conv.weight, roi_head.bbox_head.1.shared_convs.1.bn.weight, roi_head.bbox_head.1.shared_convs.1.bn.bias, roi_head.bbox_head.1.shared_convs.1.bn.running_mean, roi_head.bbox_head.1.shared_convs.1.bn.running_var, roi_head.bbox_head.1.shared_convs.2.conv.weight, roi_head.bbox_head.1.shared_convs.2.bn.weight, roi_head.bbox_head.1.shared_convs.2.bn.bias, roi_head.bbox_head.1.shared_convs.2.bn.running_mean, roi_head.bbox_head.1.shared_convs.2.bn.running_var, roi_head.bbox_head.1.shared_convs.3.conv.weight, roi_head.bbox_head.1.shared_convs.3.bn.weight, roi_head.bbox_head.1.shared_convs.3.bn.bias, roi_head.bbox_head.1.shared_convs.3.bn.running_mean, roi_head.bbox_head.1.shared_convs.3.bn.running_var, roi_head.bbox_head.1.shared_fcs.0.weight, roi_head.bbox_head.1.shared_fcs.0.bias, roi_head.bbox_head.2.fc_cls.weight, roi_head.bbox_head.2.fc_cls.bias, roi_head.bbox_head.2.fc_reg.weight, roi_head.bbox_head.2.fc_reg.bias, roi_head.bbox_head.2.shared_convs.0.conv.weight, roi_head.bbox_head.2.shared_convs.0.bn.weight, roi_head.bbox_head.2.shared_convs.0.bn.bias, roi_head.bbox_head.2.shared_convs.0.bn.running_mean, roi_head.bbox_head.2.shared_convs.0.bn.running_var, roi_head.bbox_head.2.shared_convs.1.conv.weight, roi_head.bbox_head.2.shared_convs.1.bn.weight, roi_head.bbox_head.2.shared_convs.1.bn.bias, roi_head.bbox_head.2.shared_convs.1.bn.running_mean, roi_head.bbox_head.2.shared_convs.1.bn.running_var, roi_head.bbox_head.2.shared_convs.2.conv.weight, roi_head.bbox_head.2.shared_convs.2.bn.weight, roi_head.bbox_head.2.shared_convs.2.bn.bias, roi_head.bbox_head.2.shared_convs.2.bn.running_mean, roi_head.bbox_head.2.shared_convs.2.bn.running_var, roi_head.bbox_head.2.shared_convs.3.conv.weight, roi_head.bbox_head.2.shared_convs.3.bn.weight, roi_head.bbox_head.2.shared_convs.3.bn.bias, roi_head.bbox_head.2.shared_convs.3.bn.running_mean, roi_head.bbox_head.2.shared_convs.3.bn.running_var, roi_head.bbox_head.2.shared_fcs.0.weight, roi_head.bbox_head.2.shared_fcs.0.bias, roi_head.mask_head.0.convs.0.conv.weight, roi_head.mask_head.0.convs.0.conv.bias, roi_head.mask_head.0.convs.1.conv.weight, roi_head.mask_head.0.convs.1.conv.bias, roi_head.mask_head.0.convs.2.conv.weight, roi_head.mask_head.0.convs.2.conv.bias, roi_head.mask_head.0.convs.3.conv.weight, roi_head.mask_head.0.convs.3.conv.bias, roi_head.mask_head.0.upsample.weight, roi_head.mask_head.0.upsample.bias, roi_head.mask_head.0.conv_logits.weight, roi_head.mask_head.0.conv_logits.bias, roi_head.mask_head.1.convs.0.conv.weight, roi_head.mask_head.1.convs.0.conv.bias, roi_head.mask_head.1.convs.1.conv.weight, roi_head.mask_head.1.convs.1.conv.bias, roi_head.mask_head.1.convs.2.conv.weight, roi_head.mask_head.1.convs.2.conv.bias, roi_head.mask_head.1.convs.3.conv.weight, roi_head.mask_head.1.convs.3.conv.bias, roi_head.mask_head.1.upsample.weight, roi_head.mask_head.1.upsample.bias, roi_head.mask_head.1.conv_logits.weight, roi_head.mask_head.1.conv_logits.bias, roi_head.mask_head.2.convs.0.conv.weight, roi_head.mask_head.2.convs.0.conv.bias, roi_head.mask_head.2.convs.1.conv.weight, roi_head.mask_head.2.convs.1.conv.bias, roi_head.mask_head.2.convs.2.conv.weight, roi_head.mask_head.2.convs.2.conv.bias, roi_head.mask_head.2.convs.3.conv.weight, roi_head.mask_head.2.convs.3.conv.bias, roi_head.mask_head.2.upsample.weight, roi_head.mask_head.2.upsample.bias, roi_head.mask_head.2.conv_logits.weight, roi_head.mask_head.2.conv_logits.bias
|
| 481 |
+
|
| 482 |
+
2025-06-20 16:18:09,744 - mmdet - INFO - Start running, host: root@autodl-container-313040b114-67ed2cfc, work_dir: /root/autodl-tmp/caihaojie/mona/Swin-Transformer-Object-Detection/results/train/llama_moe_4_16_1e-4
|
| 483 |
+
2025-06-20 16:18:09,744 - mmdet - INFO - Hooks will be executed in the following order:
|
| 484 |
+
before_run:
|
| 485 |
+
(VERY_HIGH ) StepLrUpdaterHook
|
| 486 |
+
(ABOVE_NORMAL) DistOptimizerHook
|
| 487 |
+
(NORMAL ) CheckpointHook
|
| 488 |
+
(NORMAL ) DistEvalHook
|
| 489 |
+
(VERY_LOW ) TextLoggerHook
|
| 490 |
+
--------------------
|
| 491 |
+
before_train_epoch:
|
| 492 |
+
(VERY_HIGH ) StepLrUpdaterHook
|
| 493 |
+
(NORMAL ) DistSamplerSeedHook
|
| 494 |
+
(NORMAL ) DistEvalHook
|
| 495 |
+
(NORMAL ) NumClassCheckHook
|
| 496 |
+
(LOW ) IterTimerHook
|
| 497 |
+
(VERY_LOW ) TextLoggerHook
|
| 498 |
+
--------------------
|
| 499 |
+
before_train_iter:
|
| 500 |
+
(VERY_HIGH ) StepLrUpdaterHook
|
| 501 |
+
(LOW ) IterTimerHook
|
| 502 |
+
--------------------
|
| 503 |
+
after_train_iter:
|
| 504 |
+
(ABOVE_NORMAL) DistOptimizerHook
|
| 505 |
+
(NORMAL ) CheckpointHook
|
| 506 |
+
(NORMAL ) DistEvalHook
|
| 507 |
+
(LOW ) IterTimerHook
|
| 508 |
+
(VERY_LOW ) TextLoggerHook
|
| 509 |
+
--------------------
|
| 510 |
+
after_train_epoch:
|
| 511 |
+
(NORMAL ) CheckpointHook
|
| 512 |
+
(NORMAL ) DistEvalHook
|
| 513 |
+
(VERY_LOW ) TextLoggerHook
|
| 514 |
+
--------------------
|
| 515 |
+
before_val_epoch:
|
| 516 |
+
(NORMAL ) DistSamplerSeedHook
|
| 517 |
+
(NORMAL ) NumClassCheckHook
|
| 518 |
+
(LOW ) IterTimerHook
|
| 519 |
+
(VERY_LOW ) TextLoggerHook
|
| 520 |
+
--------------------
|
| 521 |
+
before_val_iter:
|
| 522 |
+
(LOW ) IterTimerHook
|
| 523 |
+
--------------------
|
| 524 |
+
after_val_iter:
|
| 525 |
+
(LOW ) IterTimerHook
|
| 526 |
+
--------------------
|
| 527 |
+
after_val_epoch:
|
| 528 |
+
(VERY_LOW ) TextLoggerHook
|
| 529 |
+
--------------------
|
| 530 |
+
after_run:
|
| 531 |
+
(VERY_LOW ) TextLoggerHook
|
| 532 |
+
--------------------
|
| 533 |
+
2025-06-20 16:18:09,745 - mmdet - INFO - workflow: [('train', 1)], max: 36 epochs
|
| 534 |
+
2025-06-20 16:18:09,745 - mmdet - INFO - Checkpoints will be saved to /root/autodl-tmp/caihaojie/mona/Swin-Transformer-Object-Detection/results/train/llama_moe_4_16_1e-4 by HardDiskBackend.
|
| 535 |
+
2025-06-20 16:20:20,612 - mmdet - INFO - Epoch [1][50/7330] lr: 9.890e-06, eta: 7 days, 23:47:01, time: 2.617, data_time: 1.562, memory: 18485, r_loss: 0.0355, loss_rpn_cls: 0.6260, loss_rpn_bbox: 0.0672, s0.loss_cls: 2.8746, s0.acc: 65.0957, s0.loss_bbox: 0.0785, s0.loss_mask: 0.8793, s1.loss_cls: 1.2573, s1.acc: 76.6528, s1.loss_bbox: 0.0108, s1.loss_mask: 0.4882, s2.loss_cls: 0.6631, s2.acc: 73.5295, s2.loss_bbox: 0.0013, s2.loss_mask: 0.2481, loss: 7.2297
|
| 536 |
+
2025-06-20 16:21:08,205 - mmdet - INFO - Epoch [1][100/7330] lr: 1.988e-05, eta: 5 days, 10:45:11, time: 0.952, data_time: 0.025, memory: 18485, r_loss: 0.0240, loss_rpn_cls: 0.3321, loss_rpn_bbox: 0.0649, s0.loss_cls: 0.4256, s0.acc: 94.5229, s0.loss_bbox: 0.1852, s0.loss_mask: 0.7326, s1.loss_cls: 0.1195, s1.acc: 97.2224, s1.loss_bbox: 0.0259, s1.loss_mask: 0.3772, s2.loss_cls: 0.0434, s2.acc: 98.2791, s2.loss_bbox: 0.0030, s2.loss_mask: 0.1887, loss: 2.5220
|
| 537 |
+
2025-06-20 16:21:55,857 - mmdet - INFO - Epoch [1][150/7330] lr: 2.987e-05, eta: 4 days, 14:24:56, time: 0.953, data_time: 0.025, memory: 18485, r_loss: 0.0084, loss_rpn_cls: 0.2450, loss_rpn_bbox: 0.0575, s0.loss_cls: 0.3917, s0.acc: 94.2341, s0.loss_bbox: 0.1942, s0.loss_mask: 0.6949, s1.loss_cls: 0.1153, s1.acc: 96.9961, s1.loss_bbox: 0.0287, s1.loss_mask: 0.3492, s2.loss_cls: 0.0394, s2.acc: 98.1492, s2.loss_bbox: 0.0034, s2.loss_mask: 0.1747, loss: 2.3023
|
| 538 |
+
2025-06-20 16:22:45,898 - mmdet - INFO - Epoch [1][200/7330] lr: 3.986e-05, eta: 4 days, 5:07:19, time: 1.001, data_time: 0.021, memory: 19202, r_loss: 0.0035, loss_rpn_cls: 0.2456, loss_rpn_bbox: 0.0594, s0.loss_cls: 0.3909, s0.acc: 94.0952, s0.loss_bbox: 0.1961, s0.loss_mask: 0.6847, s1.loss_cls: 0.1178, s1.acc: 96.8430, s1.loss_bbox: 0.0301, s1.loss_mask: 0.3402, s2.loss_cls: 0.0397, s2.acc: 98.0442, s2.loss_bbox: 0.0037, s2.loss_mask: 0.1696, loss: 2.2811
|
| 539 |
+
2025-06-20 16:23:39,549 - mmdet - INFO - Epoch [1][250/7330] lr: 4.985e-05, eta: 4 days, 0:36:04, time: 1.073, data_time: 0.024, memory: 19202, r_loss: 0.0027, loss_rpn_cls: 0.2432, loss_rpn_bbox: 0.0600, s0.loss_cls: 0.3807, s0.acc: 94.1726, s0.loss_bbox: 0.1956, s0.loss_mask: 0.6734, s1.loss_cls: 0.1136, s1.acc: 96.9294, s1.loss_bbox: 0.0292, s1.loss_mask: 0.3337, s2.loss_cls: 0.0384, s2.acc: 98.0957, s2.loss_bbox: 0.0035, s2.loss_mask: 0.1657, loss: 2.2397
|
| 540 |
+
2025-06-20 16:24:25,080 - mmdet - INFO - Epoch [1][300/7330] lr: 5.984e-05, eta: 3 days, 19:35:37, time: 0.910, data_time: 0.027, memory: 19202, r_loss: 0.0023, loss_rpn_cls: 0.2318, loss_rpn_bbox: 0.0567, s0.loss_cls: 0.3617, s0.acc: 94.3884, s0.loss_bbox: 0.1881, s0.loss_mask: 0.6636, s1.loss_cls: 0.1080, s1.acc: 97.0325, s1.loss_bbox: 0.0282, s1.loss_mask: 0.3271, s2.loss_cls: 0.0366, s2.acc: 98.1499, s2.loss_bbox: 0.0035, s2.loss_mask: 0.1626, loss: 2.1701
|
| 541 |
+
2025-06-20 16:25:10,065 - mmdet - INFO - Epoch [1][350/7330] lr: 6.983e-05, eta: 3 days, 15:54:08, time: 0.900, data_time: 0.023, memory: 19202, r_loss: 0.0018, loss_rpn_cls: 0.2192, loss_rpn_bbox: 0.0557, s0.loss_cls: 0.3440, s0.acc: 94.6101, s0.loss_bbox: 0.1816, s0.loss_mask: 0.6611, s1.loss_cls: 0.1030, s1.acc: 97.1196, s1.loss_bbox: 0.0281, s1.loss_mask: 0.3243, s2.loss_cls: 0.0343, s2.acc: 98.2356, s2.loss_bbox: 0.0034, s2.loss_mask: 0.1605, loss: 2.1171
|
| 542 |
+
2025-06-20 16:25:56,499 - mmdet - INFO - Epoch [1][400/7330] lr: 7.982e-05, eta: 3 days, 13:23:35, time: 0.928, data_time: 0.027, memory: 19748, r_loss: 0.0017, loss_rpn_cls: 0.2164, loss_rpn_bbox: 0.0618, s0.loss_cls: 0.3681, s0.acc: 94.2371, s0.loss_bbox: 0.1945, s0.loss_mask: 0.6470, s1.loss_cls: 0.1097, s1.acc: 96.9456, s1.loss_bbox: 0.0294, s1.loss_mask: 0.3164, s2.loss_cls: 0.0367, s2.acc: 98.1011, s2.loss_bbox: 0.0036, s2.loss_mask: 0.1558, loss: 2.1411
|
| 543 |
+
2025-06-20 16:26:44,498 - mmdet - INFO - Epoch [1][450/7330] lr: 8.981e-05, eta: 3 days, 11:41:44, time: 0.960, data_time: 0.025, memory: 19748, r_loss: 0.0018, loss_rpn_cls: 0.1919, loss_rpn_bbox: 0.0569, s0.loss_cls: 0.3892, s0.acc: 93.9355, s0.loss_bbox: 0.2113, s0.loss_mask: 0.6423, s1.loss_cls: 0.1115, s1.acc: 96.9028, s1.loss_bbox: 0.0315, s1.loss_mask: 0.3143, s2.loss_cls: 0.0366, s2.acc: 98.1306, s2.loss_bbox: 0.0040, s2.loss_mask: 0.1534, loss: 2.1447
|
| 544 |
+
2025-06-20 16:27:37,437 - mmdet - INFO - Epoch [1][500/7330] lr: 9.980e-05, eta: 3 days, 11:03:44, time: 1.059, data_time: 0.020, memory: 19748, r_loss: 0.0015, loss_rpn_cls: 0.1916, loss_rpn_bbox: 0.0559, s0.loss_cls: 0.3960, s0.acc: 93.7881, s0.loss_bbox: 0.2180, s0.loss_mask: 0.6349, s1.loss_cls: 0.1132, s1.acc: 96.8503, s1.loss_bbox: 0.0321, s1.loss_mask: 0.3104, s2.loss_cls: 0.0367, s2.acc: 98.1179, s2.loss_bbox: 0.0040, s2.loss_mask: 0.1511, loss: 2.1454
|
| 545 |
+
2025-06-20 16:28:24,605 - mmdet - INFO - Epoch [1][550/7330] lr: 1.000e-04, eta: 3 days, 9:46:11, time: 0.943, data_time: 0.023, memory: 19748, r_loss: 0.0015, loss_rpn_cls: 0.1926, loss_rpn_bbox: 0.0552, s0.loss_cls: 0.4150, s0.acc: 93.6028, s0.loss_bbox: 0.2266, s0.loss_mask: 0.6272, s1.loss_cls: 0.1165, s1.acc: 96.7849, s1.loss_bbox: 0.0335, s1.loss_mask: 0.3049, s2.loss_cls: 0.0371, s2.acc: 98.1091, s2.loss_bbox: 0.0041, s2.loss_mask: 0.1478, loss: 2.1620
|
| 546 |
+
2025-06-20 16:29:09,770 - mmdet - INFO - Epoch [1][600/7330] lr: 1.000e-04, eta: 3 days, 8:26:44, time: 0.903, data_time: 0.020, memory: 19748, r_loss: 0.0022, loss_rpn_cls: 0.1819, loss_rpn_bbox: 0.0560, s0.loss_cls: 0.4558, s0.acc: 92.9470, s0.loss_bbox: 0.2558, s0.loss_mask: 0.6124, s1.loss_cls: 0.1240, s1.acc: 96.5686, s1.loss_bbox: 0.0368, s1.loss_mask: 0.2987, s2.loss_cls: 0.0383, s2.acc: 98.0356, s2.loss_bbox: 0.0044, s2.loss_mask: 0.1443, loss: 2.2106
|
| 547 |
+
2025-06-20 16:29:54,658 - mmdet - INFO - Epoch [1][650/7330] lr: 1.000e-04, eta: 3 days, 7:17:35, time: 0.898, data_time: 0.025, memory: 19748, r_loss: 0.0016, loss_rpn_cls: 0.1900, loss_rpn_bbox: 0.0575, s0.loss_cls: 0.4505, s0.acc: 92.9016, s0.loss_bbox: 0.2567, s0.loss_mask: 0.6052, s1.loss_cls: 0.1222, s1.acc: 96.5630, s1.loss_bbox: 0.0369, s1.loss_mask: 0.2964, s2.loss_cls: 0.0373, s2.acc: 98.0469, s2.loss_bbox: 0.0043, s2.loss_mask: 0.1444, loss: 2.2032
|
| 548 |
+
2025-06-20 16:30:43,057 - mmdet - INFO - Epoch [1][700/7330] lr: 1.000e-04, eta: 3 days, 6:40:09, time: 0.968, data_time: 0.022, memory: 19748, r_loss: 0.0014, loss_rpn_cls: 0.1937, loss_rpn_bbox: 0.0587, s0.loss_cls: 0.4761, s0.acc: 92.3748, s0.loss_bbox: 0.2762, s0.loss_mask: 0.5948, s1.loss_cls: 0.1297, s1.acc: 96.2668, s1.loss_bbox: 0.0406, s1.loss_mask: 0.2906, s2.loss_cls: 0.0395, s2.acc: 97.8875, s2.loss_bbox: 0.0048, s2.loss_mask: 0.1416, loss: 2.2477
|
| 549 |
+
2025-06-20 16:31:39,203 - mmdet - INFO - Epoch [1][750/7330] lr: 1.000e-04, eta: 3 days, 6:52:56, time: 1.123, data_time: 0.023, memory: 19748, r_loss: 0.0014, loss_rpn_cls: 0.1872, loss_rpn_bbox: 0.0590, s0.loss_cls: 0.4721, s0.acc: 92.3787, s0.loss_bbox: 0.2770, s0.loss_mask: 0.5942, s1.loss_cls: 0.1281, s1.acc: 96.3015, s1.loss_bbox: 0.0405, s1.loss_mask: 0.2890, s2.loss_cls: 0.0388, s2.acc: 97.9268, s2.loss_bbox: 0.0048, s2.loss_mask: 0.1405, loss: 2.2327
|
| 550 |
+
2025-06-20 16:32:27,278 - mmdet - INFO - Epoch [1][800/7330] lr: 1.000e-04, eta: 3 days, 6:19:49, time: 0.962, data_time: 0.023, memory: 19748, r_loss: 0.0014, loss_rpn_cls: 0.1810, loss_rpn_bbox: 0.0560, s0.loss_cls: 0.4734, s0.acc: 92.3376, s0.loss_bbox: 0.2794, s0.loss_mask: 0.5923, s1.loss_cls: 0.1287, s1.acc: 96.2595, s1.loss_bbox: 0.0418, s1.loss_mask: 0.2888, s2.loss_cls: 0.0386, s2.acc: 97.9307, s2.loss_bbox: 0.0050, s2.loss_mask: 0.1413, loss: 2.2278
|
| 551 |
+
2025-06-20 16:33:12,936 - mmdet - INFO - Epoch [1][850/7330] lr: 1.000e-04, eta: 3 days, 5:38:01, time: 0.913, data_time: 0.024, memory: 19748, r_loss: 0.0015, loss_rpn_cls: 0.1882, loss_rpn_bbox: 0.0600, s0.loss_cls: 0.4514, s0.acc: 92.6785, s0.loss_bbox: 0.2636, s0.loss_mask: 0.5796, s1.loss_cls: 0.1255, s1.acc: 96.3271, s1.loss_bbox: 0.0406, s1.loss_mask: 0.2824, s2.loss_cls: 0.0375, s2.acc: 97.9612, s2.loss_bbox: 0.0047, s2.loss_mask: 0.1374, loss: 2.1723
|
| 552 |
+
2025-06-20 16:33:57,557 - mmdet - INFO - Epoch [1][900/7330] lr: 1.000e-04, eta: 3 days, 4:55:41, time: 0.892, data_time: 0.022, memory: 19748, r_loss: 0.0013, loss_rpn_cls: 0.1757, loss_rpn_bbox: 0.0568, s0.loss_cls: 0.4752, s0.acc: 92.2673, s0.loss_bbox: 0.2807, s0.loss_mask: 0.5848, s1.loss_cls: 0.1308, s1.acc: 96.1675, s1.loss_bbox: 0.0428, s1.loss_mask: 0.2841, s2.loss_cls: 0.0389, s2.acc: 97.8911, s2.loss_bbox: 0.0050, s2.loss_mask: 0.1387, loss: 2.2148
|
| 553 |
+
2025-06-20 16:34:45,532 - mmdet - INFO - Epoch [1][950/7330] lr: 1.000e-04, eta: 3 days, 4:33:12, time: 0.959, data_time: 0.024, memory: 19748, r_loss: 0.0013, loss_rpn_cls: 0.1696, loss_rpn_bbox: 0.0535, s0.loss_cls: 0.4713, s0.acc: 92.3374, s0.loss_bbox: 0.2784, s0.loss_mask: 0.5742, s1.loss_cls: 0.1317, s1.acc: 96.1257, s1.loss_bbox: 0.0443, s1.loss_mask: 0.2813, s2.loss_cls: 0.0391, s2.acc: 97.8909, s2.loss_bbox: 0.0053, s2.loss_mask: 0.1366, loss: 2.1866
|
| 554 |
+
2025-06-20 16:35:38,865 - mmdet - INFO - Exp name: cascade_mask_swin_base_3x_coco_sample_1_bs_16_llama_moe.py
|
| 555 |
+
2025-06-20 16:35:38,866 - mmdet - INFO - Epoch [1][1000/7330] lr: 1.000e-04, eta: 3 days, 4:36:23, time: 1.067, data_time: 0.025, memory: 19748, r_loss: 0.0012, loss_rpn_cls: 0.1765, loss_rpn_bbox: 0.0547, s0.loss_cls: 0.4694, s0.acc: 92.1941, s0.loss_bbox: 0.2818, s0.loss_mask: 0.5683, s1.loss_cls: 0.1334, s1.acc: 95.9756, s1.loss_bbox: 0.0460, s1.loss_mask: 0.2772, s2.loss_cls: 0.0394, s2.acc: 97.8245, s2.loss_bbox: 0.0054, s2.loss_mask: 0.1349, loss: 2.1885
|
| 556 |
+
2025-06-20 16:36:27,230 - mmdet - INFO - Epoch [1][1050/7330] lr: 1.000e-04, eta: 3 days, 4:18:24, time: 0.967, data_time: 0.026, memory: 19748, r_loss: 0.0013, loss_rpn_cls: 0.1736, loss_rpn_bbox: 0.0547, s0.loss_cls: 0.4720, s0.acc: 92.1873, s0.loss_bbox: 0.2808, s0.loss_mask: 0.5678, s1.loss_cls: 0.1364, s1.acc: 95.8508, s1.loss_bbox: 0.0480, s1.loss_mask: 0.2755, s2.loss_cls: 0.0405, s2.acc: 97.7468, s2.loss_bbox: 0.0060, s2.loss_mask: 0.1341, loss: 2.1907
|
| 557 |
+
2025-06-20 16:37:15,022 - mmdet - INFO - Epoch [1][1100/7330] lr: 1.000e-04, eta: 3 days, 3:59:47, time: 0.956, data_time: 0.027, memory: 19748, r_loss: 0.0013, loss_rpn_cls: 0.1548, loss_rpn_bbox: 0.0517, s0.loss_cls: 0.4617, s0.acc: 92.2188, s0.loss_bbox: 0.2822, s0.loss_mask: 0.5622, s1.loss_cls: 0.1345, s1.acc: 95.8225, s1.loss_bbox: 0.0501, s1.loss_mask: 0.2731, s2.loss_cls: 0.0389, s2.acc: 97.8018, s2.loss_bbox: 0.0062, s2.loss_mask: 0.1325, loss: 2.1491
|
| 558 |
+
2025-06-20 16:38:00,424 - mmdet - INFO - Epoch [1][1150/7330] lr: 1.000e-04, eta: 3 days, 3:33:35, time: 0.908, data_time: 0.026, memory: 19748, r_loss: 0.0012, loss_rpn_cls: 0.1700, loss_rpn_bbox: 0.0570, s0.loss_cls: 0.4653, s0.acc: 92.1116, s0.loss_bbox: 0.2824, s0.loss_mask: 0.5610, s1.loss_cls: 0.1381, s1.acc: 95.6643, s1.loss_bbox: 0.0511, s1.loss_mask: 0.2725, s2.loss_cls: 0.0403, s2.acc: 97.6765, s2.loss_bbox: 0.0064, s2.loss_mask: 0.1322, loss: 2.1775
|
| 559 |
+
2025-06-20 16:38:49,674 - mmdet - INFO - Epoch [1][1200/7330] lr: 1.000e-04, eta: 3 days, 3:23:31, time: 0.985, data_time: 0.029, memory: 19748, r_loss: 0.0012, loss_rpn_cls: 0.1711, loss_rpn_bbox: 0.0588, s0.loss_cls: 0.4757, s0.acc: 91.7695, s0.loss_bbox: 0.2938, s0.loss_mask: 0.5604, s1.loss_cls: 0.1422, s1.acc: 95.4233, s1.loss_bbox: 0.0540, s1.loss_mask: 0.2706, s2.loss_cls: 0.0423, s2.acc: 97.5142, s2.loss_bbox: 0.0071, s2.loss_mask: 0.1310, loss: 2.2080
|
| 560 |
+
2025-06-20 16:39:40,124 - mmdet - INFO - Epoch [1][1250/7330] lr: 1.000e-04, eta: 3 days, 3:18:22, time: 1.009, data_time: 0.025, memory: 19748, r_loss: 0.0013, loss_rpn_cls: 0.1638, loss_rpn_bbox: 0.0540, s0.loss_cls: 0.4602, s0.acc: 92.2368, s0.loss_bbox: 0.2780, s0.loss_mask: 0.5537, s1.loss_cls: 0.1412, s1.acc: 95.5205, s1.loss_bbox: 0.0542, s1.loss_mask: 0.2678, s2.loss_cls: 0.0408, s2.acc: 97.6326, s2.loss_bbox: 0.0071, s2.loss_mask: 0.1295, loss: 2.1516
|
| 561 |
+
2025-06-20 16:40:31,603 - mmdet - INFO - Epoch [1][1300/7330] lr: 1.000e-04, eta: 3 days, 3:17:07, time: 1.030, data_time: 0.024, memory: 19748, r_loss: 0.0013, loss_rpn_cls: 0.1546, loss_rpn_bbox: 0.0511, s0.loss_cls: 0.4662, s0.acc: 92.1296, s0.loss_bbox: 0.2819, s0.loss_mask: 0.5441, s1.loss_cls: 0.1444, s1.acc: 95.4031, s1.loss_bbox: 0.0561, s1.loss_mask: 0.2633, s2.loss_cls: 0.0421, s2.acc: 97.5378, s2.loss_bbox: 0.0076, s2.loss_mask: 0.1271, loss: 2.1401
|
| 562 |
+
2025-06-20 16:41:20,243 - mmdet - INFO - Epoch [1][1350/7330] lr: 1.000e-04, eta: 3 days, 3:06:38, time: 0.973, data_time: 0.025, memory: 19748, r_loss: 0.0013, loss_rpn_cls: 0.1636, loss_rpn_bbox: 0.0555, s0.loss_cls: 0.4701, s0.acc: 91.7637, s0.loss_bbox: 0.2959, s0.loss_mask: 0.5471, s1.loss_cls: 0.1452, s1.acc: 95.1948, s1.loss_bbox: 0.0592, s1.loss_mask: 0.2637, s2.loss_cls: 0.0422, s2.acc: 97.4385, s2.loss_bbox: 0.0081, s2.loss_mask: 0.1270, loss: 2.1789
|
| 563 |
+
2025-06-20 16:42:08,145 - mmdet - INFO - Epoch [1][1400/7330] lr: 1.000e-04, eta: 3 days, 2:54:32, time: 0.958, data_time: 0.023, memory: 19748, r_loss: 0.0014, loss_rpn_cls: 0.1501, loss_rpn_bbox: 0.0521, s0.loss_cls: 0.4591, s0.acc: 92.0781, s0.loss_bbox: 0.2848, s0.loss_mask: 0.5379, s1.loss_cls: 0.1446, s1.acc: 95.2485, s1.loss_bbox: 0.0590, s1.loss_mask: 0.2597, s2.loss_cls: 0.0418, s2.acc: 97.4902, s2.loss_bbox: 0.0081, s2.loss_mask: 0.1252, loss: 2.1239
|
| 564 |
+
2025-06-20 16:42:56,203 - mmdet - INFO - Epoch [1][1450/7330] lr: 1.000e-04, eta: 3 days, 2:43:40, time: 0.961, data_time: 0.022, memory: 19748, r_loss: 0.0014, loss_rpn_cls: 0.1561, loss_rpn_bbox: 0.0529, s0.loss_cls: 0.4650, s0.acc: 91.7893, s0.loss_bbox: 0.2931, s0.loss_mask: 0.5386, s1.loss_cls: 0.1488, s1.acc: 94.9685, s1.loss_bbox: 0.0622, s1.loss_mask: 0.2599, s2.loss_cls: 0.0431, s2.acc: 97.3218, s2.loss_bbox: 0.0087, s2.loss_mask: 0.1252, loss: 2.1549
|
| 565 |
+
2025-06-20 16:43:42,213 - mmdet - INFO - Epoch [1][1500/7330] lr: 1.000e-04, eta: 3 days, 2:27:33, time: 0.920, data_time: 0.025, memory: 19748, r_loss: 0.0014, loss_rpn_cls: 0.1575, loss_rpn_bbox: 0.0577, s0.loss_cls: 0.4774, s0.acc: 91.4978, s0.loss_bbox: 0.3046, s0.loss_mask: 0.5389, s1.loss_cls: 0.1524, s1.acc: 94.8298, s1.loss_bbox: 0.0644, s1.loss_mask: 0.2597, s2.loss_cls: 0.0444, s2.acc: 97.2524, s2.loss_bbox: 0.0090, s2.loss_mask: 0.1246, loss: 2.1919
|
| 566 |
+
2025-06-20 16:44:37,274 - mmdet - INFO - Epoch [1][1550/7330] lr: 1.000e-04, eta: 3 days, 2:37:53, time: 1.101, data_time: 0.032, memory: 19748, r_loss: 0.0014, loss_rpn_cls: 0.1485, loss_rpn_bbox: 0.0533, s0.loss_cls: 0.4618, s0.acc: 91.9006, s0.loss_bbox: 0.2891, s0.loss_mask: 0.5366, s1.loss_cls: 0.1480, s1.acc: 95.0056, s1.loss_bbox: 0.0624, s1.loss_mask: 0.2582, s2.loss_cls: 0.0433, s2.acc: 97.3013, s2.loss_bbox: 0.0090, s2.loss_mask: 0.1241, loss: 2.1356
|
| 567 |
+
2025-06-20 16:45:28,115 - mmdet - INFO - Epoch [1][1600/7330] lr: 1.000e-04, eta: 3 days, 2:36:02, time: 1.017, data_time: 0.022, memory: 19748, r_loss: 0.0014, loss_rpn_cls: 0.1558, loss_rpn_bbox: 0.0541, s0.loss_cls: 0.4715, s0.acc: 91.6938, s0.loss_bbox: 0.2954, s0.loss_mask: 0.5353, s1.loss_cls: 0.1532, s1.acc: 94.7935, s1.loss_bbox: 0.0653, s1.loss_mask: 0.2566, s2.loss_cls: 0.0450, s2.acc: 97.1553, s2.loss_bbox: 0.0096, s2.loss_mask: 0.1230, loss: 2.1663
|
| 568 |
+
2025-06-20 16:46:16,469 - mmdet - INFO - Epoch [1][1650/7330] lr: 1.000e-04, eta: 3 days, 2:27:35, time: 0.967, data_time: 0.027, memory: 19748, r_loss: 0.0015, loss_rpn_cls: 0.1472, loss_rpn_bbox: 0.0516, s0.loss_cls: 0.4604, s0.acc: 91.8923, s0.loss_bbox: 0.2890, s0.loss_mask: 0.5324, s1.loss_cls: 0.1512, s1.acc: 94.8445, s1.loss_bbox: 0.0648, s1.loss_mask: 0.2551, s2.loss_cls: 0.0444, s2.acc: 97.1938, s2.loss_bbox: 0.0096, s2.loss_mask: 0.1228, loss: 2.1299
|
| 569 |
+
2025-06-20 16:47:05,489 - mmdet - INFO - Epoch [1][1700/7330] lr: 1.000e-04, eta: 3 days, 2:21:22, time: 0.980, data_time: 0.025, memory: 19748, r_loss: 0.0015, loss_rpn_cls: 0.1526, loss_rpn_bbox: 0.0519, s0.loss_cls: 0.4658, s0.acc: 91.6958, s0.loss_bbox: 0.2922, s0.loss_mask: 0.5298, s1.loss_cls: 0.1568, s1.acc: 94.5852, s1.loss_bbox: 0.0678, s1.loss_mask: 0.2555, s2.loss_cls: 0.0462, s2.acc: 97.0496, s2.loss_bbox: 0.0102, s2.loss_mask: 0.1226, loss: 2.1529
|
| 570 |
+
2025-06-20 16:47:52,071 - mmdet - INFO - Epoch [1][1750/7330] lr: 1.000e-04, eta: 3 days, 2:09:24, time: 0.932, data_time: 0.024, memory: 19748, r_loss: 0.0015, loss_rpn_cls: 0.1527, loss_rpn_bbox: 0.0559, s0.loss_cls: 0.4844, s0.acc: 91.3584, s0.loss_bbox: 0.3041, s0.loss_mask: 0.5211, s1.loss_cls: 0.1646, s1.acc: 94.2219, s1.loss_bbox: 0.0735, s1.loss_mask: 0.2508, s2.loss_cls: 0.0481, s2.acc: 96.8760, s2.loss_bbox: 0.0113, s2.loss_mask: 0.1208, loss: 2.1887
|
| 571 |
+
2025-06-20 16:48:46,879 - mmdet - INFO - Epoch [1][1800/7330] lr: 1.000e-04, eta: 3 days, 2:18:01, time: 1.096, data_time: 0.023, memory: 19748, r_loss: 0.0015, loss_rpn_cls: 0.1527, loss_rpn_bbox: 0.0512, s0.loss_cls: 0.4724, s0.acc: 91.6426, s0.loss_bbox: 0.2951, s0.loss_mask: 0.5248, s1.loss_cls: 0.1600, s1.acc: 94.4915, s1.loss_bbox: 0.0701, s1.loss_mask: 0.2518, s2.loss_cls: 0.0469, s2.acc: 96.9832, s2.loss_bbox: 0.0107, s2.loss_mask: 0.1206, loss: 2.1579
|
| 572 |
+
2025-06-20 16:49:33,553 - mmdet - INFO - Epoch [1][1850/7330] lr: 1.000e-04, eta: 3 days, 2:06:50, time: 0.933, data_time: 0.028, memory: 19748, r_loss: 0.0016, loss_rpn_cls: 0.1481, loss_rpn_bbox: 0.0535, s0.loss_cls: 0.4800, s0.acc: 91.3792, s0.loss_bbox: 0.3048, s0.loss_mask: 0.5185, s1.loss_cls: 0.1660, s1.acc: 94.1240, s1.loss_bbox: 0.0757, s1.loss_mask: 0.2485, s2.loss_cls: 0.0493, s2.acc: 96.7520, s2.loss_bbox: 0.0120, s2.loss_mask: 0.1189, loss: 2.1770
|
| 573 |
+
2025-06-20 16:50:28,128 - mmdet - INFO - Epoch [1][1900/7330] lr: 1.000e-04, eta: 3 days, 2:14:25, time: 1.092, data_time: 0.024, memory: 19748, r_loss: 0.0015, loss_rpn_cls: 0.1424, loss_rpn_bbox: 0.0525, s0.loss_cls: 0.4545, s0.acc: 91.7488, s0.loss_bbox: 0.2901, s0.loss_mask: 0.5209, s1.loss_cls: 0.1562, s1.acc: 94.3499, s1.loss_bbox: 0.0720, s1.loss_mask: 0.2498, s2.loss_cls: 0.0468, s2.acc: 96.8398, s2.loss_bbox: 0.0117, s2.loss_mask: 0.1202, loss: 2.1185
|
| 574 |
+
2025-06-20 16:51:17,124 - mmdet - INFO - Epoch [1][1950/7330] lr: 1.000e-04, eta: 3 days, 2:09:04, time: 0.980, data_time: 0.025, memory: 19748, r_loss: 0.0016, loss_rpn_cls: 0.1376, loss_rpn_bbox: 0.0530, s0.loss_cls: 0.4649, s0.acc: 91.3611, s0.loss_bbox: 0.3082, s0.loss_mask: 0.5170, s1.loss_cls: 0.1612, s1.acc: 94.0696, s1.loss_bbox: 0.0771, s1.loss_mask: 0.2479, s2.loss_cls: 0.0479, s2.acc: 96.7119, s2.loss_bbox: 0.0123, s2.loss_mask: 0.1192, loss: 2.1479
|
| 575 |
+
2025-06-20 16:52:03,703 - mmdet - INFO - Exp name: cascade_mask_swin_base_3x_coco_sample_1_bs_16_llama_moe.py
|
| 576 |
+
2025-06-20 16:52:03,703 - mmdet - INFO - Epoch [1][2000/7330] lr: 1.000e-04, eta: 3 days, 1:58:39, time: 0.932, data_time: 0.027, memory: 19748, r_loss: 0.0015, loss_rpn_cls: 0.1463, loss_rpn_bbox: 0.0515, s0.loss_cls: 0.4666, s0.acc: 91.3276, s0.loss_bbox: 0.3034, s0.loss_mask: 0.5177, s1.loss_cls: 0.1671, s1.acc: 93.8352, s1.loss_bbox: 0.0800, s1.loss_mask: 0.2488, s2.loss_cls: 0.0498, s2.acc: 96.5693, s2.loss_bbox: 0.0133, s2.loss_mask: 0.1190, loss: 2.1649
|
| 577 |
+
2025-06-20 16:52:56,200 - mmdet - INFO - Epoch [1][2050/7330] lr: 1.000e-04, eta: 3 days, 2:01:20, time: 1.050, data_time: 0.023, memory: 19748, r_loss: 0.0015, loss_rpn_cls: 0.1447, loss_rpn_bbox: 0.0507, s0.loss_cls: 0.4658, s0.acc: 91.3267, s0.loss_bbox: 0.3071, s0.loss_mask: 0.5236, s1.loss_cls: 0.1642, s1.acc: 93.9326, s1.loss_bbox: 0.0786, s1.loss_mask: 0.2504, s2.loss_cls: 0.0493, s2.acc: 96.6104, s2.loss_bbox: 0.0130, s2.loss_mask: 0.1199, loss: 2.1688
|
| 578 |
+
2025-06-20 16:53:42,887 - mmdet - INFO - Epoch [1][2100/7330] lr: 1.000e-04, eta: 3 days, 1:51:45, time: 0.934, data_time: 0.022, memory: 19748, r_loss: 0.0015, loss_rpn_cls: 0.1340, loss_rpn_bbox: 0.0513, s0.loss_cls: 0.4526, s0.acc: 91.5217, s0.loss_bbox: 0.2992, s0.loss_mask: 0.5045, s1.loss_cls: 0.1623, s1.acc: 93.9475, s1.loss_bbox: 0.0790, s1.loss_mask: 0.2417, s2.loss_cls: 0.0489, s2.acc: 96.5830, s2.loss_bbox: 0.0132, s2.loss_mask: 0.1155, loss: 2.1039
|
| 579 |
+
2025-06-20 16:54:35,035 - mmdet - INFO - Epoch [1][2150/7330] lr: 1.000e-04, eta: 3 days, 1:53:40, time: 1.043, data_time: 0.023, memory: 19748, r_loss: 0.0015, loss_rpn_cls: 0.1375, loss_rpn_bbox: 0.0510, s0.loss_cls: 0.4443, s0.acc: 91.6472, s0.loss_bbox: 0.2941, s0.loss_mask: 0.5051, s1.loss_cls: 0.1632, s1.acc: 93.8262, s1.loss_bbox: 0.0801, s1.loss_mask: 0.2421, s2.loss_cls: 0.0499, s2.acc: 96.4719, s2.loss_bbox: 0.0140, s2.loss_mask: 0.1155, loss: 2.0983
|
| 580 |
+
2025-06-20 16:55:27,555 - mmdet - INFO - Epoch [1][2200/7330] lr: 1.000e-04, eta: 3 days, 1:56:08, time: 1.050, data_time: 0.022, memory: 19748, r_loss: 0.0017, loss_rpn_cls: 0.1370, loss_rpn_bbox: 0.0523, s0.loss_cls: 0.4705, s0.acc: 91.3201, s0.loss_bbox: 0.3054, s0.loss_mask: 0.5086, s1.loss_cls: 0.1694, s1.acc: 93.7239, s1.loss_bbox: 0.0816, s1.loss_mask: 0.2427, s2.loss_cls: 0.0516, s2.acc: 96.4050, s2.loss_bbox: 0.0141, s2.loss_mask: 0.1163, loss: 2.1511
|
| 581 |
+
2025-06-20 16:56:14,071 - mmdet - INFO - Epoch [1][2250/7330] lr: 1.000e-04, eta: 3 days, 1:46:55, time: 0.931, data_time: 0.025, memory: 19748, r_loss: 0.0016, loss_rpn_cls: 0.1302, loss_rpn_bbox: 0.0479, s0.loss_cls: 0.4580, s0.acc: 91.3982, s0.loss_bbox: 0.3017, s0.loss_mask: 0.5019, s1.loss_cls: 0.1679, s1.acc: 93.6460, s1.loss_bbox: 0.0839, s1.loss_mask: 0.2386, s2.loss_cls: 0.0518, s2.acc: 96.2466, s2.loss_bbox: 0.0153, s2.loss_mask: 0.1141, loss: 2.1130
|
| 582 |
+
2025-06-20 16:57:04,285 - mmdet - INFO - Epoch [1][2300/7330] lr: 1.000e-04, eta: 3 days, 1:45:03, time: 1.004, data_time: 0.021, memory: 19748, r_loss: 0.0016, loss_rpn_cls: 0.1441, loss_rpn_bbox: 0.0529, s0.loss_cls: 0.4622, s0.acc: 91.2048, s0.loss_bbox: 0.3117, s0.loss_mask: 0.5057, s1.loss_cls: 0.1691, s1.acc: 93.4653, s1.loss_bbox: 0.0869, s1.loss_mask: 0.2436, s2.loss_cls: 0.0519, s2.acc: 96.1904, s2.loss_bbox: 0.0155, s2.loss_mask: 0.1163, loss: 2.1615
|
| 583 |
+
2025-06-20 16:57:51,551 - mmdet - INFO - Epoch [1][2350/7330] lr: 1.000e-04, eta: 3 days, 1:37:44, time: 0.945, data_time: 0.021, memory: 19748, r_loss: 0.0016, loss_rpn_cls: 0.1300, loss_rpn_bbox: 0.0510, s0.loss_cls: 0.4593, s0.acc: 91.3479, s0.loss_bbox: 0.3024, s0.loss_mask: 0.4998, s1.loss_cls: 0.1720, s1.acc: 93.4587, s1.loss_bbox: 0.0864, s1.loss_mask: 0.2381, s2.loss_cls: 0.0530, s2.acc: 96.1746, s2.loss_bbox: 0.0158, s2.loss_mask: 0.1129, loss: 2.1223
|
| 584 |
+
2025-06-20 16:58:46,298 - mmdet - INFO - Epoch [1][2400/7330] lr: 1.000e-04, eta: 3 days, 1:44:16, time: 1.095, data_time: 0.023, memory: 19748, r_loss: 0.0015, loss_rpn_cls: 0.1374, loss_rpn_bbox: 0.0524, s0.loss_cls: 0.4628, s0.acc: 91.1279, s0.loss_bbox: 0.3082, s0.loss_mask: 0.5001, s1.loss_cls: 0.1733, s1.acc: 93.3199, s1.loss_bbox: 0.0880, s1.loss_mask: 0.2387, s2.loss_cls: 0.0537, s2.acc: 96.0493, s2.loss_bbox: 0.0163, s2.loss_mask: 0.1132, loss: 2.1456
|
| 585 |
+
2025-06-20 16:59:34,494 - mmdet - INFO - Epoch [1][2450/7330] lr: 1.000e-04, eta: 3 days, 1:38:50, time: 0.963, data_time: 0.029, memory: 19748, r_loss: 0.0016, loss_rpn_cls: 0.1328, loss_rpn_bbox: 0.0502, s0.loss_cls: 0.4735, s0.acc: 90.8613, s0.loss_bbox: 0.3204, s0.loss_mask: 0.4960, s1.loss_cls: 0.1781, s1.acc: 93.0613, s1.loss_bbox: 0.0921, s1.loss_mask: 0.2372, s2.loss_cls: 0.0557, s2.acc: 95.8508, s2.loss_bbox: 0.0174, s2.loss_mask: 0.1132, loss: 2.1681
|
mmdet/results/train/llama_moe_4_16_1e-4/20250620_161720.log.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b813f247dedebb9b1312db12164c90ad2e14174fef4fa4ef82172ed0596291a3
|
| 3 |
+
size 42800
|
mmdet/results/train/llama_moe_4_16_1e-4/cascade_mask_swin_base_3x_coco_sample_1_bs_16_llama_moe.py
ADDED
|
@@ -0,0 +1,438 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
model = dict(
|
| 2 |
+
type='CascadeRCNN_loss',
|
| 3 |
+
pretrained=None,
|
| 4 |
+
backbone=dict(
|
| 5 |
+
type='SwinTransformer_llama_moe',
|
| 6 |
+
embed_dim=128,
|
| 7 |
+
depths=[2, 2, 18, 2],
|
| 8 |
+
num_heads=[4, 8, 16, 32],
|
| 9 |
+
window_size=7,
|
| 10 |
+
mlp_ratio=4.0,
|
| 11 |
+
qkv_bias=True,
|
| 12 |
+
qk_scale=None,
|
| 13 |
+
drop_rate=0.0,
|
| 14 |
+
attn_drop_rate=0.0,
|
| 15 |
+
drop_path_rate=0.3,
|
| 16 |
+
ape=False,
|
| 17 |
+
patch_norm=True,
|
| 18 |
+
out_indices=(0, 1, 2, 3),
|
| 19 |
+
use_checkpoint=False),
|
| 20 |
+
neck=dict(
|
| 21 |
+
type='FPN',
|
| 22 |
+
in_channels=[128, 256, 512, 1024],
|
| 23 |
+
out_channels=256,
|
| 24 |
+
num_outs=5),
|
| 25 |
+
rpn_head=dict(
|
| 26 |
+
type='RPNHead',
|
| 27 |
+
in_channels=256,
|
| 28 |
+
feat_channels=256,
|
| 29 |
+
anchor_generator=dict(
|
| 30 |
+
type='AnchorGenerator',
|
| 31 |
+
scales=[8],
|
| 32 |
+
ratios=[0.5, 1.0, 2.0],
|
| 33 |
+
strides=[4, 8, 16, 32, 64]),
|
| 34 |
+
bbox_coder=dict(
|
| 35 |
+
type='DeltaXYWHBBoxCoder',
|
| 36 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 37 |
+
target_stds=[1.0, 1.0, 1.0, 1.0]),
|
| 38 |
+
loss_cls=dict(
|
| 39 |
+
type='CrossEntropyLoss', use_sigmoid=True, loss_weight=1.0),
|
| 40 |
+
loss_bbox=dict(
|
| 41 |
+
type='SmoothL1Loss', beta=0.1111111111111111, loss_weight=1.0)),
|
| 42 |
+
roi_head=dict(
|
| 43 |
+
type='CascadeRoIHead',
|
| 44 |
+
num_stages=3,
|
| 45 |
+
stage_loss_weights=[1, 0.5, 0.25],
|
| 46 |
+
bbox_roi_extractor=dict(
|
| 47 |
+
type='SingleRoIExtractor',
|
| 48 |
+
roi_layer=dict(type='RoIAlign', output_size=7, sampling_ratio=0),
|
| 49 |
+
out_channels=256,
|
| 50 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 51 |
+
bbox_head=[
|
| 52 |
+
dict(
|
| 53 |
+
type='ConvFCBBoxHead',
|
| 54 |
+
num_shared_convs=4,
|
| 55 |
+
num_shared_fcs=1,
|
| 56 |
+
in_channels=256,
|
| 57 |
+
conv_out_channels=256,
|
| 58 |
+
fc_out_channels=1024,
|
| 59 |
+
roi_feat_size=7,
|
| 60 |
+
num_classes=80,
|
| 61 |
+
bbox_coder=dict(
|
| 62 |
+
type='DeltaXYWHBBoxCoder',
|
| 63 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 64 |
+
target_stds=[0.1, 0.1, 0.2, 0.2]),
|
| 65 |
+
reg_class_agnostic=False,
|
| 66 |
+
reg_decoded_bbox=True,
|
| 67 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 68 |
+
loss_cls=dict(
|
| 69 |
+
type='CrossEntropyLoss',
|
| 70 |
+
use_sigmoid=False,
|
| 71 |
+
loss_weight=1.0),
|
| 72 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 73 |
+
dict(
|
| 74 |
+
type='ConvFCBBoxHead',
|
| 75 |
+
num_shared_convs=4,
|
| 76 |
+
num_shared_fcs=1,
|
| 77 |
+
in_channels=256,
|
| 78 |
+
conv_out_channels=256,
|
| 79 |
+
fc_out_channels=1024,
|
| 80 |
+
roi_feat_size=7,
|
| 81 |
+
num_classes=80,
|
| 82 |
+
bbox_coder=dict(
|
| 83 |
+
type='DeltaXYWHBBoxCoder',
|
| 84 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 85 |
+
target_stds=[0.05, 0.05, 0.1, 0.1]),
|
| 86 |
+
reg_class_agnostic=False,
|
| 87 |
+
reg_decoded_bbox=True,
|
| 88 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 89 |
+
loss_cls=dict(
|
| 90 |
+
type='CrossEntropyLoss',
|
| 91 |
+
use_sigmoid=False,
|
| 92 |
+
loss_weight=1.0),
|
| 93 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 94 |
+
dict(
|
| 95 |
+
type='ConvFCBBoxHead',
|
| 96 |
+
num_shared_convs=4,
|
| 97 |
+
num_shared_fcs=1,
|
| 98 |
+
in_channels=256,
|
| 99 |
+
conv_out_channels=256,
|
| 100 |
+
fc_out_channels=1024,
|
| 101 |
+
roi_feat_size=7,
|
| 102 |
+
num_classes=80,
|
| 103 |
+
bbox_coder=dict(
|
| 104 |
+
type='DeltaXYWHBBoxCoder',
|
| 105 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 106 |
+
target_stds=[0.033, 0.033, 0.067, 0.067]),
|
| 107 |
+
reg_class_agnostic=False,
|
| 108 |
+
reg_decoded_bbox=True,
|
| 109 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 110 |
+
loss_cls=dict(
|
| 111 |
+
type='CrossEntropyLoss',
|
| 112 |
+
use_sigmoid=False,
|
| 113 |
+
loss_weight=1.0),
|
| 114 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0))
|
| 115 |
+
],
|
| 116 |
+
mask_roi_extractor=dict(
|
| 117 |
+
type='SingleRoIExtractor',
|
| 118 |
+
roi_layer=dict(type='RoIAlign', output_size=14, sampling_ratio=0),
|
| 119 |
+
out_channels=256,
|
| 120 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 121 |
+
mask_head=dict(
|
| 122 |
+
type='FCNMaskHead',
|
| 123 |
+
num_convs=4,
|
| 124 |
+
in_channels=256,
|
| 125 |
+
conv_out_channels=256,
|
| 126 |
+
num_classes=80,
|
| 127 |
+
loss_mask=dict(
|
| 128 |
+
type='CrossEntropyLoss', use_mask=True, loss_weight=1.0))),
|
| 129 |
+
train_cfg=dict(
|
| 130 |
+
rpn=dict(
|
| 131 |
+
assigner=dict(
|
| 132 |
+
type='MaxIoUAssigner',
|
| 133 |
+
pos_iou_thr=0.7,
|
| 134 |
+
neg_iou_thr=0.3,
|
| 135 |
+
min_pos_iou=0.3,
|
| 136 |
+
match_low_quality=True,
|
| 137 |
+
ignore_iof_thr=-1),
|
| 138 |
+
sampler=dict(
|
| 139 |
+
type='RandomSampler',
|
| 140 |
+
num=256,
|
| 141 |
+
pos_fraction=0.5,
|
| 142 |
+
neg_pos_ub=-1,
|
| 143 |
+
add_gt_as_proposals=False),
|
| 144 |
+
allowed_border=0,
|
| 145 |
+
pos_weight=-1,
|
| 146 |
+
debug=False),
|
| 147 |
+
rpn_proposal=dict(
|
| 148 |
+
nms_across_levels=False,
|
| 149 |
+
nms_pre=2000,
|
| 150 |
+
nms_post=2000,
|
| 151 |
+
max_per_img=2000,
|
| 152 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 153 |
+
min_bbox_size=0),
|
| 154 |
+
rcnn=[
|
| 155 |
+
dict(
|
| 156 |
+
assigner=dict(
|
| 157 |
+
type='MaxIoUAssigner',
|
| 158 |
+
pos_iou_thr=0.5,
|
| 159 |
+
neg_iou_thr=0.5,
|
| 160 |
+
min_pos_iou=0.5,
|
| 161 |
+
match_low_quality=False,
|
| 162 |
+
ignore_iof_thr=-1),
|
| 163 |
+
sampler=dict(
|
| 164 |
+
type='RandomSampler',
|
| 165 |
+
num=512,
|
| 166 |
+
pos_fraction=0.25,
|
| 167 |
+
neg_pos_ub=-1,
|
| 168 |
+
add_gt_as_proposals=True),
|
| 169 |
+
mask_size=28,
|
| 170 |
+
pos_weight=-1,
|
| 171 |
+
debug=False),
|
| 172 |
+
dict(
|
| 173 |
+
assigner=dict(
|
| 174 |
+
type='MaxIoUAssigner',
|
| 175 |
+
pos_iou_thr=0.6,
|
| 176 |
+
neg_iou_thr=0.6,
|
| 177 |
+
min_pos_iou=0.6,
|
| 178 |
+
match_low_quality=False,
|
| 179 |
+
ignore_iof_thr=-1),
|
| 180 |
+
sampler=dict(
|
| 181 |
+
type='RandomSampler',
|
| 182 |
+
num=512,
|
| 183 |
+
pos_fraction=0.25,
|
| 184 |
+
neg_pos_ub=-1,
|
| 185 |
+
add_gt_as_proposals=True),
|
| 186 |
+
mask_size=28,
|
| 187 |
+
pos_weight=-1,
|
| 188 |
+
debug=False),
|
| 189 |
+
dict(
|
| 190 |
+
assigner=dict(
|
| 191 |
+
type='MaxIoUAssigner',
|
| 192 |
+
pos_iou_thr=0.7,
|
| 193 |
+
neg_iou_thr=0.7,
|
| 194 |
+
min_pos_iou=0.7,
|
| 195 |
+
match_low_quality=False,
|
| 196 |
+
ignore_iof_thr=-1),
|
| 197 |
+
sampler=dict(
|
| 198 |
+
type='RandomSampler',
|
| 199 |
+
num=512,
|
| 200 |
+
pos_fraction=0.25,
|
| 201 |
+
neg_pos_ub=-1,
|
| 202 |
+
add_gt_as_proposals=True),
|
| 203 |
+
mask_size=28,
|
| 204 |
+
pos_weight=-1,
|
| 205 |
+
debug=False)
|
| 206 |
+
]),
|
| 207 |
+
test_cfg=dict(
|
| 208 |
+
rpn=dict(
|
| 209 |
+
nms_across_levels=False,
|
| 210 |
+
nms_pre=1000,
|
| 211 |
+
nms_post=1000,
|
| 212 |
+
max_per_img=1000,
|
| 213 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 214 |
+
min_bbox_size=0),
|
| 215 |
+
rcnn=dict(
|
| 216 |
+
score_thr=0.05,
|
| 217 |
+
nms=dict(type='nms', iou_threshold=0.5),
|
| 218 |
+
max_per_img=100,
|
| 219 |
+
mask_thr_binary=0.5)))
|
| 220 |
+
dataset_type = 'CocoDataset'
|
| 221 |
+
data_root = '/root/autodl-tmp/COCO2017/'
|
| 222 |
+
img_norm_cfg = dict(
|
| 223 |
+
mean=[123.675, 116.28, 103.53], std=[58.395, 57.12, 57.375], to_rgb=True)
|
| 224 |
+
train_pipeline = [
|
| 225 |
+
dict(type='LoadImageFromFile'),
|
| 226 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 227 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 228 |
+
dict(
|
| 229 |
+
type='AutoAugment',
|
| 230 |
+
policies=[[{
|
| 231 |
+
'type':
|
| 232 |
+
'Resize',
|
| 233 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333), (576, 1333),
|
| 234 |
+
(608, 1333), (640, 1333), (672, 1333), (704, 1333),
|
| 235 |
+
(736, 1333), (768, 1333), (800, 1333)],
|
| 236 |
+
'multiscale_mode':
|
| 237 |
+
'value',
|
| 238 |
+
'keep_ratio':
|
| 239 |
+
True
|
| 240 |
+
}],
|
| 241 |
+
[{
|
| 242 |
+
'type': 'Resize',
|
| 243 |
+
'img_scale': [(400, 1333), (500, 1333), (600, 1333)],
|
| 244 |
+
'multiscale_mode': 'value',
|
| 245 |
+
'keep_ratio': True
|
| 246 |
+
}, {
|
| 247 |
+
'type': 'RandomCrop',
|
| 248 |
+
'crop_type': 'absolute_range',
|
| 249 |
+
'crop_size': (384, 600),
|
| 250 |
+
'allow_negative_crop': True
|
| 251 |
+
}, {
|
| 252 |
+
'type':
|
| 253 |
+
'Resize',
|
| 254 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 255 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 256 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 257 |
+
(768, 1333), (800, 1333)],
|
| 258 |
+
'multiscale_mode':
|
| 259 |
+
'value',
|
| 260 |
+
'override':
|
| 261 |
+
True,
|
| 262 |
+
'keep_ratio':
|
| 263 |
+
True
|
| 264 |
+
}]]),
|
| 265 |
+
dict(
|
| 266 |
+
type='Normalize',
|
| 267 |
+
mean=[123.675, 116.28, 103.53],
|
| 268 |
+
std=[58.395, 57.12, 57.375],
|
| 269 |
+
to_rgb=True),
|
| 270 |
+
dict(type='Pad', size_divisor=32),
|
| 271 |
+
dict(type='DefaultFormatBundle'),
|
| 272 |
+
dict(type='Collect', keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 273 |
+
]
|
| 274 |
+
test_pipeline = [
|
| 275 |
+
dict(type='LoadImageFromFile'),
|
| 276 |
+
dict(
|
| 277 |
+
type='MultiScaleFlipAug',
|
| 278 |
+
img_scale=(1333, 800),
|
| 279 |
+
flip=False,
|
| 280 |
+
transforms=[
|
| 281 |
+
dict(type='Resize', keep_ratio=True),
|
| 282 |
+
dict(type='RandomFlip'),
|
| 283 |
+
dict(
|
| 284 |
+
type='Normalize',
|
| 285 |
+
mean=[123.675, 116.28, 103.53],
|
| 286 |
+
std=[58.395, 57.12, 57.375],
|
| 287 |
+
to_rgb=True),
|
| 288 |
+
dict(type='Pad', size_divisor=32),
|
| 289 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 290 |
+
dict(type='Collect', keys=['img'])
|
| 291 |
+
])
|
| 292 |
+
]
|
| 293 |
+
data = dict(
|
| 294 |
+
samples_per_gpu=2,
|
| 295 |
+
workers_per_gpu=4,
|
| 296 |
+
train=dict(
|
| 297 |
+
type='CocoDataset',
|
| 298 |
+
ann_file=
|
| 299 |
+
'/root/autodl-tmp/COCO2017/annotations/instances_train2017.json',
|
| 300 |
+
img_prefix='/root/autodl-tmp/COCO2017/train2017/',
|
| 301 |
+
pipeline=[
|
| 302 |
+
dict(type='LoadImageFromFile'),
|
| 303 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 304 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 305 |
+
dict(
|
| 306 |
+
type='AutoAugment',
|
| 307 |
+
policies=[[{
|
| 308 |
+
'type':
|
| 309 |
+
'Resize',
|
| 310 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 311 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 312 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 313 |
+
(768, 1333), (800, 1333)],
|
| 314 |
+
'multiscale_mode':
|
| 315 |
+
'value',
|
| 316 |
+
'keep_ratio':
|
| 317 |
+
True
|
| 318 |
+
}],
|
| 319 |
+
[{
|
| 320 |
+
'type': 'Resize',
|
| 321 |
+
'img_scale': [(400, 1333), (500, 1333),
|
| 322 |
+
(600, 1333)],
|
| 323 |
+
'multiscale_mode': 'value',
|
| 324 |
+
'keep_ratio': True
|
| 325 |
+
}, {
|
| 326 |
+
'type': 'RandomCrop',
|
| 327 |
+
'crop_type': 'absolute_range',
|
| 328 |
+
'crop_size': (384, 600),
|
| 329 |
+
'allow_negative_crop': True
|
| 330 |
+
}, {
|
| 331 |
+
'type':
|
| 332 |
+
'Resize',
|
| 333 |
+
'img_scale': [(480, 1333), (512, 1333),
|
| 334 |
+
(544, 1333), (576, 1333),
|
| 335 |
+
(608, 1333), (640, 1333),
|
| 336 |
+
(672, 1333), (704, 1333),
|
| 337 |
+
(736, 1333), (768, 1333),
|
| 338 |
+
(800, 1333)],
|
| 339 |
+
'multiscale_mode':
|
| 340 |
+
'value',
|
| 341 |
+
'override':
|
| 342 |
+
True,
|
| 343 |
+
'keep_ratio':
|
| 344 |
+
True
|
| 345 |
+
}]]),
|
| 346 |
+
dict(
|
| 347 |
+
type='Normalize',
|
| 348 |
+
mean=[123.675, 116.28, 103.53],
|
| 349 |
+
std=[58.395, 57.12, 57.375],
|
| 350 |
+
to_rgb=True),
|
| 351 |
+
dict(type='Pad', size_divisor=32),
|
| 352 |
+
dict(type='DefaultFormatBundle'),
|
| 353 |
+
dict(
|
| 354 |
+
type='Collect',
|
| 355 |
+
keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 356 |
+
]),
|
| 357 |
+
val=dict(
|
| 358 |
+
type='CocoDataset',
|
| 359 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 360 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 361 |
+
pipeline=[
|
| 362 |
+
dict(type='LoadImageFromFile'),
|
| 363 |
+
dict(
|
| 364 |
+
type='MultiScaleFlipAug',
|
| 365 |
+
img_scale=(1333, 800),
|
| 366 |
+
flip=False,
|
| 367 |
+
transforms=[
|
| 368 |
+
dict(type='Resize', keep_ratio=True),
|
| 369 |
+
dict(type='RandomFlip'),
|
| 370 |
+
dict(
|
| 371 |
+
type='Normalize',
|
| 372 |
+
mean=[123.675, 116.28, 103.53],
|
| 373 |
+
std=[58.395, 57.12, 57.375],
|
| 374 |
+
to_rgb=True),
|
| 375 |
+
dict(type='Pad', size_divisor=32),
|
| 376 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 377 |
+
dict(type='Collect', keys=['img'])
|
| 378 |
+
])
|
| 379 |
+
]),
|
| 380 |
+
test=dict(
|
| 381 |
+
type='CocoDataset',
|
| 382 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 383 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 384 |
+
pipeline=[
|
| 385 |
+
dict(type='LoadImageFromFile'),
|
| 386 |
+
dict(
|
| 387 |
+
type='MultiScaleFlipAug',
|
| 388 |
+
img_scale=(1333, 800),
|
| 389 |
+
flip=False,
|
| 390 |
+
transforms=[
|
| 391 |
+
dict(type='Resize', keep_ratio=True),
|
| 392 |
+
dict(type='RandomFlip'),
|
| 393 |
+
dict(
|
| 394 |
+
type='Normalize',
|
| 395 |
+
mean=[123.675, 116.28, 103.53],
|
| 396 |
+
std=[58.395, 57.12, 57.375],
|
| 397 |
+
to_rgb=True),
|
| 398 |
+
dict(type='Pad', size_divisor=32),
|
| 399 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 400 |
+
dict(type='Collect', keys=['img'])
|
| 401 |
+
])
|
| 402 |
+
]))
|
| 403 |
+
evaluation = dict(metric=['bbox', 'segm'], gpu_collect=True)
|
| 404 |
+
optimizer = dict(
|
| 405 |
+
type='AdamW',
|
| 406 |
+
lr=0.0001,
|
| 407 |
+
betas=(0.9, 0.999),
|
| 408 |
+
weight_decay=0.05,
|
| 409 |
+
paramwise_cfg=dict(
|
| 410 |
+
custom_keys=dict(
|
| 411 |
+
absolute_pos_embed=dict(decay_mult=0.0),
|
| 412 |
+
relative_position_bias_table=dict(decay_mult=0.0),
|
| 413 |
+
norm=dict(decay_mult=0.0))))
|
| 414 |
+
optimizer_config = dict(
|
| 415 |
+
grad_clip=None,
|
| 416 |
+
type='DistOptimizerHook',
|
| 417 |
+
update_interval=1,
|
| 418 |
+
coalesce=True,
|
| 419 |
+
bucket_size_mb=-1,
|
| 420 |
+
use_fp16=True)
|
| 421 |
+
lr_config = dict(
|
| 422 |
+
policy='step',
|
| 423 |
+
warmup='linear',
|
| 424 |
+
warmup_iters=500,
|
| 425 |
+
warmup_ratio=0.001,
|
| 426 |
+
step=[27, 33])
|
| 427 |
+
runner = dict(type='EpochBasedRunnerAmp', max_epochs=36)
|
| 428 |
+
checkpoint_config = dict(interval=1)
|
| 429 |
+
log_config = dict(interval=50, hooks=[dict(type='TextLoggerHook')])
|
| 430 |
+
custom_hooks = [dict(type='NumClassCheckHook')]
|
| 431 |
+
dist_params = dict(backend='nccl')
|
| 432 |
+
log_level = 'INFO'
|
| 433 |
+
load_from = '/root/autodl-tmp/caihaojie/mona/Swin-Transformer-Object-Detection/pretrained_model/swin_base_llama_moe_16.pth'
|
| 434 |
+
resume_from = None
|
| 435 |
+
workflow = [('train', 1)]
|
| 436 |
+
fp16 = None
|
| 437 |
+
work_dir = './results/train/llama_moe_4_16_1e-4/'
|
| 438 |
+
gpu_ids = range(0, 8)
|
mmdet/{cascade_mask_swin_base_3x_coco_sample_1_bs_16_lora → results/train/lora}/20250614_124757.log
RENAMED
|
File without changes
|
mmdet/results/train/lora/20250614_124757.log.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4f4154b2817468ae639a0543be385680c3b12df495a7ebf6d4c4993aa1c3fed9
|
| 3 |
+
size 2464645
|
mmdet/{cascade_mask_swin_base_3x_coco_sample_1_bs_16_lora → results/train/lora}/cascade_mask_swin_base_3x_coco_sample_1_bs_16_lora.py
RENAMED
|
File without changes
|
mmdet/results/train/lora/epoch_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aa6ec77aebcf19bbd0a6e33295ce386d23e36f0dcb058a248dc59cbec5198724
|
| 3 |
+
size 1083632016
|
mmdet/{cascade_mask_swin_base_3x_coco_sample_1_bs_16_lora → results/train/lora}/epoch_36.pth
RENAMED
|
File without changes
|
mmdet/results/train/lora/latest.pth
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
epoch_36.pth
|
mmdet/{cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona → results/train/mona}/20250610_212914.log
RENAMED
|
File without changes
|
mmdet/results/train/mona/20250610_212914.log.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5dfd7d6ae15d69d9a4bfd5e8981d2e23ddfa4e2f08b571d1234ef959dd3e199b
|
| 3 |
+
size 2464610
|
mmdet/{cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona → results/train/mona}/cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona.py
RENAMED
|
File without changes
|
mmdet/results/train/mona/epoch_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:461b1f6c667dedadb274c7d0ee73325e9a9ab95d8154229f27aa55b6a0ce0d05
|
| 3 |
+
size 1091645264
|
mmdet/{cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona → results/train/mona}/epoch_36.pth
RENAMED
|
File without changes
|
mmdet/results/train/mona/latest.pth
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
epoch_36.pth
|
mmdet/results/train/mona_llama_moe_2_8_1e-4/20250624_193305.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
mmdet/results/train/mona_llama_moe_2_8_1e-4/20250624_193305.log.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df9f821c5849c1ae8fa751f96350ae042c14db37198350243b46111ce1c73ca1
|
| 3 |
+
size 2595560
|
mmdet/results/train/mona_llama_moe_2_8_1e-4/cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona_llama_moe.py
ADDED
|
@@ -0,0 +1,438 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
model = dict(
|
| 2 |
+
type='CascadeRCNN_loss',
|
| 3 |
+
pretrained=None,
|
| 4 |
+
backbone=dict(
|
| 5 |
+
type='SwinTransformer_mona_llama_moe',
|
| 6 |
+
embed_dim=128,
|
| 7 |
+
depths=[2, 2, 18, 2],
|
| 8 |
+
num_heads=[4, 8, 16, 32],
|
| 9 |
+
window_size=7,
|
| 10 |
+
mlp_ratio=4.0,
|
| 11 |
+
qkv_bias=True,
|
| 12 |
+
qk_scale=None,
|
| 13 |
+
drop_rate=0.0,
|
| 14 |
+
attn_drop_rate=0.0,
|
| 15 |
+
drop_path_rate=0.3,
|
| 16 |
+
ape=False,
|
| 17 |
+
patch_norm=True,
|
| 18 |
+
out_indices=(0, 1, 2, 3),
|
| 19 |
+
use_checkpoint=False),
|
| 20 |
+
neck=dict(
|
| 21 |
+
type='FPN',
|
| 22 |
+
in_channels=[128, 256, 512, 1024],
|
| 23 |
+
out_channels=256,
|
| 24 |
+
num_outs=5),
|
| 25 |
+
rpn_head=dict(
|
| 26 |
+
type='RPNHead',
|
| 27 |
+
in_channels=256,
|
| 28 |
+
feat_channels=256,
|
| 29 |
+
anchor_generator=dict(
|
| 30 |
+
type='AnchorGenerator',
|
| 31 |
+
scales=[8],
|
| 32 |
+
ratios=[0.5, 1.0, 2.0],
|
| 33 |
+
strides=[4, 8, 16, 32, 64]),
|
| 34 |
+
bbox_coder=dict(
|
| 35 |
+
type='DeltaXYWHBBoxCoder',
|
| 36 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 37 |
+
target_stds=[1.0, 1.0, 1.0, 1.0]),
|
| 38 |
+
loss_cls=dict(
|
| 39 |
+
type='CrossEntropyLoss', use_sigmoid=True, loss_weight=1.0),
|
| 40 |
+
loss_bbox=dict(
|
| 41 |
+
type='SmoothL1Loss', beta=0.1111111111111111, loss_weight=1.0)),
|
| 42 |
+
roi_head=dict(
|
| 43 |
+
type='CascadeRoIHead',
|
| 44 |
+
num_stages=3,
|
| 45 |
+
stage_loss_weights=[1, 0.5, 0.25],
|
| 46 |
+
bbox_roi_extractor=dict(
|
| 47 |
+
type='SingleRoIExtractor',
|
| 48 |
+
roi_layer=dict(type='RoIAlign', output_size=7, sampling_ratio=0),
|
| 49 |
+
out_channels=256,
|
| 50 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 51 |
+
bbox_head=[
|
| 52 |
+
dict(
|
| 53 |
+
type='ConvFCBBoxHead',
|
| 54 |
+
num_shared_convs=4,
|
| 55 |
+
num_shared_fcs=1,
|
| 56 |
+
in_channels=256,
|
| 57 |
+
conv_out_channels=256,
|
| 58 |
+
fc_out_channels=1024,
|
| 59 |
+
roi_feat_size=7,
|
| 60 |
+
num_classes=80,
|
| 61 |
+
bbox_coder=dict(
|
| 62 |
+
type='DeltaXYWHBBoxCoder',
|
| 63 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 64 |
+
target_stds=[0.1, 0.1, 0.2, 0.2]),
|
| 65 |
+
reg_class_agnostic=False,
|
| 66 |
+
reg_decoded_bbox=True,
|
| 67 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 68 |
+
loss_cls=dict(
|
| 69 |
+
type='CrossEntropyLoss',
|
| 70 |
+
use_sigmoid=False,
|
| 71 |
+
loss_weight=1.0),
|
| 72 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 73 |
+
dict(
|
| 74 |
+
type='ConvFCBBoxHead',
|
| 75 |
+
num_shared_convs=4,
|
| 76 |
+
num_shared_fcs=1,
|
| 77 |
+
in_channels=256,
|
| 78 |
+
conv_out_channels=256,
|
| 79 |
+
fc_out_channels=1024,
|
| 80 |
+
roi_feat_size=7,
|
| 81 |
+
num_classes=80,
|
| 82 |
+
bbox_coder=dict(
|
| 83 |
+
type='DeltaXYWHBBoxCoder',
|
| 84 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 85 |
+
target_stds=[0.05, 0.05, 0.1, 0.1]),
|
| 86 |
+
reg_class_agnostic=False,
|
| 87 |
+
reg_decoded_bbox=True,
|
| 88 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 89 |
+
loss_cls=dict(
|
| 90 |
+
type='CrossEntropyLoss',
|
| 91 |
+
use_sigmoid=False,
|
| 92 |
+
loss_weight=1.0),
|
| 93 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 94 |
+
dict(
|
| 95 |
+
type='ConvFCBBoxHead',
|
| 96 |
+
num_shared_convs=4,
|
| 97 |
+
num_shared_fcs=1,
|
| 98 |
+
in_channels=256,
|
| 99 |
+
conv_out_channels=256,
|
| 100 |
+
fc_out_channels=1024,
|
| 101 |
+
roi_feat_size=7,
|
| 102 |
+
num_classes=80,
|
| 103 |
+
bbox_coder=dict(
|
| 104 |
+
type='DeltaXYWHBBoxCoder',
|
| 105 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 106 |
+
target_stds=[0.033, 0.033, 0.067, 0.067]),
|
| 107 |
+
reg_class_agnostic=False,
|
| 108 |
+
reg_decoded_bbox=True,
|
| 109 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 110 |
+
loss_cls=dict(
|
| 111 |
+
type='CrossEntropyLoss',
|
| 112 |
+
use_sigmoid=False,
|
| 113 |
+
loss_weight=1.0),
|
| 114 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0))
|
| 115 |
+
],
|
| 116 |
+
mask_roi_extractor=dict(
|
| 117 |
+
type='SingleRoIExtractor',
|
| 118 |
+
roi_layer=dict(type='RoIAlign', output_size=14, sampling_ratio=0),
|
| 119 |
+
out_channels=256,
|
| 120 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 121 |
+
mask_head=dict(
|
| 122 |
+
type='FCNMaskHead',
|
| 123 |
+
num_convs=4,
|
| 124 |
+
in_channels=256,
|
| 125 |
+
conv_out_channels=256,
|
| 126 |
+
num_classes=80,
|
| 127 |
+
loss_mask=dict(
|
| 128 |
+
type='CrossEntropyLoss', use_mask=True, loss_weight=1.0))),
|
| 129 |
+
train_cfg=dict(
|
| 130 |
+
rpn=dict(
|
| 131 |
+
assigner=dict(
|
| 132 |
+
type='MaxIoUAssigner',
|
| 133 |
+
pos_iou_thr=0.7,
|
| 134 |
+
neg_iou_thr=0.3,
|
| 135 |
+
min_pos_iou=0.3,
|
| 136 |
+
match_low_quality=True,
|
| 137 |
+
ignore_iof_thr=-1),
|
| 138 |
+
sampler=dict(
|
| 139 |
+
type='RandomSampler',
|
| 140 |
+
num=256,
|
| 141 |
+
pos_fraction=0.5,
|
| 142 |
+
neg_pos_ub=-1,
|
| 143 |
+
add_gt_as_proposals=False),
|
| 144 |
+
allowed_border=0,
|
| 145 |
+
pos_weight=-1,
|
| 146 |
+
debug=False),
|
| 147 |
+
rpn_proposal=dict(
|
| 148 |
+
nms_across_levels=False,
|
| 149 |
+
nms_pre=2000,
|
| 150 |
+
nms_post=2000,
|
| 151 |
+
max_per_img=2000,
|
| 152 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 153 |
+
min_bbox_size=0),
|
| 154 |
+
rcnn=[
|
| 155 |
+
dict(
|
| 156 |
+
assigner=dict(
|
| 157 |
+
type='MaxIoUAssigner',
|
| 158 |
+
pos_iou_thr=0.5,
|
| 159 |
+
neg_iou_thr=0.5,
|
| 160 |
+
min_pos_iou=0.5,
|
| 161 |
+
match_low_quality=False,
|
| 162 |
+
ignore_iof_thr=-1),
|
| 163 |
+
sampler=dict(
|
| 164 |
+
type='RandomSampler',
|
| 165 |
+
num=512,
|
| 166 |
+
pos_fraction=0.25,
|
| 167 |
+
neg_pos_ub=-1,
|
| 168 |
+
add_gt_as_proposals=True),
|
| 169 |
+
mask_size=28,
|
| 170 |
+
pos_weight=-1,
|
| 171 |
+
debug=False),
|
| 172 |
+
dict(
|
| 173 |
+
assigner=dict(
|
| 174 |
+
type='MaxIoUAssigner',
|
| 175 |
+
pos_iou_thr=0.6,
|
| 176 |
+
neg_iou_thr=0.6,
|
| 177 |
+
min_pos_iou=0.6,
|
| 178 |
+
match_low_quality=False,
|
| 179 |
+
ignore_iof_thr=-1),
|
| 180 |
+
sampler=dict(
|
| 181 |
+
type='RandomSampler',
|
| 182 |
+
num=512,
|
| 183 |
+
pos_fraction=0.25,
|
| 184 |
+
neg_pos_ub=-1,
|
| 185 |
+
add_gt_as_proposals=True),
|
| 186 |
+
mask_size=28,
|
| 187 |
+
pos_weight=-1,
|
| 188 |
+
debug=False),
|
| 189 |
+
dict(
|
| 190 |
+
assigner=dict(
|
| 191 |
+
type='MaxIoUAssigner',
|
| 192 |
+
pos_iou_thr=0.7,
|
| 193 |
+
neg_iou_thr=0.7,
|
| 194 |
+
min_pos_iou=0.7,
|
| 195 |
+
match_low_quality=False,
|
| 196 |
+
ignore_iof_thr=-1),
|
| 197 |
+
sampler=dict(
|
| 198 |
+
type='RandomSampler',
|
| 199 |
+
num=512,
|
| 200 |
+
pos_fraction=0.25,
|
| 201 |
+
neg_pos_ub=-1,
|
| 202 |
+
add_gt_as_proposals=True),
|
| 203 |
+
mask_size=28,
|
| 204 |
+
pos_weight=-1,
|
| 205 |
+
debug=False)
|
| 206 |
+
]),
|
| 207 |
+
test_cfg=dict(
|
| 208 |
+
rpn=dict(
|
| 209 |
+
nms_across_levels=False,
|
| 210 |
+
nms_pre=1000,
|
| 211 |
+
nms_post=1000,
|
| 212 |
+
max_per_img=1000,
|
| 213 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 214 |
+
min_bbox_size=0),
|
| 215 |
+
rcnn=dict(
|
| 216 |
+
score_thr=0.05,
|
| 217 |
+
nms=dict(type='nms', iou_threshold=0.5),
|
| 218 |
+
max_per_img=100,
|
| 219 |
+
mask_thr_binary=0.5)))
|
| 220 |
+
dataset_type = 'CocoDataset'
|
| 221 |
+
data_root = '/root/autodl-tmp/COCO2017/'
|
| 222 |
+
img_norm_cfg = dict(
|
| 223 |
+
mean=[123.675, 116.28, 103.53], std=[58.395, 57.12, 57.375], to_rgb=True)
|
| 224 |
+
train_pipeline = [
|
| 225 |
+
dict(type='LoadImageFromFile'),
|
| 226 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 227 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 228 |
+
dict(
|
| 229 |
+
type='AutoAugment',
|
| 230 |
+
policies=[[{
|
| 231 |
+
'type':
|
| 232 |
+
'Resize',
|
| 233 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333), (576, 1333),
|
| 234 |
+
(608, 1333), (640, 1333), (672, 1333), (704, 1333),
|
| 235 |
+
(736, 1333), (768, 1333), (800, 1333)],
|
| 236 |
+
'multiscale_mode':
|
| 237 |
+
'value',
|
| 238 |
+
'keep_ratio':
|
| 239 |
+
True
|
| 240 |
+
}],
|
| 241 |
+
[{
|
| 242 |
+
'type': 'Resize',
|
| 243 |
+
'img_scale': [(400, 1333), (500, 1333), (600, 1333)],
|
| 244 |
+
'multiscale_mode': 'value',
|
| 245 |
+
'keep_ratio': True
|
| 246 |
+
}, {
|
| 247 |
+
'type': 'RandomCrop',
|
| 248 |
+
'crop_type': 'absolute_range',
|
| 249 |
+
'crop_size': (384, 600),
|
| 250 |
+
'allow_negative_crop': True
|
| 251 |
+
}, {
|
| 252 |
+
'type':
|
| 253 |
+
'Resize',
|
| 254 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 255 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 256 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 257 |
+
(768, 1333), (800, 1333)],
|
| 258 |
+
'multiscale_mode':
|
| 259 |
+
'value',
|
| 260 |
+
'override':
|
| 261 |
+
True,
|
| 262 |
+
'keep_ratio':
|
| 263 |
+
True
|
| 264 |
+
}]]),
|
| 265 |
+
dict(
|
| 266 |
+
type='Normalize',
|
| 267 |
+
mean=[123.675, 116.28, 103.53],
|
| 268 |
+
std=[58.395, 57.12, 57.375],
|
| 269 |
+
to_rgb=True),
|
| 270 |
+
dict(type='Pad', size_divisor=32),
|
| 271 |
+
dict(type='DefaultFormatBundle'),
|
| 272 |
+
dict(type='Collect', keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 273 |
+
]
|
| 274 |
+
test_pipeline = [
|
| 275 |
+
dict(type='LoadImageFromFile'),
|
| 276 |
+
dict(
|
| 277 |
+
type='MultiScaleFlipAug',
|
| 278 |
+
img_scale=(1333, 800),
|
| 279 |
+
flip=False,
|
| 280 |
+
transforms=[
|
| 281 |
+
dict(type='Resize', keep_ratio=True),
|
| 282 |
+
dict(type='RandomFlip'),
|
| 283 |
+
dict(
|
| 284 |
+
type='Normalize',
|
| 285 |
+
mean=[123.675, 116.28, 103.53],
|
| 286 |
+
std=[58.395, 57.12, 57.375],
|
| 287 |
+
to_rgb=True),
|
| 288 |
+
dict(type='Pad', size_divisor=32),
|
| 289 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 290 |
+
dict(type='Collect', keys=['img'])
|
| 291 |
+
])
|
| 292 |
+
]
|
| 293 |
+
data = dict(
|
| 294 |
+
samples_per_gpu=2,
|
| 295 |
+
workers_per_gpu=4,
|
| 296 |
+
train=dict(
|
| 297 |
+
type='CocoDataset',
|
| 298 |
+
ann_file=
|
| 299 |
+
'/root/autodl-tmp/COCO2017/annotations/instances_train2017.json',
|
| 300 |
+
img_prefix='/root/autodl-tmp/COCO2017/train2017/',
|
| 301 |
+
pipeline=[
|
| 302 |
+
dict(type='LoadImageFromFile'),
|
| 303 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 304 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 305 |
+
dict(
|
| 306 |
+
type='AutoAugment',
|
| 307 |
+
policies=[[{
|
| 308 |
+
'type':
|
| 309 |
+
'Resize',
|
| 310 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 311 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 312 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 313 |
+
(768, 1333), (800, 1333)],
|
| 314 |
+
'multiscale_mode':
|
| 315 |
+
'value',
|
| 316 |
+
'keep_ratio':
|
| 317 |
+
True
|
| 318 |
+
}],
|
| 319 |
+
[{
|
| 320 |
+
'type': 'Resize',
|
| 321 |
+
'img_scale': [(400, 1333), (500, 1333),
|
| 322 |
+
(600, 1333)],
|
| 323 |
+
'multiscale_mode': 'value',
|
| 324 |
+
'keep_ratio': True
|
| 325 |
+
}, {
|
| 326 |
+
'type': 'RandomCrop',
|
| 327 |
+
'crop_type': 'absolute_range',
|
| 328 |
+
'crop_size': (384, 600),
|
| 329 |
+
'allow_negative_crop': True
|
| 330 |
+
}, {
|
| 331 |
+
'type':
|
| 332 |
+
'Resize',
|
| 333 |
+
'img_scale': [(480, 1333), (512, 1333),
|
| 334 |
+
(544, 1333), (576, 1333),
|
| 335 |
+
(608, 1333), (640, 1333),
|
| 336 |
+
(672, 1333), (704, 1333),
|
| 337 |
+
(736, 1333), (768, 1333),
|
| 338 |
+
(800, 1333)],
|
| 339 |
+
'multiscale_mode':
|
| 340 |
+
'value',
|
| 341 |
+
'override':
|
| 342 |
+
True,
|
| 343 |
+
'keep_ratio':
|
| 344 |
+
True
|
| 345 |
+
}]]),
|
| 346 |
+
dict(
|
| 347 |
+
type='Normalize',
|
| 348 |
+
mean=[123.675, 116.28, 103.53],
|
| 349 |
+
std=[58.395, 57.12, 57.375],
|
| 350 |
+
to_rgb=True),
|
| 351 |
+
dict(type='Pad', size_divisor=32),
|
| 352 |
+
dict(type='DefaultFormatBundle'),
|
| 353 |
+
dict(
|
| 354 |
+
type='Collect',
|
| 355 |
+
keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 356 |
+
]),
|
| 357 |
+
val=dict(
|
| 358 |
+
type='CocoDataset',
|
| 359 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 360 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 361 |
+
pipeline=[
|
| 362 |
+
dict(type='LoadImageFromFile'),
|
| 363 |
+
dict(
|
| 364 |
+
type='MultiScaleFlipAug',
|
| 365 |
+
img_scale=(1333, 800),
|
| 366 |
+
flip=False,
|
| 367 |
+
transforms=[
|
| 368 |
+
dict(type='Resize', keep_ratio=True),
|
| 369 |
+
dict(type='RandomFlip'),
|
| 370 |
+
dict(
|
| 371 |
+
type='Normalize',
|
| 372 |
+
mean=[123.675, 116.28, 103.53],
|
| 373 |
+
std=[58.395, 57.12, 57.375],
|
| 374 |
+
to_rgb=True),
|
| 375 |
+
dict(type='Pad', size_divisor=32),
|
| 376 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 377 |
+
dict(type='Collect', keys=['img'])
|
| 378 |
+
])
|
| 379 |
+
]),
|
| 380 |
+
test=dict(
|
| 381 |
+
type='CocoDataset',
|
| 382 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 383 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 384 |
+
pipeline=[
|
| 385 |
+
dict(type='LoadImageFromFile'),
|
| 386 |
+
dict(
|
| 387 |
+
type='MultiScaleFlipAug',
|
| 388 |
+
img_scale=(1333, 800),
|
| 389 |
+
flip=False,
|
| 390 |
+
transforms=[
|
| 391 |
+
dict(type='Resize', keep_ratio=True),
|
| 392 |
+
dict(type='RandomFlip'),
|
| 393 |
+
dict(
|
| 394 |
+
type='Normalize',
|
| 395 |
+
mean=[123.675, 116.28, 103.53],
|
| 396 |
+
std=[58.395, 57.12, 57.375],
|
| 397 |
+
to_rgb=True),
|
| 398 |
+
dict(type='Pad', size_divisor=32),
|
| 399 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 400 |
+
dict(type='Collect', keys=['img'])
|
| 401 |
+
])
|
| 402 |
+
]))
|
| 403 |
+
evaluation = dict(metric=['bbox', 'segm'], gpu_collect=True)
|
| 404 |
+
optimizer = dict(
|
| 405 |
+
type='AdamW',
|
| 406 |
+
lr=0.0001,
|
| 407 |
+
betas=(0.9, 0.999),
|
| 408 |
+
weight_decay=0.05,
|
| 409 |
+
paramwise_cfg=dict(
|
| 410 |
+
custom_keys=dict(
|
| 411 |
+
absolute_pos_embed=dict(decay_mult=0.0),
|
| 412 |
+
relative_position_bias_table=dict(decay_mult=0.0),
|
| 413 |
+
norm=dict(decay_mult=0.0))))
|
| 414 |
+
optimizer_config = dict(
|
| 415 |
+
grad_clip=None,
|
| 416 |
+
type='DistOptimizerHook',
|
| 417 |
+
update_interval=1,
|
| 418 |
+
coalesce=True,
|
| 419 |
+
bucket_size_mb=-1,
|
| 420 |
+
use_fp16=True)
|
| 421 |
+
lr_config = dict(
|
| 422 |
+
policy='step',
|
| 423 |
+
warmup='linear',
|
| 424 |
+
warmup_iters=500,
|
| 425 |
+
warmup_ratio=0.001,
|
| 426 |
+
step=[27, 33])
|
| 427 |
+
runner = dict(type='EpochBasedRunnerAmp', max_epochs=36)
|
| 428 |
+
checkpoint_config = dict(interval=1)
|
| 429 |
+
log_config = dict(interval=50, hooks=[dict(type='TextLoggerHook')])
|
| 430 |
+
custom_hooks = [dict(type='NumClassCheckHook')]
|
| 431 |
+
dist_params = dict(backend='nccl')
|
| 432 |
+
log_level = 'INFO'
|
| 433 |
+
load_from = '/root/autodl-tmp/caihaojie/mona/Swin-Transformer-Object-Detection/pretrained_model/swin_base_mona_llama_moe_8.pth'
|
| 434 |
+
resume_from = None
|
| 435 |
+
workflow = [('train', 1)]
|
| 436 |
+
fp16 = None
|
| 437 |
+
work_dir = './results/train/mona_llama_moe_2_8_1e-4/'
|
| 438 |
+
gpu_ids = range(0, 8)
|
mmdet/results/train/mona_llama_moe_2_8_1e-4/epoch_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce5ae42106a6cc130fa0b866985a0736e3da6ae3f57ad4cadce510106ac2b348
|
| 3 |
+
size 1512371920
|
mmdet/results/train/mona_llama_moe_2_8_1e-4/epoch_36.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:55b45bd3774399eab3a6938e1978f1dd2e99a59fa61ca0ffd0751c9e5d43c9b4
|
| 3 |
+
size 1512372112
|
mmdet/results/train/mona_llama_moe_2_8_1e-4/latest.pth
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
epoch_36.pth
|
mmdet/results/train/mona_llama_moe_5_8_1e-4/20250702_125523.log
ADDED
|
@@ -0,0 +1,613 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
2025-07-02 12:55:24,048 - mmdet - INFO - Environment info:
|
| 2 |
+
------------------------------------------------------------
|
| 3 |
+
sys.platform: linux
|
| 4 |
+
Python: 3.8.20 (default, Oct 3 2024, 15:24:27) [GCC 11.2.0]
|
| 5 |
+
CUDA available: True
|
| 6 |
+
GPU 0,1,2,3,4,5,6,7: NVIDIA GeForce RTX 4090
|
| 7 |
+
CUDA_HOME: /root/autodl-tmp/cuda/cuda-11.7
|
| 8 |
+
NVCC: Cuda compilation tools, release 11.7, V11.7.64
|
| 9 |
+
GCC: gcc (Ubuntu 9.4.0-1ubuntu1~20.04.1) 9.4.0
|
| 10 |
+
PyTorch: 1.13.1+cu117
|
| 11 |
+
PyTorch compiling details: PyTorch built with:
|
| 12 |
+
- GCC 9.3
|
| 13 |
+
- C++ Version: 201402
|
| 14 |
+
- Intel(R) Math Kernel Library Version 2020.0.0 Product Build 20191122 for Intel(R) 64 architecture applications
|
| 15 |
+
- Intel(R) MKL-DNN v2.6.0 (Git Hash 52b5f107dd9cf10910aaa19cb47f3abf9b349815)
|
| 16 |
+
- OpenMP 201511 (a.k.a. OpenMP 4.5)
|
| 17 |
+
- LAPACK is enabled (usually provided by MKL)
|
| 18 |
+
- NNPACK is enabled
|
| 19 |
+
- CPU capability usage: AVX2
|
| 20 |
+
- CUDA Runtime 11.7
|
| 21 |
+
- NVCC architecture flags: -gencode;arch=compute_37,code=sm_37;-gencode;arch=compute_50,code=sm_50;-gencode;arch=compute_60,code=sm_60;-gencode;arch=compute_70,code=sm_70;-gencode;arch=compute_75,code=sm_75;-gencode;arch=compute_80,code=sm_80;-gencode;arch=compute_86,code=sm_86
|
| 22 |
+
- CuDNN 8.5
|
| 23 |
+
- Magma 2.6.1
|
| 24 |
+
- Build settings: BLAS_INFO=mkl, BUILD_TYPE=Release, CUDA_VERSION=11.7, CUDNN_VERSION=8.5.0, CXX_COMPILER=/opt/rh/devtoolset-9/root/usr/bin/c++, CXX_FLAGS= -fabi-version=11 -Wno-deprecated -fvisibility-inlines-hidden -DUSE_PTHREADPOOL -fopenmp -DNDEBUG -DUSE_KINETO -DUSE_FBGEMM -DUSE_QNNPACK -DUSE_PYTORCH_QNNPACK -DUSE_XNNPACK -DSYMBOLICATE_MOBILE_DEBUG_HANDLE -DEDGE_PROFILER_USE_KINETO -O2 -fPIC -Wno-narrowing -Wall -Wextra -Werror=return-type -Werror=non-virtual-dtor -Wno-missing-field-initializers -Wno-type-limits -Wno-array-bounds -Wno-unknown-pragmas -Wunused-local-typedefs -Wno-unused-parameter -Wno-unused-function -Wno-unused-result -Wno-strict-overflow -Wno-strict-aliasing -Wno-error=deprecated-declarations -Wno-stringop-overflow -Wno-psabi -Wno-error=pedantic -Wno-error=redundant-decls -Wno-error=old-style-cast -fdiagnostics-color=always -faligned-new -Wno-unused-but-set-variable -Wno-maybe-uninitialized -fno-math-errno -fno-trapping-math -Werror=format -Werror=cast-function-type -Wno-stringop-overflow, LAPACK_INFO=mkl, PERF_WITH_AVX=1, PERF_WITH_AVX2=1, PERF_WITH_AVX512=1, TORCH_VERSION=1.13.1, USE_CUDA=ON, USE_CUDNN=ON, USE_EXCEPTION_PTR=1, USE_GFLAGS=OFF, USE_GLOG=OFF, USE_MKL=ON, USE_MKLDNN=ON, USE_MPI=OFF, USE_NCCL=ON, USE_NNPACK=ON, USE_OPENMP=ON, USE_ROCM=OFF,
|
| 25 |
+
|
| 26 |
+
TorchVision: 0.14.1+cu117
|
| 27 |
+
OpenCV: 4.11.0
|
| 28 |
+
MMCV: 1.7.2
|
| 29 |
+
MMCV Compiler: GCC 9.3
|
| 30 |
+
MMCV CUDA Compiler: 11.7
|
| 31 |
+
MMDetection: 2.11.0+9022e00
|
| 32 |
+
------------------------------------------------------------
|
| 33 |
+
|
| 34 |
+
2025-07-02 12:55:27,575 - mmdet - INFO - Distributed training: True
|
| 35 |
+
2025-07-02 12:55:30,976 - mmdet - INFO - Config:
|
| 36 |
+
model = dict(
|
| 37 |
+
type='CascadeRCNN_loss',
|
| 38 |
+
pretrained=None,
|
| 39 |
+
backbone=dict(
|
| 40 |
+
type='SwinTransformer_mona_llama_moe',
|
| 41 |
+
embed_dim=128,
|
| 42 |
+
depths=[2, 2, 18, 2],
|
| 43 |
+
num_heads=[4, 8, 16, 32],
|
| 44 |
+
window_size=7,
|
| 45 |
+
mlp_ratio=4.0,
|
| 46 |
+
qkv_bias=True,
|
| 47 |
+
qk_scale=None,
|
| 48 |
+
drop_rate=0.0,
|
| 49 |
+
attn_drop_rate=0.0,
|
| 50 |
+
drop_path_rate=0.3,
|
| 51 |
+
ape=False,
|
| 52 |
+
patch_norm=True,
|
| 53 |
+
out_indices=(0, 1, 2, 3),
|
| 54 |
+
use_checkpoint=False),
|
| 55 |
+
neck=dict(
|
| 56 |
+
type='FPN',
|
| 57 |
+
in_channels=[128, 256, 512, 1024],
|
| 58 |
+
out_channels=256,
|
| 59 |
+
num_outs=5),
|
| 60 |
+
rpn_head=dict(
|
| 61 |
+
type='RPNHead',
|
| 62 |
+
in_channels=256,
|
| 63 |
+
feat_channels=256,
|
| 64 |
+
anchor_generator=dict(
|
| 65 |
+
type='AnchorGenerator',
|
| 66 |
+
scales=[8],
|
| 67 |
+
ratios=[0.5, 1.0, 2.0],
|
| 68 |
+
strides=[4, 8, 16, 32, 64]),
|
| 69 |
+
bbox_coder=dict(
|
| 70 |
+
type='DeltaXYWHBBoxCoder',
|
| 71 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 72 |
+
target_stds=[1.0, 1.0, 1.0, 1.0]),
|
| 73 |
+
loss_cls=dict(
|
| 74 |
+
type='CrossEntropyLoss', use_sigmoid=True, loss_weight=1.0),
|
| 75 |
+
loss_bbox=dict(
|
| 76 |
+
type='SmoothL1Loss', beta=0.1111111111111111, loss_weight=1.0)),
|
| 77 |
+
roi_head=dict(
|
| 78 |
+
type='CascadeRoIHead',
|
| 79 |
+
num_stages=3,
|
| 80 |
+
stage_loss_weights=[1, 0.5, 0.25],
|
| 81 |
+
bbox_roi_extractor=dict(
|
| 82 |
+
type='SingleRoIExtractor',
|
| 83 |
+
roi_layer=dict(type='RoIAlign', output_size=7, sampling_ratio=0),
|
| 84 |
+
out_channels=256,
|
| 85 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 86 |
+
bbox_head=[
|
| 87 |
+
dict(
|
| 88 |
+
type='ConvFCBBoxHead',
|
| 89 |
+
num_shared_convs=4,
|
| 90 |
+
num_shared_fcs=1,
|
| 91 |
+
in_channels=256,
|
| 92 |
+
conv_out_channels=256,
|
| 93 |
+
fc_out_channels=1024,
|
| 94 |
+
roi_feat_size=7,
|
| 95 |
+
num_classes=80,
|
| 96 |
+
bbox_coder=dict(
|
| 97 |
+
type='DeltaXYWHBBoxCoder',
|
| 98 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 99 |
+
target_stds=[0.1, 0.1, 0.2, 0.2]),
|
| 100 |
+
reg_class_agnostic=False,
|
| 101 |
+
reg_decoded_bbox=True,
|
| 102 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 103 |
+
loss_cls=dict(
|
| 104 |
+
type='CrossEntropyLoss',
|
| 105 |
+
use_sigmoid=False,
|
| 106 |
+
loss_weight=1.0),
|
| 107 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 108 |
+
dict(
|
| 109 |
+
type='ConvFCBBoxHead',
|
| 110 |
+
num_shared_convs=4,
|
| 111 |
+
num_shared_fcs=1,
|
| 112 |
+
in_channels=256,
|
| 113 |
+
conv_out_channels=256,
|
| 114 |
+
fc_out_channels=1024,
|
| 115 |
+
roi_feat_size=7,
|
| 116 |
+
num_classes=80,
|
| 117 |
+
bbox_coder=dict(
|
| 118 |
+
type='DeltaXYWHBBoxCoder',
|
| 119 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 120 |
+
target_stds=[0.05, 0.05, 0.1, 0.1]),
|
| 121 |
+
reg_class_agnostic=False,
|
| 122 |
+
reg_decoded_bbox=True,
|
| 123 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 124 |
+
loss_cls=dict(
|
| 125 |
+
type='CrossEntropyLoss',
|
| 126 |
+
use_sigmoid=False,
|
| 127 |
+
loss_weight=1.0),
|
| 128 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 129 |
+
dict(
|
| 130 |
+
type='ConvFCBBoxHead',
|
| 131 |
+
num_shared_convs=4,
|
| 132 |
+
num_shared_fcs=1,
|
| 133 |
+
in_channels=256,
|
| 134 |
+
conv_out_channels=256,
|
| 135 |
+
fc_out_channels=1024,
|
| 136 |
+
roi_feat_size=7,
|
| 137 |
+
num_classes=80,
|
| 138 |
+
bbox_coder=dict(
|
| 139 |
+
type='DeltaXYWHBBoxCoder',
|
| 140 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 141 |
+
target_stds=[0.033, 0.033, 0.067, 0.067]),
|
| 142 |
+
reg_class_agnostic=False,
|
| 143 |
+
reg_decoded_bbox=True,
|
| 144 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 145 |
+
loss_cls=dict(
|
| 146 |
+
type='CrossEntropyLoss',
|
| 147 |
+
use_sigmoid=False,
|
| 148 |
+
loss_weight=1.0),
|
| 149 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0))
|
| 150 |
+
],
|
| 151 |
+
mask_roi_extractor=dict(
|
| 152 |
+
type='SingleRoIExtractor',
|
| 153 |
+
roi_layer=dict(type='RoIAlign', output_size=14, sampling_ratio=0),
|
| 154 |
+
out_channels=256,
|
| 155 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 156 |
+
mask_head=dict(
|
| 157 |
+
type='FCNMaskHead',
|
| 158 |
+
num_convs=4,
|
| 159 |
+
in_channels=256,
|
| 160 |
+
conv_out_channels=256,
|
| 161 |
+
num_classes=80,
|
| 162 |
+
loss_mask=dict(
|
| 163 |
+
type='CrossEntropyLoss', use_mask=True, loss_weight=1.0))),
|
| 164 |
+
train_cfg=dict(
|
| 165 |
+
rpn=dict(
|
| 166 |
+
assigner=dict(
|
| 167 |
+
type='MaxIoUAssigner',
|
| 168 |
+
pos_iou_thr=0.7,
|
| 169 |
+
neg_iou_thr=0.3,
|
| 170 |
+
min_pos_iou=0.3,
|
| 171 |
+
match_low_quality=True,
|
| 172 |
+
ignore_iof_thr=-1),
|
| 173 |
+
sampler=dict(
|
| 174 |
+
type='RandomSampler',
|
| 175 |
+
num=256,
|
| 176 |
+
pos_fraction=0.5,
|
| 177 |
+
neg_pos_ub=-1,
|
| 178 |
+
add_gt_as_proposals=False),
|
| 179 |
+
allowed_border=0,
|
| 180 |
+
pos_weight=-1,
|
| 181 |
+
debug=False),
|
| 182 |
+
rpn_proposal=dict(
|
| 183 |
+
nms_across_levels=False,
|
| 184 |
+
nms_pre=2000,
|
| 185 |
+
nms_post=2000,
|
| 186 |
+
max_per_img=2000,
|
| 187 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 188 |
+
min_bbox_size=0),
|
| 189 |
+
rcnn=[
|
| 190 |
+
dict(
|
| 191 |
+
assigner=dict(
|
| 192 |
+
type='MaxIoUAssigner',
|
| 193 |
+
pos_iou_thr=0.5,
|
| 194 |
+
neg_iou_thr=0.5,
|
| 195 |
+
min_pos_iou=0.5,
|
| 196 |
+
match_low_quality=False,
|
| 197 |
+
ignore_iof_thr=-1),
|
| 198 |
+
sampler=dict(
|
| 199 |
+
type='RandomSampler',
|
| 200 |
+
num=512,
|
| 201 |
+
pos_fraction=0.25,
|
| 202 |
+
neg_pos_ub=-1,
|
| 203 |
+
add_gt_as_proposals=True),
|
| 204 |
+
mask_size=28,
|
| 205 |
+
pos_weight=-1,
|
| 206 |
+
debug=False),
|
| 207 |
+
dict(
|
| 208 |
+
assigner=dict(
|
| 209 |
+
type='MaxIoUAssigner',
|
| 210 |
+
pos_iou_thr=0.6,
|
| 211 |
+
neg_iou_thr=0.6,
|
| 212 |
+
min_pos_iou=0.6,
|
| 213 |
+
match_low_quality=False,
|
| 214 |
+
ignore_iof_thr=-1),
|
| 215 |
+
sampler=dict(
|
| 216 |
+
type='RandomSampler',
|
| 217 |
+
num=512,
|
| 218 |
+
pos_fraction=0.25,
|
| 219 |
+
neg_pos_ub=-1,
|
| 220 |
+
add_gt_as_proposals=True),
|
| 221 |
+
mask_size=28,
|
| 222 |
+
pos_weight=-1,
|
| 223 |
+
debug=False),
|
| 224 |
+
dict(
|
| 225 |
+
assigner=dict(
|
| 226 |
+
type='MaxIoUAssigner',
|
| 227 |
+
pos_iou_thr=0.7,
|
| 228 |
+
neg_iou_thr=0.7,
|
| 229 |
+
min_pos_iou=0.7,
|
| 230 |
+
match_low_quality=False,
|
| 231 |
+
ignore_iof_thr=-1),
|
| 232 |
+
sampler=dict(
|
| 233 |
+
type='RandomSampler',
|
| 234 |
+
num=512,
|
| 235 |
+
pos_fraction=0.25,
|
| 236 |
+
neg_pos_ub=-1,
|
| 237 |
+
add_gt_as_proposals=True),
|
| 238 |
+
mask_size=28,
|
| 239 |
+
pos_weight=-1,
|
| 240 |
+
debug=False)
|
| 241 |
+
]),
|
| 242 |
+
test_cfg=dict(
|
| 243 |
+
rpn=dict(
|
| 244 |
+
nms_across_levels=False,
|
| 245 |
+
nms_pre=1000,
|
| 246 |
+
nms_post=1000,
|
| 247 |
+
max_per_img=1000,
|
| 248 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 249 |
+
min_bbox_size=0),
|
| 250 |
+
rcnn=dict(
|
| 251 |
+
score_thr=0.05,
|
| 252 |
+
nms=dict(type='nms', iou_threshold=0.5),
|
| 253 |
+
max_per_img=100,
|
| 254 |
+
mask_thr_binary=0.5)))
|
| 255 |
+
dataset_type = 'CocoDataset'
|
| 256 |
+
data_root = '/root/autodl-tmp/COCO2017/'
|
| 257 |
+
img_norm_cfg = dict(
|
| 258 |
+
mean=[123.675, 116.28, 103.53], std=[58.395, 57.12, 57.375], to_rgb=True)
|
| 259 |
+
train_pipeline = [
|
| 260 |
+
dict(type='LoadImageFromFile'),
|
| 261 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 262 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 263 |
+
dict(
|
| 264 |
+
type='AutoAugment',
|
| 265 |
+
policies=[[{
|
| 266 |
+
'type':
|
| 267 |
+
'Resize',
|
| 268 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333), (576, 1333),
|
| 269 |
+
(608, 1333), (640, 1333), (672, 1333), (704, 1333),
|
| 270 |
+
(736, 1333), (768, 1333), (800, 1333)],
|
| 271 |
+
'multiscale_mode':
|
| 272 |
+
'value',
|
| 273 |
+
'keep_ratio':
|
| 274 |
+
True
|
| 275 |
+
}],
|
| 276 |
+
[{
|
| 277 |
+
'type': 'Resize',
|
| 278 |
+
'img_scale': [(400, 1333), (500, 1333), (600, 1333)],
|
| 279 |
+
'multiscale_mode': 'value',
|
| 280 |
+
'keep_ratio': True
|
| 281 |
+
}, {
|
| 282 |
+
'type': 'RandomCrop',
|
| 283 |
+
'crop_type': 'absolute_range',
|
| 284 |
+
'crop_size': (384, 600),
|
| 285 |
+
'allow_negative_crop': True
|
| 286 |
+
}, {
|
| 287 |
+
'type':
|
| 288 |
+
'Resize',
|
| 289 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 290 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 291 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 292 |
+
(768, 1333), (800, 1333)],
|
| 293 |
+
'multiscale_mode':
|
| 294 |
+
'value',
|
| 295 |
+
'override':
|
| 296 |
+
True,
|
| 297 |
+
'keep_ratio':
|
| 298 |
+
True
|
| 299 |
+
}]]),
|
| 300 |
+
dict(
|
| 301 |
+
type='Normalize',
|
| 302 |
+
mean=[123.675, 116.28, 103.53],
|
| 303 |
+
std=[58.395, 57.12, 57.375],
|
| 304 |
+
to_rgb=True),
|
| 305 |
+
dict(type='Pad', size_divisor=32),
|
| 306 |
+
dict(type='DefaultFormatBundle'),
|
| 307 |
+
dict(type='Collect', keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 308 |
+
]
|
| 309 |
+
test_pipeline = [
|
| 310 |
+
dict(type='LoadImageFromFile'),
|
| 311 |
+
dict(
|
| 312 |
+
type='MultiScaleFlipAug',
|
| 313 |
+
img_scale=(1333, 800),
|
| 314 |
+
flip=False,
|
| 315 |
+
transforms=[
|
| 316 |
+
dict(type='Resize', keep_ratio=True),
|
| 317 |
+
dict(type='RandomFlip'),
|
| 318 |
+
dict(
|
| 319 |
+
type='Normalize',
|
| 320 |
+
mean=[123.675, 116.28, 103.53],
|
| 321 |
+
std=[58.395, 57.12, 57.375],
|
| 322 |
+
to_rgb=True),
|
| 323 |
+
dict(type='Pad', size_divisor=32),
|
| 324 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 325 |
+
dict(type='Collect', keys=['img'])
|
| 326 |
+
])
|
| 327 |
+
]
|
| 328 |
+
data = dict(
|
| 329 |
+
samples_per_gpu=2,
|
| 330 |
+
workers_per_gpu=4,
|
| 331 |
+
train=dict(
|
| 332 |
+
type='CocoDataset',
|
| 333 |
+
ann_file=
|
| 334 |
+
'/root/autodl-tmp/COCO2017/annotations/instances_train2017.json',
|
| 335 |
+
img_prefix='/root/autodl-tmp/COCO2017/train2017/',
|
| 336 |
+
pipeline=[
|
| 337 |
+
dict(type='LoadImageFromFile'),
|
| 338 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 339 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 340 |
+
dict(
|
| 341 |
+
type='AutoAugment',
|
| 342 |
+
policies=[[{
|
| 343 |
+
'type':
|
| 344 |
+
'Resize',
|
| 345 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 346 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 347 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 348 |
+
(768, 1333), (800, 1333)],
|
| 349 |
+
'multiscale_mode':
|
| 350 |
+
'value',
|
| 351 |
+
'keep_ratio':
|
| 352 |
+
True
|
| 353 |
+
}],
|
| 354 |
+
[{
|
| 355 |
+
'type': 'Resize',
|
| 356 |
+
'img_scale': [(400, 1333), (500, 1333),
|
| 357 |
+
(600, 1333)],
|
| 358 |
+
'multiscale_mode': 'value',
|
| 359 |
+
'keep_ratio': True
|
| 360 |
+
}, {
|
| 361 |
+
'type': 'RandomCrop',
|
| 362 |
+
'crop_type': 'absolute_range',
|
| 363 |
+
'crop_size': (384, 600),
|
| 364 |
+
'allow_negative_crop': True
|
| 365 |
+
}, {
|
| 366 |
+
'type':
|
| 367 |
+
'Resize',
|
| 368 |
+
'img_scale': [(480, 1333), (512, 1333),
|
| 369 |
+
(544, 1333), (576, 1333),
|
| 370 |
+
(608, 1333), (640, 1333),
|
| 371 |
+
(672, 1333), (704, 1333),
|
| 372 |
+
(736, 1333), (768, 1333),
|
| 373 |
+
(800, 1333)],
|
| 374 |
+
'multiscale_mode':
|
| 375 |
+
'value',
|
| 376 |
+
'override':
|
| 377 |
+
True,
|
| 378 |
+
'keep_ratio':
|
| 379 |
+
True
|
| 380 |
+
}]]),
|
| 381 |
+
dict(
|
| 382 |
+
type='Normalize',
|
| 383 |
+
mean=[123.675, 116.28, 103.53],
|
| 384 |
+
std=[58.395, 57.12, 57.375],
|
| 385 |
+
to_rgb=True),
|
| 386 |
+
dict(type='Pad', size_divisor=32),
|
| 387 |
+
dict(type='DefaultFormatBundle'),
|
| 388 |
+
dict(
|
| 389 |
+
type='Collect',
|
| 390 |
+
keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 391 |
+
]),
|
| 392 |
+
val=dict(
|
| 393 |
+
type='CocoDataset',
|
| 394 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 395 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 396 |
+
pipeline=[
|
| 397 |
+
dict(type='LoadImageFromFile'),
|
| 398 |
+
dict(
|
| 399 |
+
type='MultiScaleFlipAug',
|
| 400 |
+
img_scale=(1333, 800),
|
| 401 |
+
flip=False,
|
| 402 |
+
transforms=[
|
| 403 |
+
dict(type='Resize', keep_ratio=True),
|
| 404 |
+
dict(type='RandomFlip'),
|
| 405 |
+
dict(
|
| 406 |
+
type='Normalize',
|
| 407 |
+
mean=[123.675, 116.28, 103.53],
|
| 408 |
+
std=[58.395, 57.12, 57.375],
|
| 409 |
+
to_rgb=True),
|
| 410 |
+
dict(type='Pad', size_divisor=32),
|
| 411 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 412 |
+
dict(type='Collect', keys=['img'])
|
| 413 |
+
])
|
| 414 |
+
]),
|
| 415 |
+
test=dict(
|
| 416 |
+
type='CocoDataset',
|
| 417 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 418 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 419 |
+
pipeline=[
|
| 420 |
+
dict(type='LoadImageFromFile'),
|
| 421 |
+
dict(
|
| 422 |
+
type='MultiScaleFlipAug',
|
| 423 |
+
img_scale=(1333, 800),
|
| 424 |
+
flip=False,
|
| 425 |
+
transforms=[
|
| 426 |
+
dict(type='Resize', keep_ratio=True),
|
| 427 |
+
dict(type='RandomFlip'),
|
| 428 |
+
dict(
|
| 429 |
+
type='Normalize',
|
| 430 |
+
mean=[123.675, 116.28, 103.53],
|
| 431 |
+
std=[58.395, 57.12, 57.375],
|
| 432 |
+
to_rgb=True),
|
| 433 |
+
dict(type='Pad', size_divisor=32),
|
| 434 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 435 |
+
dict(type='Collect', keys=['img'])
|
| 436 |
+
])
|
| 437 |
+
]))
|
| 438 |
+
evaluation = dict(metric=['bbox', 'segm'], gpu_collect=True)
|
| 439 |
+
optimizer = dict(
|
| 440 |
+
type='AdamW',
|
| 441 |
+
lr=0.0001,
|
| 442 |
+
betas=(0.9, 0.999),
|
| 443 |
+
weight_decay=0.05,
|
| 444 |
+
paramwise_cfg=dict(
|
| 445 |
+
custom_keys=dict(
|
| 446 |
+
absolute_pos_embed=dict(decay_mult=0.0),
|
| 447 |
+
relative_position_bias_table=dict(decay_mult=0.0),
|
| 448 |
+
norm=dict(decay_mult=0.0))))
|
| 449 |
+
optimizer_config = dict(
|
| 450 |
+
grad_clip=None,
|
| 451 |
+
type='DistOptimizerHook',
|
| 452 |
+
update_interval=1,
|
| 453 |
+
coalesce=True,
|
| 454 |
+
bucket_size_mb=-1,
|
| 455 |
+
use_fp16=True)
|
| 456 |
+
lr_config = dict(
|
| 457 |
+
policy='step',
|
| 458 |
+
warmup='linear',
|
| 459 |
+
warmup_iters=500,
|
| 460 |
+
warmup_ratio=0.001,
|
| 461 |
+
step=[27, 33])
|
| 462 |
+
runner = dict(type='EpochBasedRunnerAmp', max_epochs=36)
|
| 463 |
+
checkpoint_config = dict(interval=1)
|
| 464 |
+
log_config = dict(interval=50, hooks=[dict(type='TextLoggerHook')])
|
| 465 |
+
custom_hooks = [dict(type='NumClassCheckHook')]
|
| 466 |
+
dist_params = dict(backend='nccl')
|
| 467 |
+
log_level = 'INFO'
|
| 468 |
+
load_from = '/root/autodl-tmp/caihaojie/mona/Swin-Transformer-Object-Detection/pretrained_model/swin_base_mona_llama_moe_8.pth'
|
| 469 |
+
resume_from = None
|
| 470 |
+
workflow = [('train', 1)]
|
| 471 |
+
fp16 = None
|
| 472 |
+
work_dir = './results/train/mona_llama_moe_5_8_1e-4/'
|
| 473 |
+
gpu_ids = range(0, 8)
|
| 474 |
+
|
| 475 |
+
2025-07-02 12:56:15,818 - mmdet - INFO - load checkpoint from local path: /root/autodl-tmp/caihaojie/mona/Swin-Transformer-Object-Detection/pretrained_model/swin_base_mona_llama_moe_8.pth
|
| 476 |
+
2025-07-02 12:56:16,553 - mmdet - WARNING - The model and loaded state dict do not match exactly
|
| 477 |
+
|
| 478 |
+
missing keys in source state_dict: backbone.layers.0.blocks.0.mlp.fc1.gate.gate_network.0.weight, backbone.layers.0.blocks.0.mlp.fc1.gate.gate_network.2.weight, backbone.layers.0.blocks.0.mlp.fc1.gate.weight_noise.weight, backbone.layers.0.blocks.1.mlp.fc1.gate.gate_network.0.weight, backbone.layers.0.blocks.1.mlp.fc1.gate.gate_network.2.weight, backbone.layers.0.blocks.1.mlp.fc1.gate.weight_noise.weight, backbone.layers.1.blocks.0.mlp.fc1.gate.gate_network.0.weight, backbone.layers.1.blocks.0.mlp.fc1.gate.gate_network.2.weight, backbone.layers.1.blocks.0.mlp.fc1.gate.weight_noise.weight, backbone.layers.1.blocks.1.mlp.fc1.gate.gate_network.0.weight, backbone.layers.1.blocks.1.mlp.fc1.gate.gate_network.2.weight, backbone.layers.1.blocks.1.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.0.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.0.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.0.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.1.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.1.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.1.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.2.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.2.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.2.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.3.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.3.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.3.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.4.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.4.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.4.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.5.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.5.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.5.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.6.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.6.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.6.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.7.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.7.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.7.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.8.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.8.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.8.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.9.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.9.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.9.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.10.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.10.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.10.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.11.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.11.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.11.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.12.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.12.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.12.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.13.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.13.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.13.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.14.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.14.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.14.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.15.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.15.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.15.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.16.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.16.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.16.mlp.fc1.gate.weight_noise.weight, backbone.layers.2.blocks.17.mlp.fc1.gate.gate_network.0.weight, backbone.layers.2.blocks.17.mlp.fc1.gate.gate_network.2.weight, backbone.layers.2.blocks.17.mlp.fc1.gate.weight_noise.weight, backbone.layers.3.blocks.0.mlp.fc1.gate.gate_network.0.weight, backbone.layers.3.blocks.0.mlp.fc1.gate.gate_network.2.weight, backbone.layers.3.blocks.0.mlp.fc1.gate.weight_noise.weight, backbone.layers.3.blocks.1.mlp.fc1.gate.gate_network.0.weight, backbone.layers.3.blocks.1.mlp.fc1.gate.gate_network.2.weight, backbone.layers.3.blocks.1.mlp.fc1.gate.weight_noise.weight
|
| 479 |
+
|
| 480 |
+
2025-07-02 12:56:16,596 - mmdet - INFO - Start running, host: root@autodl-container-313040b114-67ed2cfc, work_dir: /root/autodl-tmp/caihaojie/mona/Swin-Transformer-Object-Detection/results/train/mona_llama_moe_5_8_1e-4
|
| 481 |
+
2025-07-02 12:56:16,597 - mmdet - INFO - Hooks will be executed in the following order:
|
| 482 |
+
before_run:
|
| 483 |
+
(VERY_HIGH ) StepLrUpdaterHook
|
| 484 |
+
(ABOVE_NORMAL) DistOptimizerHook
|
| 485 |
+
(NORMAL ) CheckpointHook
|
| 486 |
+
(NORMAL ) DistEvalHook
|
| 487 |
+
(VERY_LOW ) TextLoggerHook
|
| 488 |
+
--------------------
|
| 489 |
+
before_train_epoch:
|
| 490 |
+
(VERY_HIGH ) StepLrUpdaterHook
|
| 491 |
+
(NORMAL ) DistSamplerSeedHook
|
| 492 |
+
(NORMAL ) DistEvalHook
|
| 493 |
+
(NORMAL ) NumClassCheckHook
|
| 494 |
+
(LOW ) IterTimerHook
|
| 495 |
+
(VERY_LOW ) TextLoggerHook
|
| 496 |
+
--------------------
|
| 497 |
+
before_train_iter:
|
| 498 |
+
(VERY_HIGH ) StepLrUpdaterHook
|
| 499 |
+
(LOW ) IterTimerHook
|
| 500 |
+
--------------------
|
| 501 |
+
after_train_iter:
|
| 502 |
+
(ABOVE_NORMAL) DistOptimizerHook
|
| 503 |
+
(NORMAL ) CheckpointHook
|
| 504 |
+
(NORMAL ) DistEvalHook
|
| 505 |
+
(LOW ) IterTimerHook
|
| 506 |
+
(VERY_LOW ) TextLoggerHook
|
| 507 |
+
--------------------
|
| 508 |
+
after_train_epoch:
|
| 509 |
+
(NORMAL ) CheckpointHook
|
| 510 |
+
(NORMAL ) DistEvalHook
|
| 511 |
+
(VERY_LOW ) TextLoggerHook
|
| 512 |
+
--------------------
|
| 513 |
+
before_val_epoch:
|
| 514 |
+
(NORMAL ) DistSamplerSeedHook
|
| 515 |
+
(NORMAL ) NumClassCheckHook
|
| 516 |
+
(LOW ) IterTimerHook
|
| 517 |
+
(VERY_LOW ) TextLoggerHook
|
| 518 |
+
--------------------
|
| 519 |
+
before_val_iter:
|
| 520 |
+
(LOW ) IterTimerHook
|
| 521 |
+
--------------------
|
| 522 |
+
after_val_iter:
|
| 523 |
+
(LOW ) IterTimerHook
|
| 524 |
+
--------------------
|
| 525 |
+
after_val_epoch:
|
| 526 |
+
(VERY_LOW ) TextLoggerHook
|
| 527 |
+
--------------------
|
| 528 |
+
after_run:
|
| 529 |
+
(VERY_LOW ) TextLoggerHook
|
| 530 |
+
--------------------
|
| 531 |
+
2025-07-02 12:56:16,597 - mmdet - INFO - workflow: [('train', 1)], max: 36 epochs
|
| 532 |
+
2025-07-02 12:56:16,598 - mmdet - INFO - Checkpoints will be saved to /root/autodl-tmp/caihaojie/mona/Swin-Transformer-Object-Detection/results/train/mona_llama_moe_5_8_1e-4 by HardDiskBackend.
|
| 533 |
+
2025-07-02 12:58:28,211 - mmdet - INFO - Epoch [1][50/7330] lr: 9.890e-06, eta: 8 days, 0:53:05, time: 2.632, data_time: 1.579, memory: 21698, balance_loss: 0.0045, loss_rpn_cls: 0.0864, loss_rpn_bbox: 0.0372, s0.loss_cls: 0.3122, s0.acc: 92.0986, s0.loss_bbox: 0.2536, s0.loss_mask: 0.3424, s1.loss_cls: 0.1452, s1.acc: 92.4118, s1.loss_bbox: 0.1034, s1.loss_mask: 0.1652, s2.loss_cls: 0.0654, s2.acc: 93.0664, s2.loss_bbox: 0.0358, s2.loss_mask: 0.0756, loss: 1.6268
|
| 534 |
+
2025-07-02 12:59:18,589 - mmdet - INFO - Epoch [1][100/7330] lr: 1.988e-05, eta: 5 days, 13:19:34, time: 1.007, data_time: 0.028, memory: 21698, balance_loss: 0.0032, loss_rpn_cls: 0.0637, loss_rpn_bbox: 0.0314, s0.loss_cls: 0.2797, s0.acc: 92.3184, s0.loss_bbox: 0.2496, s0.loss_mask: 0.3049, s1.loss_cls: 0.1309, s1.acc: 92.6028, s1.loss_bbox: 0.1045, s1.loss_mask: 0.1463, s2.loss_cls: 0.0598, s2.acc: 93.0062, s2.loss_bbox: 0.0369, s2.loss_mask: 0.0676, loss: 1.4786
|
| 535 |
+
2025-07-02 13:00:09,020 - mmdet - INFO - Epoch [1][150/7330] lr: 2.987e-05, eta: 4 days, 17:29:24, time: 1.008, data_time: 0.028, memory: 21698, balance_loss: 0.0023, loss_rpn_cls: 0.0615, loss_rpn_bbox: 0.0317, s0.loss_cls: 0.2742, s0.acc: 92.1995, s0.loss_bbox: 0.2583, s0.loss_mask: 0.3022, s1.loss_cls: 0.1269, s1.acc: 92.4707, s1.loss_bbox: 0.1087, s1.loss_mask: 0.1458, s2.loss_cls: 0.0574, s2.acc: 93.0941, s2.loss_bbox: 0.0389, s2.loss_mask: 0.0673, loss: 1.4752
|
| 536 |
+
2025-07-02 13:01:00,137 - mmdet - INFO - Epoch [1][200/7330] lr: 3.986e-05, eta: 4 days, 7:49:38, time: 1.023, data_time: 0.027, memory: 21698, balance_loss: 0.0018, loss_rpn_cls: 0.0607, loss_rpn_bbox: 0.0313, s0.loss_cls: 0.2629, s0.acc: 92.2280, s0.loss_bbox: 0.2663, s0.loss_mask: 0.2874, s1.loss_cls: 0.1221, s1.acc: 92.5153, s1.loss_bbox: 0.1121, s1.loss_mask: 0.1375, s2.loss_cls: 0.0565, s2.acc: 92.9050, s2.loss_bbox: 0.0403, s2.loss_mask: 0.0631, loss: 1.4422
|
| 537 |
+
2025-07-02 13:02:05,371 - mmdet - INFO - Epoch [1][250/7330] lr: 4.985e-05, eta: 4 days, 6:09:18, time: 1.305, data_time: 0.026, memory: 21698, balance_loss: 0.0013, loss_rpn_cls: 0.0565, loss_rpn_bbox: 0.0328, s0.loss_cls: 0.2491, s0.acc: 92.4004, s0.loss_bbox: 0.2666, s0.loss_mask: 0.2798, s1.loss_cls: 0.1169, s1.acc: 92.7210, s1.loss_bbox: 0.1152, s1.loss_mask: 0.1342, s2.loss_cls: 0.0545, s2.acc: 92.9300, s2.loss_bbox: 0.0422, s2.loss_mask: 0.0614, loss: 1.4104
|
| 538 |
+
2025-07-02 13:02:55,969 - mmdet - INFO - Epoch [1][300/7330] lr: 5.984e-05, eta: 4 days, 1:27:44, time: 1.012, data_time: 0.029, memory: 21698, balance_loss: 0.0012, loss_rpn_cls: 0.0493, loss_rpn_bbox: 0.0279, s0.loss_cls: 0.2301, s0.acc: 92.8999, s0.loss_bbox: 0.2541, s0.loss_mask: 0.2780, s1.loss_cls: 0.1065, s1.acc: 93.1795, s1.loss_bbox: 0.1104, s1.loss_mask: 0.1358, s2.loss_cls: 0.0491, s2.acc: 93.5397, s2.loss_bbox: 0.0411, s2.loss_mask: 0.0632, loss: 1.3465
|
| 539 |
+
2025-07-02 13:03:45,895 - mmdet - INFO - Epoch [1][350/7330] lr: 6.983e-05, eta: 3 days, 21:57:48, time: 0.998, data_time: 0.027, memory: 21698, balance_loss: 0.0011, loss_rpn_cls: 0.0454, loss_rpn_bbox: 0.0275, s0.loss_cls: 0.2259, s0.acc: 93.0745, s0.loss_bbox: 0.2451, s0.loss_mask: 0.2695, s1.loss_cls: 0.1055, s1.acc: 93.3403, s1.loss_bbox: 0.1071, s1.loss_mask: 0.1297, s2.loss_cls: 0.0492, s2.acc: 93.6529, s2.loss_bbox: 0.0401, s2.loss_mask: 0.0601, loss: 1.3061
|
| 540 |
+
2025-07-02 13:04:36,124 - mmdet - INFO - Epoch [1][400/7330] lr: 7.982e-05, eta: 3 days, 19:23:36, time: 1.005, data_time: 0.024, memory: 21698, balance_loss: 0.0010, loss_rpn_cls: 0.0501, loss_rpn_bbox: 0.0299, s0.loss_cls: 0.2317, s0.acc: 92.9746, s0.loss_bbox: 0.2547, s0.loss_mask: 0.2729, s1.loss_cls: 0.1077, s1.acc: 93.2900, s1.loss_bbox: 0.1119, s1.loss_mask: 0.1327, s2.loss_cls: 0.0500, s2.acc: 93.5254, s2.loss_bbox: 0.0416, s2.loss_mask: 0.0620, loss: 1.3462
|
| 541 |
+
2025-07-02 13:05:26,576 - mmdet - INFO - Epoch [1][450/7330] lr: 8.981e-05, eta: 3 days, 17:25:40, time: 1.009, data_time: 0.024, memory: 21698, balance_loss: 0.0009, loss_rpn_cls: 0.0500, loss_rpn_bbox: 0.0277, s0.loss_cls: 0.2199, s0.acc: 93.1548, s0.loss_bbox: 0.2452, s0.loss_mask: 0.2692, s1.loss_cls: 0.1001, s1.acc: 93.4811, s1.loss_bbox: 0.1062, s1.loss_mask: 0.1311, s2.loss_cls: 0.0468, s2.acc: 93.7126, s2.loss_bbox: 0.0400, s2.loss_mask: 0.0609, loss: 1.2979
|
| 542 |
+
2025-07-02 13:06:16,765 - mmdet - INFO - Epoch [1][500/7330] lr: 9.980e-05, eta: 3 days, 15:48:44, time: 1.004, data_time: 0.020, memory: 21698, balance_loss: 0.0009, loss_rpn_cls: 0.0492, loss_rpn_bbox: 0.0283, s0.loss_cls: 0.2262, s0.acc: 92.9531, s0.loss_bbox: 0.2563, s0.loss_mask: 0.2706, s1.loss_cls: 0.1065, s1.acc: 93.2320, s1.loss_bbox: 0.1103, s1.loss_mask: 0.1321, s2.loss_cls: 0.0495, s2.acc: 93.4644, s2.loss_bbox: 0.0408, s2.loss_mask: 0.0611, loss: 1.3319
|
| 543 |
+
2025-07-02 13:07:06,983 - mmdet - INFO - Epoch [1][550/7330] lr: 1.000e-04, eta: 3 days, 14:29:32, time: 1.004, data_time: 0.022, memory: 21698, balance_loss: 0.0009, loss_rpn_cls: 0.0490, loss_rpn_bbox: 0.0280, s0.loss_cls: 0.2123, s0.acc: 93.3240, s0.loss_bbox: 0.2458, s0.loss_mask: 0.2651, s1.loss_cls: 0.0971, s1.acc: 93.7061, s1.loss_bbox: 0.1061, s1.loss_mask: 0.1288, s2.loss_cls: 0.0459, s2.acc: 93.7669, s2.loss_bbox: 0.0397, s2.loss_mask: 0.0593, loss: 1.2781
|
| 544 |
+
2025-07-02 13:07:57,390 - mmdet - INFO - Epoch [1][600/7330] lr: 1.000e-04, eta: 3 days, 13:24:49, time: 1.008, data_time: 0.024, memory: 21698, balance_loss: 0.0008, loss_rpn_cls: 0.0430, loss_rpn_bbox: 0.0279, s0.loss_cls: 0.2200, s0.acc: 93.1748, s0.loss_bbox: 0.2499, s0.loss_mask: 0.2591, s1.loss_cls: 0.1018, s1.acc: 93.5413, s1.loss_bbox: 0.1083, s1.loss_mask: 0.1255, s2.loss_cls: 0.0472, s2.acc: 93.8184, s2.loss_bbox: 0.0407, s2.loss_mask: 0.0585, loss: 1.2827
|
| 545 |
+
2025-07-02 13:08:58,725 - mmdet - INFO - Epoch [1][650/7330] lr: 1.000e-04, eta: 3 days, 13:43:40, time: 1.227, data_time: 0.026, memory: 21698, balance_loss: 0.0007, loss_rpn_cls: 0.0465, loss_rpn_bbox: 0.0293, s0.loss_cls: 0.2178, s0.acc: 92.9668, s0.loss_bbox: 0.2541, s0.loss_mask: 0.2596, s1.loss_cls: 0.1007, s1.acc: 93.2953, s1.loss_bbox: 0.1109, s1.loss_mask: 0.1271, s2.loss_cls: 0.0478, s2.acc: 93.5762, s2.loss_bbox: 0.0415, s2.loss_mask: 0.0594, loss: 1.2954
|
| 546 |
+
2025-07-02 13:09:48,853 - mmdet - INFO - Epoch [1][700/7330] lr: 1.000e-04, eta: 3 days, 12:49:30, time: 1.003, data_time: 0.024, memory: 21698, balance_loss: 0.0007, loss_rpn_cls: 0.0457, loss_rpn_bbox: 0.0304, s0.loss_cls: 0.2175, s0.acc: 92.9810, s0.loss_bbox: 0.2602, s0.loss_mask: 0.2650, s1.loss_cls: 0.1004, s1.acc: 93.2071, s1.loss_bbox: 0.1120, s1.loss_mask: 0.1288, s2.loss_cls: 0.0471, s2.acc: 93.5041, s2.loss_bbox: 0.0418, s2.loss_mask: 0.0598, loss: 1.3094
|
| 547 |
+
2025-07-02 13:10:38,321 - mmdet - INFO - Epoch [1][750/7330] lr: 1.000e-04, eta: 3 days, 11:58:32, time: 0.989, data_time: 0.024, memory: 21698, balance_loss: 0.0007, loss_rpn_cls: 0.0440, loss_rpn_bbox: 0.0279, s0.loss_cls: 0.2056, s0.acc: 93.3123, s0.loss_bbox: 0.2478, s0.loss_mask: 0.2571, s1.loss_cls: 0.0954, s1.acc: 93.6533, s1.loss_bbox: 0.1071, s1.loss_mask: 0.1251, s2.loss_cls: 0.0450, s2.acc: 93.9220, s2.loss_bbox: 0.0406, s2.loss_mask: 0.0585, loss: 1.2547
|
| 548 |
+
2025-07-02 13:11:27,817 - mmdet - INFO - Epoch [1][800/7330] lr: 1.000e-04, eta: 3 days, 11:14:00, time: 0.990, data_time: 0.031, memory: 21698, balance_loss: 0.0006, loss_rpn_cls: 0.0459, loss_rpn_bbox: 0.0281, s0.loss_cls: 0.2057, s0.acc: 93.3857, s0.loss_bbox: 0.2466, s0.loss_mask: 0.2578, s1.loss_cls: 0.0949, s1.acc: 93.6739, s1.loss_bbox: 0.1080, s1.loss_mask: 0.1249, s2.loss_cls: 0.0446, s2.acc: 93.8285, s2.loss_bbox: 0.0406, s2.loss_mask: 0.0580, loss: 1.2556
|
| 549 |
+
2025-07-02 13:12:17,743 - mmdet - INFO - Epoch [1][850/7330] lr: 1.000e-04, eta: 3 days, 10:36:52, time: 0.999, data_time: 0.028, memory: 21698, balance_loss: 0.0006, loss_rpn_cls: 0.0399, loss_rpn_bbox: 0.0275, s0.loss_cls: 0.2002, s0.acc: 93.4236, s0.loss_bbox: 0.2464, s0.loss_mask: 0.2637, s1.loss_cls: 0.0928, s1.acc: 93.6654, s1.loss_bbox: 0.1084, s1.loss_mask: 0.1289, s2.loss_cls: 0.0438, s2.acc: 93.8355, s2.loss_bbox: 0.0414, s2.loss_mask: 0.0603, loss: 1.2537
|
| 550 |
+
2025-07-02 13:13:07,219 - mmdet - INFO - Epoch [1][900/7330] lr: 1.000e-04, eta: 3 days, 10:01:31, time: 0.989, data_time: 0.027, memory: 21698, balance_loss: 0.0006, loss_rpn_cls: 0.0419, loss_rpn_bbox: 0.0280, s0.loss_cls: 0.2099, s0.acc: 93.2744, s0.loss_bbox: 0.2577, s0.loss_mask: 0.2628, s1.loss_cls: 0.0981, s1.acc: 93.5209, s1.loss_bbox: 0.1134, s1.loss_mask: 0.1287, s2.loss_cls: 0.0464, s2.acc: 93.7224, s2.loss_bbox: 0.0424, s2.loss_mask: 0.0600, loss: 1.2899
|
| 551 |
+
2025-07-02 13:13:57,236 - mmdet - INFO - Epoch [1][950/7330] lr: 1.000e-04, eta: 3 days, 9:32:19, time: 1.000, data_time: 0.022, memory: 21698, balance_loss: 0.0006, loss_rpn_cls: 0.0440, loss_rpn_bbox: 0.0282, s0.loss_cls: 0.2003, s0.acc: 93.5461, s0.loss_bbox: 0.2460, s0.loss_mask: 0.2547, s1.loss_cls: 0.0916, s1.acc: 93.8538, s1.loss_bbox: 0.1074, s1.loss_mask: 0.1252, s2.loss_cls: 0.0429, s2.acc: 94.2533, s2.loss_bbox: 0.0404, s2.loss_mask: 0.0581, loss: 1.2393
|
| 552 |
+
2025-07-02 13:14:47,013 - mmdet - INFO - Exp name: cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona_llama_moe.py
|
| 553 |
+
2025-07-02 13:14:47,013 - mmdet - INFO - Epoch [1][1000/7330] lr: 1.000e-04, eta: 3 days, 9:04:46, time: 0.995, data_time: 0.022, memory: 21698, balance_loss: 0.0005, loss_rpn_cls: 0.0433, loss_rpn_bbox: 0.0282, s0.loss_cls: 0.2069, s0.acc: 93.2595, s0.loss_bbox: 0.2508, s0.loss_mask: 0.2551, s1.loss_cls: 0.0952, s1.acc: 93.5391, s1.loss_bbox: 0.1081, s1.loss_mask: 0.1243, s2.loss_cls: 0.0452, s2.acc: 93.6667, s2.loss_bbox: 0.0406, s2.loss_mask: 0.0577, loss: 1.2559
|
| 554 |
+
2025-07-02 13:15:56,799 - mmdet - INFO - Epoch [1][1050/7330] lr: 1.000e-04, eta: 3 days, 10:03:31, time: 1.396, data_time: 0.024, memory: 21698, balance_loss: 0.0005, loss_rpn_cls: 0.0416, loss_rpn_bbox: 0.0281, s0.loss_cls: 0.1938, s0.acc: 93.6470, s0.loss_bbox: 0.2426, s0.loss_mask: 0.2518, s1.loss_cls: 0.0887, s1.acc: 93.9740, s1.loss_bbox: 0.1067, s1.loss_mask: 0.1234, s2.loss_cls: 0.0418, s2.acc: 94.2758, s2.loss_bbox: 0.0401, s2.loss_mask: 0.0575, loss: 1.2167
|
| 555 |
+
2025-07-02 13:16:44,870 - mmdet - INFO - Epoch [1][1100/7330] lr: 1.000e-04, eta: 3 days, 9:30:13, time: 0.961, data_time: 0.023, memory: 21698, balance_loss: 0.0005, loss_rpn_cls: 0.0392, loss_rpn_bbox: 0.0250, s0.loss_cls: 0.1934, s0.acc: 93.6704, s0.loss_bbox: 0.2384, s0.loss_mask: 0.2551, s1.loss_cls: 0.0900, s1.acc: 93.9307, s1.loss_bbox: 0.1048, s1.loss_mask: 0.1252, s2.loss_cls: 0.0430, s2.acc: 93.9533, s2.loss_bbox: 0.0400, s2.loss_mask: 0.0580, loss: 1.2126
|
| 556 |
+
2025-07-02 13:17:33,680 - mmdet - INFO - Epoch [1][1150/7330] lr: 1.000e-04, eta: 3 days, 9:02:33, time: 0.976, data_time: 0.025, memory: 21698, balance_loss: 0.0005, loss_rpn_cls: 0.0386, loss_rpn_bbox: 0.0276, s0.loss_cls: 0.2014, s0.acc: 93.4297, s0.loss_bbox: 0.2549, s0.loss_mask: 0.2591, s1.loss_cls: 0.0934, s1.acc: 93.6268, s1.loss_bbox: 0.1132, s1.loss_mask: 0.1277, s2.loss_cls: 0.0443, s2.acc: 93.6808, s2.loss_bbox: 0.0428, s2.loss_mask: 0.0593, loss: 1.2629
|
| 557 |
+
2025-07-02 13:18:22,632 - mmdet - INFO - Epoch [1][1200/7330] lr: 1.000e-04, eta: 3 days, 8:37:38, time: 0.979, data_time: 0.025, memory: 21698, balance_loss: 0.0005, loss_rpn_cls: 0.0415, loss_rpn_bbox: 0.0294, s0.loss_cls: 0.2003, s0.acc: 93.3601, s0.loss_bbox: 0.2513, s0.loss_mask: 0.2580, s1.loss_cls: 0.0944, s1.acc: 93.6558, s1.loss_bbox: 0.1106, s1.loss_mask: 0.1260, s2.loss_cls: 0.0446, s2.acc: 93.7693, s2.loss_bbox: 0.0420, s2.loss_mask: 0.0587, loss: 1.2572
|
| 558 |
+
2025-07-02 13:19:10,593 - mmdet - INFO - Epoch [1][1250/7330] lr: 1.000e-04, eta: 3 days, 8:11:09, time: 0.959, data_time: 0.025, memory: 21698, balance_loss: 0.0005, loss_rpn_cls: 0.0386, loss_rpn_bbox: 0.0248, s0.loss_cls: 0.1936, s0.acc: 93.6946, s0.loss_bbox: 0.2370, s0.loss_mask: 0.2525, s1.loss_cls: 0.0893, s1.acc: 93.9175, s1.loss_bbox: 0.1055, s1.loss_mask: 0.1233, s2.loss_cls: 0.0428, s2.acc: 94.0574, s2.loss_bbox: 0.0398, s2.loss_mask: 0.0577, loss: 1.2051
|
| 559 |
+
2025-07-02 13:19:59,326 - mmdet - INFO - Epoch [1][1300/7330] lr: 1.000e-04, eta: 3 days, 7:49:18, time: 0.975, data_time: 0.024, memory: 21698, balance_loss: 0.0005, loss_rpn_cls: 0.0396, loss_rpn_bbox: 0.0268, s0.loss_cls: 0.1953, s0.acc: 93.6196, s0.loss_bbox: 0.2401, s0.loss_mask: 0.2518, s1.loss_cls: 0.0925, s1.acc: 93.7325, s1.loss_bbox: 0.1074, s1.loss_mask: 0.1239, s2.loss_cls: 0.0440, s2.acc: 93.8915, s2.loss_bbox: 0.0405, s2.loss_mask: 0.0577, loss: 1.2199
|
| 560 |
+
2025-07-02 13:20:48,539 - mmdet - INFO - Epoch [1][1350/7330] lr: 1.000e-04, eta: 3 days, 7:30:33, time: 0.984, data_time: 0.026, memory: 21698, balance_loss: 0.0005, loss_rpn_cls: 0.0412, loss_rpn_bbox: 0.0278, s0.loss_cls: 0.1981, s0.acc: 93.4673, s0.loss_bbox: 0.2485, s0.loss_mask: 0.2504, s1.loss_cls: 0.0920, s1.acc: 93.7890, s1.loss_bbox: 0.1105, s1.loss_mask: 0.1239, s2.loss_cls: 0.0436, s2.acc: 93.9530, s2.loss_bbox: 0.0422, s2.loss_mask: 0.0576, loss: 1.2362
|
| 561 |
+
2025-07-02 13:21:36,394 - mmdet - INFO - Epoch [1][1400/7330] lr: 1.000e-04, eta: 3 days, 7:08:51, time: 0.957, data_time: 0.020, memory: 21698, balance_loss: 0.0005, loss_rpn_cls: 0.0399, loss_rpn_bbox: 0.0251, s0.loss_cls: 0.1843, s0.acc: 94.0496, s0.loss_bbox: 0.2276, s0.loss_mask: 0.2435, s1.loss_cls: 0.0848, s1.acc: 94.2850, s1.loss_bbox: 0.1019, s1.loss_mask: 0.1194, s2.loss_cls: 0.0405, s2.acc: 94.3298, s2.loss_bbox: 0.0396, s2.loss_mask: 0.0560, loss: 1.1633
|
| 562 |
+
2025-07-02 13:22:32,901 - mmdet - INFO - Epoch [1][1450/7330] lr: 1.000e-04, eta: 3 days, 7:14:35, time: 1.130, data_time: 0.023, memory: 21698, balance_loss: 0.0005, loss_rpn_cls: 0.0403, loss_rpn_bbox: 0.0271, s0.loss_cls: 0.1933, s0.acc: 93.6177, s0.loss_bbox: 0.2457, s0.loss_mask: 0.2498, s1.loss_cls: 0.0887, s1.acc: 93.9880, s1.loss_bbox: 0.1084, s1.loss_mask: 0.1226, s2.loss_cls: 0.0421, s2.acc: 94.1195, s2.loss_bbox: 0.0415, s2.loss_mask: 0.0574, loss: 1.2174
|
| 563 |
+
2025-07-02 13:23:29,117 - mmdet - INFO - Epoch [1][1500/7330] lr: 1.000e-04, eta: 3 days, 7:19:10, time: 1.125, data_time: 0.026, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0411, loss_rpn_bbox: 0.0284, s0.loss_cls: 0.1935, s0.acc: 93.5239, s0.loss_bbox: 0.2469, s0.loss_mask: 0.2539, s1.loss_cls: 0.0898, s1.acc: 93.9006, s1.loss_bbox: 0.1092, s1.loss_mask: 0.1250, s2.loss_cls: 0.0429, s2.acc: 93.9969, s2.loss_bbox: 0.0411, s2.loss_mask: 0.0588, loss: 1.2310
|
| 564 |
+
2025-07-02 13:24:17,805 - mmdet - INFO - Epoch [1][1550/7330] lr: 1.000e-04, eta: 3 days, 7:02:07, time: 0.974, data_time: 0.029, memory: 21698, balance_loss: 0.0005, loss_rpn_cls: 0.0383, loss_rpn_bbox: 0.0265, s0.loss_cls: 0.1890, s0.acc: 93.5908, s0.loss_bbox: 0.2468, s0.loss_mask: 0.2506, s1.loss_cls: 0.0879, s1.acc: 93.8166, s1.loss_bbox: 0.1083, s1.loss_mask: 0.1220, s2.loss_cls: 0.0422, s2.acc: 93.9235, s2.loss_bbox: 0.0416, s2.loss_mask: 0.0572, loss: 1.2108
|
| 565 |
+
2025-07-02 13:25:05,795 - mmdet - INFO - Epoch [1][1600/7330] lr: 1.000e-04, eta: 3 days, 6:44:09, time: 0.960, data_time: 0.023, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0392, loss_rpn_bbox: 0.0276, s0.loss_cls: 0.1917, s0.acc: 93.5811, s0.loss_bbox: 0.2463, s0.loss_mask: 0.2533, s1.loss_cls: 0.0902, s1.acc: 93.7888, s1.loss_bbox: 0.1091, s1.loss_mask: 0.1244, s2.loss_cls: 0.0434, s2.acc: 93.8748, s2.loss_bbox: 0.0416, s2.loss_mask: 0.0584, loss: 1.2256
|
| 566 |
+
2025-07-02 13:25:54,656 - mmdet - INFO - Epoch [1][1650/7330] lr: 1.000e-04, eta: 3 days, 6:29:32, time: 0.977, data_time: 0.029, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0387, loss_rpn_bbox: 0.0269, s0.loss_cls: 0.1861, s0.acc: 93.8123, s0.loss_bbox: 0.2349, s0.loss_mask: 0.2469, s1.loss_cls: 0.0864, s1.acc: 94.1004, s1.loss_bbox: 0.1043, s1.loss_mask: 0.1205, s2.loss_cls: 0.0414, s2.acc: 94.1816, s2.loss_bbox: 0.0405, s2.loss_mask: 0.0566, loss: 1.1835
|
| 567 |
+
2025-07-02 13:26:43,327 - mmdet - INFO - Epoch [1][1700/7330] lr: 1.000e-04, eta: 3 days, 6:15:15, time: 0.973, data_time: 0.022, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0409, loss_rpn_bbox: 0.0269, s0.loss_cls: 0.1943, s0.acc: 93.5156, s0.loss_bbox: 0.2454, s0.loss_mask: 0.2489, s1.loss_cls: 0.0895, s1.acc: 93.8823, s1.loss_bbox: 0.1081, s1.loss_mask: 0.1221, s2.loss_cls: 0.0428, s2.acc: 93.9270, s2.loss_bbox: 0.0411, s2.loss_mask: 0.0570, loss: 1.2175
|
| 568 |
+
2025-07-02 13:27:32,133 - mmdet - INFO - Epoch [1][1750/7330] lr: 1.000e-04, eta: 3 days, 6:02:01, time: 0.976, data_time: 0.025, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0420, loss_rpn_bbox: 0.0272, s0.loss_cls: 0.2012, s0.acc: 93.4895, s0.loss_bbox: 0.2459, s0.loss_mask: 0.2510, s1.loss_cls: 0.0920, s1.acc: 93.7919, s1.loss_bbox: 0.1094, s1.loss_mask: 0.1227, s2.loss_cls: 0.0440, s2.acc: 93.9080, s2.loss_bbox: 0.0420, s2.loss_mask: 0.0571, loss: 1.2351
|
| 569 |
+
2025-07-02 13:28:20,876 - mmdet - INFO - Epoch [1][1800/7330] lr: 1.000e-04, eta: 3 days, 5:49:27, time: 0.975, data_time: 0.024, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0408, loss_rpn_bbox: 0.0290, s0.loss_cls: 0.2022, s0.acc: 93.5105, s0.loss_bbox: 0.2474, s0.loss_mask: 0.2519, s1.loss_cls: 0.0933, s1.acc: 93.8210, s1.loss_bbox: 0.1086, s1.loss_mask: 0.1231, s2.loss_cls: 0.0441, s2.acc: 93.9340, s2.loss_bbox: 0.0411, s2.loss_mask: 0.0573, loss: 1.2393
|
| 570 |
+
2025-07-02 13:29:09,933 - mmdet - INFO - Epoch [1][1850/7330] lr: 1.000e-04, eta: 3 days, 5:38:11, time: 0.981, data_time: 0.033, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0397, loss_rpn_bbox: 0.0273, s0.loss_cls: 0.2016, s0.acc: 93.2983, s0.loss_bbox: 0.2488, s0.loss_mask: 0.2486, s1.loss_cls: 0.0946, s1.acc: 93.4929, s1.loss_bbox: 0.1102, s1.loss_mask: 0.1219, s2.loss_cls: 0.0447, s2.acc: 93.6339, s2.loss_bbox: 0.0423, s2.loss_mask: 0.0570, loss: 1.2371
|
| 571 |
+
2025-07-02 13:30:18,445 - mmdet - INFO - Epoch [1][1900/7330] lr: 1.000e-04, eta: 3 days, 6:12:10, time: 1.370, data_time: 0.024, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0392, loss_rpn_bbox: 0.0275, s0.loss_cls: 0.1856, s0.acc: 93.8496, s0.loss_bbox: 0.2352, s0.loss_mask: 0.2528, s1.loss_cls: 0.0871, s1.acc: 94.1435, s1.loss_bbox: 0.1049, s1.loss_mask: 0.1240, s2.loss_cls: 0.0415, s2.acc: 94.2827, s2.loss_bbox: 0.0402, s2.loss_mask: 0.0582, loss: 1.1965
|
| 572 |
+
2025-07-02 13:31:07,179 - mmdet - INFO - Epoch [1][1950/7330] lr: 1.000e-04, eta: 3 days, 6:00:05, time: 0.975, data_time: 0.024, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0367, loss_rpn_bbox: 0.0277, s0.loss_cls: 0.1838, s0.acc: 93.8313, s0.loss_bbox: 0.2362, s0.loss_mask: 0.2407, s1.loss_cls: 0.0854, s1.acc: 94.1545, s1.loss_bbox: 0.1056, s1.loss_mask: 0.1187, s2.loss_cls: 0.0413, s2.acc: 94.1325, s2.loss_bbox: 0.0411, s2.loss_mask: 0.0558, loss: 1.1732
|
| 573 |
+
2025-07-02 13:31:56,148 - mmdet - INFO - Exp name: cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona_llama_moe.py
|
| 574 |
+
2025-07-02 13:31:56,148 - mmdet - INFO - Epoch [1][2000/7330] lr: 1.000e-04, eta: 3 days, 5:49:04, time: 0.979, data_time: 0.028, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0378, loss_rpn_bbox: 0.0264, s0.loss_cls: 0.1935, s0.acc: 93.6133, s0.loss_bbox: 0.2395, s0.loss_mask: 0.2474, s1.loss_cls: 0.0897, s1.acc: 93.8377, s1.loss_bbox: 0.1070, s1.loss_mask: 0.1216, s2.loss_cls: 0.0428, s2.acc: 93.9132, s2.loss_bbox: 0.0413, s2.loss_mask: 0.0570, loss: 1.2044
|
| 575 |
+
2025-07-02 13:32:45,266 - mmdet - INFO - Epoch [1][2050/7330] lr: 1.000e-04, eta: 3 days, 5:38:53, time: 0.982, data_time: 0.024, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0377, loss_rpn_bbox: 0.0269, s0.loss_cls: 0.1969, s0.acc: 93.4460, s0.loss_bbox: 0.2495, s0.loss_mask: 0.2523, s1.loss_cls: 0.0925, s1.acc: 93.6907, s1.loss_bbox: 0.1107, s1.loss_mask: 0.1231, s2.loss_cls: 0.0438, s2.acc: 93.7479, s2.loss_bbox: 0.0422, s2.loss_mask: 0.0575, loss: 1.2335
|
| 576 |
+
2025-07-02 13:33:33,755 - mmdet - INFO - Epoch [1][2100/7330] lr: 1.000e-04, eta: 3 days, 5:27:50, time: 0.970, data_time: 0.025, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0372, loss_rpn_bbox: 0.0257, s0.loss_cls: 0.1874, s0.acc: 93.7849, s0.loss_bbox: 0.2388, s0.loss_mask: 0.2433, s1.loss_cls: 0.0864, s1.acc: 94.0517, s1.loss_bbox: 0.1069, s1.loss_mask: 0.1204, s2.loss_cls: 0.0412, s2.acc: 94.1879, s2.loss_bbox: 0.0413, s2.loss_mask: 0.0560, loss: 1.1849
|
| 577 |
+
2025-07-02 13:34:22,335 - mmdet - INFO - Epoch [1][2150/7330] lr: 1.000e-04, eta: 3 days, 5:17:27, time: 0.972, data_time: 0.023, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0368, loss_rpn_bbox: 0.0264, s0.loss_cls: 0.1837, s0.acc: 93.8245, s0.loss_bbox: 0.2401, s0.loss_mask: 0.2482, s1.loss_cls: 0.0852, s1.acc: 94.1270, s1.loss_bbox: 0.1074, s1.loss_mask: 0.1223, s2.loss_cls: 0.0412, s2.acc: 94.1742, s2.loss_bbox: 0.0414, s2.loss_mask: 0.0573, loss: 1.1903
|
| 578 |
+
2025-07-02 13:35:11,193 - mmdet - INFO - Epoch [1][2200/7330] lr: 1.000e-04, eta: 3 days, 5:08:02, time: 0.977, data_time: 0.025, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0395, loss_rpn_bbox: 0.0271, s0.loss_cls: 0.1931, s0.acc: 93.6047, s0.loss_bbox: 0.2389, s0.loss_mask: 0.2445, s1.loss_cls: 0.0893, s1.acc: 93.9235, s1.loss_bbox: 0.1068, s1.loss_mask: 0.1207, s2.loss_cls: 0.0427, s2.acc: 94.0086, s2.loss_bbox: 0.0416, s2.loss_mask: 0.0568, loss: 1.2016
|
| 579 |
+
2025-07-02 13:35:59,585 - mmdet - INFO - Epoch [1][2250/7330] lr: 1.000e-04, eta: 3 days, 4:58:06, time: 0.968, data_time: 0.026, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0384, loss_rpn_bbox: 0.0270, s0.loss_cls: 0.1852, s0.acc: 93.7393, s0.loss_bbox: 0.2379, s0.loss_mask: 0.2417, s1.loss_cls: 0.0863, s1.acc: 94.0585, s1.loss_bbox: 0.1057, s1.loss_mask: 0.1191, s2.loss_cls: 0.0414, s2.acc: 94.1331, s2.loss_bbox: 0.0408, s2.loss_mask: 0.0554, loss: 1.1794
|
| 580 |
+
2025-07-02 13:37:09,408 - mmdet - INFO - Epoch [1][2300/7330] lr: 1.000e-04, eta: 3 days, 5:29:11, time: 1.396, data_time: 0.023, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0388, loss_rpn_bbox: 0.0276, s0.loss_cls: 0.2008, s0.acc: 93.3813, s0.loss_bbox: 0.2575, s0.loss_mask: 0.2496, s1.loss_cls: 0.0926, s1.acc: 93.7594, s1.loss_bbox: 0.1141, s1.loss_mask: 0.1221, s2.loss_cls: 0.0444, s2.acc: 93.7765, s2.loss_bbox: 0.0434, s2.loss_mask: 0.0575, loss: 1.2487
|
| 581 |
+
2025-07-02 13:37:57,541 - mmdet - INFO - Epoch [1][2350/7330] lr: 1.000e-04, eta: 3 days, 5:18:41, time: 0.963, data_time: 0.021, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0377, loss_rpn_bbox: 0.0265, s0.loss_cls: 0.1815, s0.acc: 93.9387, s0.loss_bbox: 0.2337, s0.loss_mask: 0.2443, s1.loss_cls: 0.0838, s1.acc: 94.2205, s1.loss_bbox: 0.1045, s1.loss_mask: 0.1194, s2.loss_cls: 0.0403, s2.acc: 94.3219, s2.loss_bbox: 0.0403, s2.loss_mask: 0.0559, loss: 1.1682
|
| 582 |
+
2025-07-02 13:38:45,946 - mmdet - INFO - Epoch [1][2400/7330] lr: 1.000e-04, eta: 3 days, 5:09:04, time: 0.968, data_time: 0.022, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0378, loss_rpn_bbox: 0.0270, s0.loss_cls: 0.1923, s0.acc: 93.5818, s0.loss_bbox: 0.2420, s0.loss_mask: 0.2498, s1.loss_cls: 0.0896, s1.acc: 93.8602, s1.loss_bbox: 0.1064, s1.loss_mask: 0.1212, s2.loss_cls: 0.0432, s2.acc: 93.9519, s2.loss_bbox: 0.0406, s2.loss_mask: 0.0563, loss: 1.2066
|
| 583 |
+
2025-07-02 13:39:34,605 - mmdet - INFO - Epoch [1][2450/7330] lr: 1.000e-04, eta: 3 days, 5:00:13, time: 0.973, data_time: 0.027, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0450, loss_rpn_bbox: 0.0285, s0.loss_cls: 0.1927, s0.acc: 93.5000, s0.loss_bbox: 0.2495, s0.loss_mask: 0.2503, s1.loss_cls: 0.0906, s1.acc: 93.7021, s1.loss_bbox: 0.1104, s1.loss_mask: 0.1232, s2.loss_cls: 0.0435, s2.acc: 93.7930, s2.loss_bbox: 0.0423, s2.loss_mask: 0.0570, loss: 1.2335
|
| 584 |
+
2025-07-02 13:40:23,098 - mmdet - INFO - Epoch [1][2500/7330] lr: 1.000e-04, eta: 3 days, 4:51:30, time: 0.970, data_time: 0.020, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0364, loss_rpn_bbox: 0.0254, s0.loss_cls: 0.1848, s0.acc: 93.9280, s0.loss_bbox: 0.2358, s0.loss_mask: 0.2378, s1.loss_cls: 0.0860, s1.acc: 94.1514, s1.loss_bbox: 0.1051, s1.loss_mask: 0.1179, s2.loss_cls: 0.0407, s2.acc: 94.3786, s2.loss_bbox: 0.0412, s2.loss_mask: 0.0553, loss: 1.1667
|
| 585 |
+
2025-07-02 13:41:11,271 - mmdet - INFO - Epoch [1][2550/7330] lr: 1.000e-04, eta: 3 days, 4:42:29, time: 0.963, data_time: 0.022, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0392, loss_rpn_bbox: 0.0256, s0.loss_cls: 0.1941, s0.acc: 93.5264, s0.loss_bbox: 0.2458, s0.loss_mask: 0.2535, s1.loss_cls: 0.0897, s1.acc: 93.7970, s1.loss_bbox: 0.1090, s1.loss_mask: 0.1241, s2.loss_cls: 0.0431, s2.acc: 93.8811, s2.loss_bbox: 0.0421, s2.loss_mask: 0.0580, loss: 1.2245
|
| 586 |
+
2025-07-02 13:41:59,880 - mmdet - INFO - Epoch [1][2600/7330] lr: 1.000e-04, eta: 3 days, 4:34:31, time: 0.972, data_time: 0.025, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0404, loss_rpn_bbox: 0.0265, s0.loss_cls: 0.1907, s0.acc: 93.7168, s0.loss_bbox: 0.2395, s0.loss_mask: 0.2395, s1.loss_cls: 0.0884, s1.acc: 93.9960, s1.loss_bbox: 0.1065, s1.loss_mask: 0.1183, s2.loss_cls: 0.0425, s2.acc: 94.0753, s2.loss_bbox: 0.0414, s2.loss_mask: 0.0554, loss: 1.1894
|
| 587 |
+
2025-07-02 13:42:48,779 - mmdet - INFO - Epoch [1][2650/7330] lr: 1.000e-04, eta: 3 days, 4:27:19, time: 0.978, data_time: 0.025, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0388, loss_rpn_bbox: 0.0254, s0.loss_cls: 0.1873, s0.acc: 93.7534, s0.loss_bbox: 0.2454, s0.loss_mask: 0.2455, s1.loss_cls: 0.0874, s1.acc: 94.0282, s1.loss_bbox: 0.1092, s1.loss_mask: 0.1217, s2.loss_cls: 0.0420, s2.acc: 94.0656, s2.loss_bbox: 0.0424, s2.loss_mask: 0.0570, loss: 1.2024
|
| 588 |
+
2025-07-02 13:43:54,106 - mmdet - INFO - Epoch [1][2700/7330] lr: 1.000e-04, eta: 3 days, 4:42:23, time: 1.251, data_time: 0.027, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0400, loss_rpn_bbox: 0.0271, s0.loss_cls: 0.1872, s0.acc: 93.6235, s0.loss_bbox: 0.2463, s0.loss_mask: 0.2484, s1.loss_cls: 0.0881, s1.acc: 93.8361, s1.loss_bbox: 0.1105, s1.loss_mask: 0.1221, s2.loss_cls: 0.0428, s2.acc: 93.8556, s2.loss_bbox: 0.0428, s2.loss_mask: 0.0570, loss: 1.2126
|
| 589 |
+
2025-07-02 13:44:42,314 - mmdet - INFO - Epoch [1][2750/7330] lr: 1.000e-04, eta: 3 days, 4:38:29, time: 1.019, data_time: 0.080, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0369, loss_rpn_bbox: 0.0272, s0.loss_cls: 0.1828, s0.acc: 93.8555, s0.loss_bbox: 0.2379, s0.loss_mask: 0.2413, s1.loss_cls: 0.0843, s1.acc: 94.2069, s1.loss_bbox: 0.1055, s1.loss_mask: 0.1199, s2.loss_cls: 0.0407, s2.acc: 94.3324, s2.loss_bbox: 0.0408, s2.loss_mask: 0.0569, loss: 1.1746
|
| 590 |
+
2025-07-02 13:45:30,488 - mmdet - INFO - Epoch [1][2800/7330] lr: 1.000e-04, eta: 3 days, 4:30:22, time: 0.963, data_time: 0.027, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0361, loss_rpn_bbox: 0.0257, s0.loss_cls: 0.1835, s0.acc: 93.8899, s0.loss_bbox: 0.2321, s0.loss_mask: 0.2401, s1.loss_cls: 0.0860, s1.acc: 94.0564, s1.loss_bbox: 0.1047, s1.loss_mask: 0.1190, s2.loss_cls: 0.0412, s2.acc: 94.1673, s2.loss_bbox: 0.0404, s2.loss_mask: 0.0554, loss: 1.1647
|
| 591 |
+
2025-07-02 13:46:19,162 - mmdet - INFO - Epoch [1][2850/7330] lr: 1.000e-04, eta: 3 days, 4:23:16, time: 0.973, data_time: 0.028, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0373, loss_rpn_bbox: 0.0268, s0.loss_cls: 0.1852, s0.acc: 93.8083, s0.loss_bbox: 0.2435, s0.loss_mask: 0.2463, s1.loss_cls: 0.0868, s1.acc: 93.9897, s1.loss_bbox: 0.1080, s1.loss_mask: 0.1196, s2.loss_cls: 0.0423, s2.acc: 93.9719, s2.loss_bbox: 0.0417, s2.loss_mask: 0.0560, loss: 1.1939
|
| 592 |
+
2025-07-02 13:47:07,365 - mmdet - INFO - Epoch [1][2900/7330] lr: 1.000e-04, eta: 3 days, 4:15:42, time: 0.964, data_time: 0.028, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0329, loss_rpn_bbox: 0.0254, s0.loss_cls: 0.1823, s0.acc: 93.8904, s0.loss_bbox: 0.2392, s0.loss_mask: 0.2470, s1.loss_cls: 0.0853, s1.acc: 94.1023, s1.loss_bbox: 0.1073, s1.loss_mask: 0.1210, s2.loss_cls: 0.0408, s2.acc: 94.1597, s2.loss_bbox: 0.0412, s2.loss_mask: 0.0564, loss: 1.1793
|
| 593 |
+
2025-07-02 13:47:56,072 - mmdet - INFO - Epoch [1][2950/7330] lr: 1.000e-04, eta: 3 days, 4:09:02, time: 0.974, data_time: 0.021, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0341, loss_rpn_bbox: 0.0252, s0.loss_cls: 0.1809, s0.acc: 93.9258, s0.loss_bbox: 0.2371, s0.loss_mask: 0.2377, s1.loss_cls: 0.0854, s1.acc: 94.0653, s1.loss_bbox: 0.1082, s1.loss_mask: 0.1178, s2.loss_cls: 0.0412, s2.acc: 94.1025, s2.loss_bbox: 0.0420, s2.loss_mask: 0.0550, loss: 1.1650
|
| 594 |
+
2025-07-02 13:48:44,210 - mmdet - INFO - Exp name: cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona_llama_moe.py
|
| 595 |
+
2025-07-02 13:48:44,211 - mmdet - INFO - Epoch [1][3000/7330] lr: 1.000e-04, eta: 3 days, 4:01:50, time: 0.963, data_time: 0.023, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0405, loss_rpn_bbox: 0.0286, s0.loss_cls: 0.1843, s0.acc: 93.7048, s0.loss_bbox: 0.2456, s0.loss_mask: 0.2489, s1.loss_cls: 0.0849, s1.acc: 94.0368, s1.loss_bbox: 0.1077, s1.loss_mask: 0.1223, s2.loss_cls: 0.0408, s2.acc: 94.1490, s2.loss_bbox: 0.0416, s2.loss_mask: 0.0568, loss: 1.2024
|
| 596 |
+
2025-07-02 13:49:32,724 - mmdet - INFO - Epoch [1][3050/7330] lr: 1.000e-04, eta: 3 days, 3:55:20, time: 0.970, data_time: 0.028, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0405, loss_rpn_bbox: 0.0278, s0.loss_cls: 0.1877, s0.acc: 93.6897, s0.loss_bbox: 0.2453, s0.loss_mask: 0.2545, s1.loss_cls: 0.0882, s1.acc: 93.8731, s1.loss_bbox: 0.1099, s1.loss_mask: 0.1257, s2.loss_cls: 0.0416, s2.acc: 94.0650, s2.loss_bbox: 0.0418, s2.loss_mask: 0.0591, loss: 1.2225
|
| 597 |
+
2025-07-02 13:50:21,384 - mmdet - INFO - Epoch [1][3100/7330] lr: 1.000e-04, eta: 3 days, 3:49:11, time: 0.973, data_time: 0.022, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0390, loss_rpn_bbox: 0.0262, s0.loss_cls: 0.1893, s0.acc: 93.6362, s0.loss_bbox: 0.2427, s0.loss_mask: 0.2475, s1.loss_cls: 0.0886, s1.acc: 93.8217, s1.loss_bbox: 0.1074, s1.loss_mask: 0.1223, s2.loss_cls: 0.0421, s2.acc: 93.9657, s2.loss_bbox: 0.0413, s2.loss_mask: 0.0575, loss: 1.2041
|
| 598 |
+
2025-07-02 13:51:22,019 - mmdet - INFO - Epoch [1][3150/7330] lr: 1.000e-04, eta: 3 days, 3:59:46, time: 1.213, data_time: 0.022, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0337, loss_rpn_bbox: 0.0258, s0.loss_cls: 0.1820, s0.acc: 93.9199, s0.loss_bbox: 0.2352, s0.loss_mask: 0.2402, s1.loss_cls: 0.0854, s1.acc: 94.1666, s1.loss_bbox: 0.1054, s1.loss_mask: 0.1190, s2.loss_cls: 0.0408, s2.acc: 94.2147, s2.loss_bbox: 0.0413, s2.loss_mask: 0.0561, loss: 1.1652
|
| 599 |
+
2025-07-02 13:52:10,664 - mmdet - INFO - Epoch [1][3200/7330] lr: 1.000e-04, eta: 3 days, 3:53:44, time: 0.973, data_time: 0.026, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0373, loss_rpn_bbox: 0.0270, s0.loss_cls: 0.1929, s0.acc: 93.5549, s0.loss_bbox: 0.2423, s0.loss_mask: 0.2405, s1.loss_cls: 0.0904, s1.acc: 93.7999, s1.loss_bbox: 0.1069, s1.loss_mask: 0.1180, s2.loss_cls: 0.0426, s2.acc: 93.9240, s2.loss_bbox: 0.0415, s2.loss_mask: 0.0552, loss: 1.1951
|
| 600 |
+
2025-07-02 13:52:59,547 - mmdet - INFO - Epoch [1][3250/7330] lr: 1.000e-04, eta: 3 days, 3:48:09, time: 0.978, data_time: 0.022, memory: 21698, balance_loss: 0.0003, loss_rpn_cls: 0.0386, loss_rpn_bbox: 0.0263, s0.loss_cls: 0.1925, s0.acc: 93.5605, s0.loss_bbox: 0.2469, s0.loss_mask: 0.2489, s1.loss_cls: 0.0899, s1.acc: 93.8169, s1.loss_bbox: 0.1119, s1.loss_mask: 0.1241, s2.loss_cls: 0.0432, s2.acc: 93.8767, s2.loss_bbox: 0.0438, s2.loss_mask: 0.0589, loss: 1.2253
|
| 601 |
+
2025-07-02 13:53:47,857 - mmdet - INFO - Epoch [1][3300/7330] lr: 1.000e-04, eta: 3 days, 3:41:58, time: 0.966, data_time: 0.023, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0381, loss_rpn_bbox: 0.0278, s0.loss_cls: 0.1897, s0.acc: 93.5981, s0.loss_bbox: 0.2448, s0.loss_mask: 0.2453, s1.loss_cls: 0.0888, s1.acc: 93.8614, s1.loss_bbox: 0.1093, s1.loss_mask: 0.1204, s2.loss_cls: 0.0431, s2.acc: 93.8512, s2.loss_bbox: 0.0428, s2.loss_mask: 0.0569, loss: 1.2072
|
| 602 |
+
2025-07-02 13:54:36,544 - mmdet - INFO - Epoch [1][3350/7330] lr: 1.000e-04, eta: 3 days, 3:36:25, time: 0.974, data_time: 0.024, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0371, loss_rpn_bbox: 0.0257, s0.loss_cls: 0.1867, s0.acc: 93.8193, s0.loss_bbox: 0.2387, s0.loss_mask: 0.2463, s1.loss_cls: 0.0882, s1.acc: 94.0322, s1.loss_bbox: 0.1077, s1.loss_mask: 0.1224, s2.loss_cls: 0.0428, s2.acc: 94.0282, s2.loss_bbox: 0.0420, s2.loss_mask: 0.0572, loss: 1.1951
|
| 603 |
+
2025-07-02 13:55:25,354 - mmdet - INFO - Epoch [1][3400/7330] lr: 1.000e-04, eta: 3 days, 3:31:10, time: 0.976, data_time: 0.027, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0378, loss_rpn_bbox: 0.0276, s0.loss_cls: 0.1858, s0.acc: 93.6411, s0.loss_bbox: 0.2447, s0.loss_mask: 0.2451, s1.loss_cls: 0.0868, s1.acc: 93.8109, s1.loss_bbox: 0.1097, s1.loss_mask: 0.1216, s2.loss_cls: 0.0416, s2.acc: 93.9548, s2.loss_bbox: 0.0425, s2.loss_mask: 0.0571, loss: 1.2006
|
| 604 |
+
2025-07-02 13:56:13,819 - mmdet - INFO - Epoch [1][3450/7330] lr: 1.000e-04, eta: 3 days, 3:25:37, time: 0.969, data_time: 0.022, memory: 21698, balance_loss: 0.0003, loss_rpn_cls: 0.0383, loss_rpn_bbox: 0.0281, s0.loss_cls: 0.1877, s0.acc: 93.7153, s0.loss_bbox: 0.2405, s0.loss_mask: 0.2454, s1.loss_cls: 0.0871, s1.acc: 94.0572, s1.loss_bbox: 0.1077, s1.loss_mask: 0.1212, s2.loss_cls: 0.0423, s2.acc: 94.0259, s2.loss_bbox: 0.0419, s2.loss_mask: 0.0568, loss: 1.1976
|
| 605 |
+
2025-07-02 13:57:02,430 - mmdet - INFO - Epoch [1][3500/7330] lr: 1.000e-04, eta: 3 days, 3:20:22, time: 0.972, data_time: 0.025, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0364, loss_rpn_bbox: 0.0269, s0.loss_cls: 0.1867, s0.acc: 93.8547, s0.loss_bbox: 0.2438, s0.loss_mask: 0.2456, s1.loss_cls: 0.0869, s1.acc: 94.1400, s1.loss_bbox: 0.1080, s1.loss_mask: 0.1212, s2.loss_cls: 0.0416, s2.acc: 94.1682, s2.loss_bbox: 0.0410, s2.loss_mask: 0.0565, loss: 1.1949
|
| 606 |
+
2025-07-02 13:58:12,861 - mmdet - INFO - Epoch [1][3550/7330] lr: 1.000e-04, eta: 3 days, 3:41:57, time: 1.409, data_time: 0.026, memory: 21698, balance_loss: 0.0003, loss_rpn_cls: 0.0355, loss_rpn_bbox: 0.0243, s0.loss_cls: 0.1857, s0.acc: 93.8430, s0.loss_bbox: 0.2425, s0.loss_mask: 0.2442, s1.loss_cls: 0.0860, s1.acc: 94.1098, s1.loss_bbox: 0.1083, s1.loss_mask: 0.1206, s2.loss_cls: 0.0419, s2.acc: 94.0926, s2.loss_bbox: 0.0422, s2.loss_mask: 0.0570, loss: 1.1885
|
| 607 |
+
2025-07-02 13:59:01,271 - mmdet - INFO - Epoch [1][3600/7330] lr: 1.000e-04, eta: 3 days, 3:36:20, time: 0.968, data_time: 0.027, memory: 21698, balance_loss: 0.0003, loss_rpn_cls: 0.0355, loss_rpn_bbox: 0.0266, s0.loss_cls: 0.1838, s0.acc: 93.7742, s0.loss_bbox: 0.2424, s0.loss_mask: 0.2470, s1.loss_cls: 0.0856, s1.acc: 94.0677, s1.loss_bbox: 0.1087, s1.loss_mask: 0.1223, s2.loss_cls: 0.0415, s2.acc: 94.1235, s2.loss_bbox: 0.0425, s2.loss_mask: 0.0573, loss: 1.1934
|
| 608 |
+
2025-07-02 13:59:49,993 - mmdet - INFO - Epoch [1][3650/7330] lr: 1.000e-04, eta: 3 days, 3:31:12, time: 0.974, data_time: 0.023, memory: 21698, balance_loss: 0.0003, loss_rpn_cls: 0.0393, loss_rpn_bbox: 0.0263, s0.loss_cls: 0.1887, s0.acc: 93.6582, s0.loss_bbox: 0.2443, s0.loss_mask: 0.2446, s1.loss_cls: 0.0888, s1.acc: 93.8015, s1.loss_bbox: 0.1078, s1.loss_mask: 0.1202, s2.loss_cls: 0.0425, s2.acc: 93.9605, s2.loss_bbox: 0.0413, s2.loss_mask: 0.0561, loss: 1.2001
|
| 609 |
+
2025-07-02 14:00:38,867 - mmdet - INFO - Epoch [1][3700/7330] lr: 1.000e-04, eta: 3 days, 3:26:25, time: 0.978, data_time: 0.023, memory: 21698, balance_loss: 0.0003, loss_rpn_cls: 0.0376, loss_rpn_bbox: 0.0284, s0.loss_cls: 0.1817, s0.acc: 93.8740, s0.loss_bbox: 0.2434, s0.loss_mask: 0.2365, s1.loss_cls: 0.0839, s1.acc: 94.1783, s1.loss_bbox: 0.1086, s1.loss_mask: 0.1173, s2.loss_cls: 0.0401, s2.acc: 94.2137, s2.loss_bbox: 0.0420, s2.loss_mask: 0.0549, loss: 1.1747
|
| 610 |
+
2025-07-02 14:01:27,482 - mmdet - INFO - Epoch [1][3750/7330] lr: 1.000e-04, eta: 3 days, 3:21:25, time: 0.972, data_time: 0.022, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0407, loss_rpn_bbox: 0.0282, s0.loss_cls: 0.1954, s0.acc: 93.4277, s0.loss_bbox: 0.2569, s0.loss_mask: 0.2490, s1.loss_cls: 0.0909, s1.acc: 93.7575, s1.loss_bbox: 0.1118, s1.loss_mask: 0.1224, s2.loss_cls: 0.0440, s2.acc: 93.7369, s2.loss_bbox: 0.0434, s2.loss_mask: 0.0569, loss: 1.2399
|
| 611 |
+
2025-07-02 14:02:16,051 - mmdet - INFO - Epoch [1][3800/7330] lr: 1.000e-04, eta: 3 days, 3:16:27, time: 0.971, data_time: 0.025, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0383, loss_rpn_bbox: 0.0263, s0.loss_cls: 0.1908, s0.acc: 93.6335, s0.loss_bbox: 0.2404, s0.loss_mask: 0.2441, s1.loss_cls: 0.0895, s1.acc: 93.9461, s1.loss_bbox: 0.1061, s1.loss_mask: 0.1195, s2.loss_cls: 0.0424, s2.acc: 94.0255, s2.loss_bbox: 0.0408, s2.loss_mask: 0.0560, loss: 1.1946
|
| 612 |
+
2025-07-02 14:03:05,063 - mmdet - INFO - Epoch [1][3850/7330] lr: 1.000e-04, eta: 3 days, 3:12:07, time: 0.980, data_time: 0.026, memory: 21698, balance_loss: 0.0004, loss_rpn_cls: 0.0388, loss_rpn_bbox: 0.0284, s0.loss_cls: 0.1896, s0.acc: 93.5769, s0.loss_bbox: 0.2487, s0.loss_mask: 0.2500, s1.loss_cls: 0.0897, s1.acc: 93.7279, s1.loss_bbox: 0.1108, s1.loss_mask: 0.1225, s2.loss_cls: 0.0429, s2.acc: 93.8040, s2.loss_bbox: 0.0422, s2.loss_mask: 0.0573, loss: 1.2213
|
| 613 |
+
2025-07-02 14:03:53,578 - mmdet - INFO - Epoch [1][3900/7330] lr: 1.000e-04, eta: 3 days, 3:07:19, time: 0.970, data_time: 0.023, memory: 21698, balance_loss: 0.0003, loss_rpn_cls: 0.0363, loss_rpn_bbox: 0.0260, s0.loss_cls: 0.1896, s0.acc: 93.6399, s0.loss_bbox: 0.2472, s0.loss_mask: 0.2460, s1.loss_cls: 0.0871, s1.acc: 93.8847, s1.loss_bbox: 0.1105, s1.loss_mask: 0.1210, s2.loss_cls: 0.0422, s2.acc: 93.8701, s2.loss_bbox: 0.0426, s2.loss_mask: 0.0563, loss: 1.2051
|
mmdet/results/train/mona_llama_moe_5_8_1e-4/20250702_125523.log.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cade930c7d3e39be1fc2ffc7f13ecd49a45e41b0ab4a3fa5b44af4d09783e68a
|
| 3 |
+
size 57221
|
mmdet/results/train/mona_llama_moe_5_8_1e-4/cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona_llama_moe.py
ADDED
|
@@ -0,0 +1,438 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
model = dict(
|
| 2 |
+
type='CascadeRCNN_loss',
|
| 3 |
+
pretrained=None,
|
| 4 |
+
backbone=dict(
|
| 5 |
+
type='SwinTransformer_mona_llama_moe',
|
| 6 |
+
embed_dim=128,
|
| 7 |
+
depths=[2, 2, 18, 2],
|
| 8 |
+
num_heads=[4, 8, 16, 32],
|
| 9 |
+
window_size=7,
|
| 10 |
+
mlp_ratio=4.0,
|
| 11 |
+
qkv_bias=True,
|
| 12 |
+
qk_scale=None,
|
| 13 |
+
drop_rate=0.0,
|
| 14 |
+
attn_drop_rate=0.0,
|
| 15 |
+
drop_path_rate=0.3,
|
| 16 |
+
ape=False,
|
| 17 |
+
patch_norm=True,
|
| 18 |
+
out_indices=(0, 1, 2, 3),
|
| 19 |
+
use_checkpoint=False),
|
| 20 |
+
neck=dict(
|
| 21 |
+
type='FPN',
|
| 22 |
+
in_channels=[128, 256, 512, 1024],
|
| 23 |
+
out_channels=256,
|
| 24 |
+
num_outs=5),
|
| 25 |
+
rpn_head=dict(
|
| 26 |
+
type='RPNHead',
|
| 27 |
+
in_channels=256,
|
| 28 |
+
feat_channels=256,
|
| 29 |
+
anchor_generator=dict(
|
| 30 |
+
type='AnchorGenerator',
|
| 31 |
+
scales=[8],
|
| 32 |
+
ratios=[0.5, 1.0, 2.0],
|
| 33 |
+
strides=[4, 8, 16, 32, 64]),
|
| 34 |
+
bbox_coder=dict(
|
| 35 |
+
type='DeltaXYWHBBoxCoder',
|
| 36 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 37 |
+
target_stds=[1.0, 1.0, 1.0, 1.0]),
|
| 38 |
+
loss_cls=dict(
|
| 39 |
+
type='CrossEntropyLoss', use_sigmoid=True, loss_weight=1.0),
|
| 40 |
+
loss_bbox=dict(
|
| 41 |
+
type='SmoothL1Loss', beta=0.1111111111111111, loss_weight=1.0)),
|
| 42 |
+
roi_head=dict(
|
| 43 |
+
type='CascadeRoIHead',
|
| 44 |
+
num_stages=3,
|
| 45 |
+
stage_loss_weights=[1, 0.5, 0.25],
|
| 46 |
+
bbox_roi_extractor=dict(
|
| 47 |
+
type='SingleRoIExtractor',
|
| 48 |
+
roi_layer=dict(type='RoIAlign', output_size=7, sampling_ratio=0),
|
| 49 |
+
out_channels=256,
|
| 50 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 51 |
+
bbox_head=[
|
| 52 |
+
dict(
|
| 53 |
+
type='ConvFCBBoxHead',
|
| 54 |
+
num_shared_convs=4,
|
| 55 |
+
num_shared_fcs=1,
|
| 56 |
+
in_channels=256,
|
| 57 |
+
conv_out_channels=256,
|
| 58 |
+
fc_out_channels=1024,
|
| 59 |
+
roi_feat_size=7,
|
| 60 |
+
num_classes=80,
|
| 61 |
+
bbox_coder=dict(
|
| 62 |
+
type='DeltaXYWHBBoxCoder',
|
| 63 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 64 |
+
target_stds=[0.1, 0.1, 0.2, 0.2]),
|
| 65 |
+
reg_class_agnostic=False,
|
| 66 |
+
reg_decoded_bbox=True,
|
| 67 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 68 |
+
loss_cls=dict(
|
| 69 |
+
type='CrossEntropyLoss',
|
| 70 |
+
use_sigmoid=False,
|
| 71 |
+
loss_weight=1.0),
|
| 72 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 73 |
+
dict(
|
| 74 |
+
type='ConvFCBBoxHead',
|
| 75 |
+
num_shared_convs=4,
|
| 76 |
+
num_shared_fcs=1,
|
| 77 |
+
in_channels=256,
|
| 78 |
+
conv_out_channels=256,
|
| 79 |
+
fc_out_channels=1024,
|
| 80 |
+
roi_feat_size=7,
|
| 81 |
+
num_classes=80,
|
| 82 |
+
bbox_coder=dict(
|
| 83 |
+
type='DeltaXYWHBBoxCoder',
|
| 84 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 85 |
+
target_stds=[0.05, 0.05, 0.1, 0.1]),
|
| 86 |
+
reg_class_agnostic=False,
|
| 87 |
+
reg_decoded_bbox=True,
|
| 88 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 89 |
+
loss_cls=dict(
|
| 90 |
+
type='CrossEntropyLoss',
|
| 91 |
+
use_sigmoid=False,
|
| 92 |
+
loss_weight=1.0),
|
| 93 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 94 |
+
dict(
|
| 95 |
+
type='ConvFCBBoxHead',
|
| 96 |
+
num_shared_convs=4,
|
| 97 |
+
num_shared_fcs=1,
|
| 98 |
+
in_channels=256,
|
| 99 |
+
conv_out_channels=256,
|
| 100 |
+
fc_out_channels=1024,
|
| 101 |
+
roi_feat_size=7,
|
| 102 |
+
num_classes=80,
|
| 103 |
+
bbox_coder=dict(
|
| 104 |
+
type='DeltaXYWHBBoxCoder',
|
| 105 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 106 |
+
target_stds=[0.033, 0.033, 0.067, 0.067]),
|
| 107 |
+
reg_class_agnostic=False,
|
| 108 |
+
reg_decoded_bbox=True,
|
| 109 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 110 |
+
loss_cls=dict(
|
| 111 |
+
type='CrossEntropyLoss',
|
| 112 |
+
use_sigmoid=False,
|
| 113 |
+
loss_weight=1.0),
|
| 114 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0))
|
| 115 |
+
],
|
| 116 |
+
mask_roi_extractor=dict(
|
| 117 |
+
type='SingleRoIExtractor',
|
| 118 |
+
roi_layer=dict(type='RoIAlign', output_size=14, sampling_ratio=0),
|
| 119 |
+
out_channels=256,
|
| 120 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 121 |
+
mask_head=dict(
|
| 122 |
+
type='FCNMaskHead',
|
| 123 |
+
num_convs=4,
|
| 124 |
+
in_channels=256,
|
| 125 |
+
conv_out_channels=256,
|
| 126 |
+
num_classes=80,
|
| 127 |
+
loss_mask=dict(
|
| 128 |
+
type='CrossEntropyLoss', use_mask=True, loss_weight=1.0))),
|
| 129 |
+
train_cfg=dict(
|
| 130 |
+
rpn=dict(
|
| 131 |
+
assigner=dict(
|
| 132 |
+
type='MaxIoUAssigner',
|
| 133 |
+
pos_iou_thr=0.7,
|
| 134 |
+
neg_iou_thr=0.3,
|
| 135 |
+
min_pos_iou=0.3,
|
| 136 |
+
match_low_quality=True,
|
| 137 |
+
ignore_iof_thr=-1),
|
| 138 |
+
sampler=dict(
|
| 139 |
+
type='RandomSampler',
|
| 140 |
+
num=256,
|
| 141 |
+
pos_fraction=0.5,
|
| 142 |
+
neg_pos_ub=-1,
|
| 143 |
+
add_gt_as_proposals=False),
|
| 144 |
+
allowed_border=0,
|
| 145 |
+
pos_weight=-1,
|
| 146 |
+
debug=False),
|
| 147 |
+
rpn_proposal=dict(
|
| 148 |
+
nms_across_levels=False,
|
| 149 |
+
nms_pre=2000,
|
| 150 |
+
nms_post=2000,
|
| 151 |
+
max_per_img=2000,
|
| 152 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 153 |
+
min_bbox_size=0),
|
| 154 |
+
rcnn=[
|
| 155 |
+
dict(
|
| 156 |
+
assigner=dict(
|
| 157 |
+
type='MaxIoUAssigner',
|
| 158 |
+
pos_iou_thr=0.5,
|
| 159 |
+
neg_iou_thr=0.5,
|
| 160 |
+
min_pos_iou=0.5,
|
| 161 |
+
match_low_quality=False,
|
| 162 |
+
ignore_iof_thr=-1),
|
| 163 |
+
sampler=dict(
|
| 164 |
+
type='RandomSampler',
|
| 165 |
+
num=512,
|
| 166 |
+
pos_fraction=0.25,
|
| 167 |
+
neg_pos_ub=-1,
|
| 168 |
+
add_gt_as_proposals=True),
|
| 169 |
+
mask_size=28,
|
| 170 |
+
pos_weight=-1,
|
| 171 |
+
debug=False),
|
| 172 |
+
dict(
|
| 173 |
+
assigner=dict(
|
| 174 |
+
type='MaxIoUAssigner',
|
| 175 |
+
pos_iou_thr=0.6,
|
| 176 |
+
neg_iou_thr=0.6,
|
| 177 |
+
min_pos_iou=0.6,
|
| 178 |
+
match_low_quality=False,
|
| 179 |
+
ignore_iof_thr=-1),
|
| 180 |
+
sampler=dict(
|
| 181 |
+
type='RandomSampler',
|
| 182 |
+
num=512,
|
| 183 |
+
pos_fraction=0.25,
|
| 184 |
+
neg_pos_ub=-1,
|
| 185 |
+
add_gt_as_proposals=True),
|
| 186 |
+
mask_size=28,
|
| 187 |
+
pos_weight=-1,
|
| 188 |
+
debug=False),
|
| 189 |
+
dict(
|
| 190 |
+
assigner=dict(
|
| 191 |
+
type='MaxIoUAssigner',
|
| 192 |
+
pos_iou_thr=0.7,
|
| 193 |
+
neg_iou_thr=0.7,
|
| 194 |
+
min_pos_iou=0.7,
|
| 195 |
+
match_low_quality=False,
|
| 196 |
+
ignore_iof_thr=-1),
|
| 197 |
+
sampler=dict(
|
| 198 |
+
type='RandomSampler',
|
| 199 |
+
num=512,
|
| 200 |
+
pos_fraction=0.25,
|
| 201 |
+
neg_pos_ub=-1,
|
| 202 |
+
add_gt_as_proposals=True),
|
| 203 |
+
mask_size=28,
|
| 204 |
+
pos_weight=-1,
|
| 205 |
+
debug=False)
|
| 206 |
+
]),
|
| 207 |
+
test_cfg=dict(
|
| 208 |
+
rpn=dict(
|
| 209 |
+
nms_across_levels=False,
|
| 210 |
+
nms_pre=1000,
|
| 211 |
+
nms_post=1000,
|
| 212 |
+
max_per_img=1000,
|
| 213 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 214 |
+
min_bbox_size=0),
|
| 215 |
+
rcnn=dict(
|
| 216 |
+
score_thr=0.05,
|
| 217 |
+
nms=dict(type='nms', iou_threshold=0.5),
|
| 218 |
+
max_per_img=100,
|
| 219 |
+
mask_thr_binary=0.5)))
|
| 220 |
+
dataset_type = 'CocoDataset'
|
| 221 |
+
data_root = '/root/autodl-tmp/COCO2017/'
|
| 222 |
+
img_norm_cfg = dict(
|
| 223 |
+
mean=[123.675, 116.28, 103.53], std=[58.395, 57.12, 57.375], to_rgb=True)
|
| 224 |
+
train_pipeline = [
|
| 225 |
+
dict(type='LoadImageFromFile'),
|
| 226 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 227 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 228 |
+
dict(
|
| 229 |
+
type='AutoAugment',
|
| 230 |
+
policies=[[{
|
| 231 |
+
'type':
|
| 232 |
+
'Resize',
|
| 233 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333), (576, 1333),
|
| 234 |
+
(608, 1333), (640, 1333), (672, 1333), (704, 1333),
|
| 235 |
+
(736, 1333), (768, 1333), (800, 1333)],
|
| 236 |
+
'multiscale_mode':
|
| 237 |
+
'value',
|
| 238 |
+
'keep_ratio':
|
| 239 |
+
True
|
| 240 |
+
}],
|
| 241 |
+
[{
|
| 242 |
+
'type': 'Resize',
|
| 243 |
+
'img_scale': [(400, 1333), (500, 1333), (600, 1333)],
|
| 244 |
+
'multiscale_mode': 'value',
|
| 245 |
+
'keep_ratio': True
|
| 246 |
+
}, {
|
| 247 |
+
'type': 'RandomCrop',
|
| 248 |
+
'crop_type': 'absolute_range',
|
| 249 |
+
'crop_size': (384, 600),
|
| 250 |
+
'allow_negative_crop': True
|
| 251 |
+
}, {
|
| 252 |
+
'type':
|
| 253 |
+
'Resize',
|
| 254 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 255 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 256 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 257 |
+
(768, 1333), (800, 1333)],
|
| 258 |
+
'multiscale_mode':
|
| 259 |
+
'value',
|
| 260 |
+
'override':
|
| 261 |
+
True,
|
| 262 |
+
'keep_ratio':
|
| 263 |
+
True
|
| 264 |
+
}]]),
|
| 265 |
+
dict(
|
| 266 |
+
type='Normalize',
|
| 267 |
+
mean=[123.675, 116.28, 103.53],
|
| 268 |
+
std=[58.395, 57.12, 57.375],
|
| 269 |
+
to_rgb=True),
|
| 270 |
+
dict(type='Pad', size_divisor=32),
|
| 271 |
+
dict(type='DefaultFormatBundle'),
|
| 272 |
+
dict(type='Collect', keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 273 |
+
]
|
| 274 |
+
test_pipeline = [
|
| 275 |
+
dict(type='LoadImageFromFile'),
|
| 276 |
+
dict(
|
| 277 |
+
type='MultiScaleFlipAug',
|
| 278 |
+
img_scale=(1333, 800),
|
| 279 |
+
flip=False,
|
| 280 |
+
transforms=[
|
| 281 |
+
dict(type='Resize', keep_ratio=True),
|
| 282 |
+
dict(type='RandomFlip'),
|
| 283 |
+
dict(
|
| 284 |
+
type='Normalize',
|
| 285 |
+
mean=[123.675, 116.28, 103.53],
|
| 286 |
+
std=[58.395, 57.12, 57.375],
|
| 287 |
+
to_rgb=True),
|
| 288 |
+
dict(type='Pad', size_divisor=32),
|
| 289 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 290 |
+
dict(type='Collect', keys=['img'])
|
| 291 |
+
])
|
| 292 |
+
]
|
| 293 |
+
data = dict(
|
| 294 |
+
samples_per_gpu=2,
|
| 295 |
+
workers_per_gpu=4,
|
| 296 |
+
train=dict(
|
| 297 |
+
type='CocoDataset',
|
| 298 |
+
ann_file=
|
| 299 |
+
'/root/autodl-tmp/COCO2017/annotations/instances_train2017.json',
|
| 300 |
+
img_prefix='/root/autodl-tmp/COCO2017/train2017/',
|
| 301 |
+
pipeline=[
|
| 302 |
+
dict(type='LoadImageFromFile'),
|
| 303 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 304 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 305 |
+
dict(
|
| 306 |
+
type='AutoAugment',
|
| 307 |
+
policies=[[{
|
| 308 |
+
'type':
|
| 309 |
+
'Resize',
|
| 310 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 311 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 312 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 313 |
+
(768, 1333), (800, 1333)],
|
| 314 |
+
'multiscale_mode':
|
| 315 |
+
'value',
|
| 316 |
+
'keep_ratio':
|
| 317 |
+
True
|
| 318 |
+
}],
|
| 319 |
+
[{
|
| 320 |
+
'type': 'Resize',
|
| 321 |
+
'img_scale': [(400, 1333), (500, 1333),
|
| 322 |
+
(600, 1333)],
|
| 323 |
+
'multiscale_mode': 'value',
|
| 324 |
+
'keep_ratio': True
|
| 325 |
+
}, {
|
| 326 |
+
'type': 'RandomCrop',
|
| 327 |
+
'crop_type': 'absolute_range',
|
| 328 |
+
'crop_size': (384, 600),
|
| 329 |
+
'allow_negative_crop': True
|
| 330 |
+
}, {
|
| 331 |
+
'type':
|
| 332 |
+
'Resize',
|
| 333 |
+
'img_scale': [(480, 1333), (512, 1333),
|
| 334 |
+
(544, 1333), (576, 1333),
|
| 335 |
+
(608, 1333), (640, 1333),
|
| 336 |
+
(672, 1333), (704, 1333),
|
| 337 |
+
(736, 1333), (768, 1333),
|
| 338 |
+
(800, 1333)],
|
| 339 |
+
'multiscale_mode':
|
| 340 |
+
'value',
|
| 341 |
+
'override':
|
| 342 |
+
True,
|
| 343 |
+
'keep_ratio':
|
| 344 |
+
True
|
| 345 |
+
}]]),
|
| 346 |
+
dict(
|
| 347 |
+
type='Normalize',
|
| 348 |
+
mean=[123.675, 116.28, 103.53],
|
| 349 |
+
std=[58.395, 57.12, 57.375],
|
| 350 |
+
to_rgb=True),
|
| 351 |
+
dict(type='Pad', size_divisor=32),
|
| 352 |
+
dict(type='DefaultFormatBundle'),
|
| 353 |
+
dict(
|
| 354 |
+
type='Collect',
|
| 355 |
+
keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 356 |
+
]),
|
| 357 |
+
val=dict(
|
| 358 |
+
type='CocoDataset',
|
| 359 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 360 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 361 |
+
pipeline=[
|
| 362 |
+
dict(type='LoadImageFromFile'),
|
| 363 |
+
dict(
|
| 364 |
+
type='MultiScaleFlipAug',
|
| 365 |
+
img_scale=(1333, 800),
|
| 366 |
+
flip=False,
|
| 367 |
+
transforms=[
|
| 368 |
+
dict(type='Resize', keep_ratio=True),
|
| 369 |
+
dict(type='RandomFlip'),
|
| 370 |
+
dict(
|
| 371 |
+
type='Normalize',
|
| 372 |
+
mean=[123.675, 116.28, 103.53],
|
| 373 |
+
std=[58.395, 57.12, 57.375],
|
| 374 |
+
to_rgb=True),
|
| 375 |
+
dict(type='Pad', size_divisor=32),
|
| 376 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 377 |
+
dict(type='Collect', keys=['img'])
|
| 378 |
+
])
|
| 379 |
+
]),
|
| 380 |
+
test=dict(
|
| 381 |
+
type='CocoDataset',
|
| 382 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 383 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 384 |
+
pipeline=[
|
| 385 |
+
dict(type='LoadImageFromFile'),
|
| 386 |
+
dict(
|
| 387 |
+
type='MultiScaleFlipAug',
|
| 388 |
+
img_scale=(1333, 800),
|
| 389 |
+
flip=False,
|
| 390 |
+
transforms=[
|
| 391 |
+
dict(type='Resize', keep_ratio=True),
|
| 392 |
+
dict(type='RandomFlip'),
|
| 393 |
+
dict(
|
| 394 |
+
type='Normalize',
|
| 395 |
+
mean=[123.675, 116.28, 103.53],
|
| 396 |
+
std=[58.395, 57.12, 57.375],
|
| 397 |
+
to_rgb=True),
|
| 398 |
+
dict(type='Pad', size_divisor=32),
|
| 399 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 400 |
+
dict(type='Collect', keys=['img'])
|
| 401 |
+
])
|
| 402 |
+
]))
|
| 403 |
+
evaluation = dict(metric=['bbox', 'segm'], gpu_collect=True)
|
| 404 |
+
optimizer = dict(
|
| 405 |
+
type='AdamW',
|
| 406 |
+
lr=0.0001,
|
| 407 |
+
betas=(0.9, 0.999),
|
| 408 |
+
weight_decay=0.05,
|
| 409 |
+
paramwise_cfg=dict(
|
| 410 |
+
custom_keys=dict(
|
| 411 |
+
absolute_pos_embed=dict(decay_mult=0.0),
|
| 412 |
+
relative_position_bias_table=dict(decay_mult=0.0),
|
| 413 |
+
norm=dict(decay_mult=0.0))))
|
| 414 |
+
optimizer_config = dict(
|
| 415 |
+
grad_clip=None,
|
| 416 |
+
type='DistOptimizerHook',
|
| 417 |
+
update_interval=1,
|
| 418 |
+
coalesce=True,
|
| 419 |
+
bucket_size_mb=-1,
|
| 420 |
+
use_fp16=True)
|
| 421 |
+
lr_config = dict(
|
| 422 |
+
policy='step',
|
| 423 |
+
warmup='linear',
|
| 424 |
+
warmup_iters=500,
|
| 425 |
+
warmup_ratio=0.001,
|
| 426 |
+
step=[27, 33])
|
| 427 |
+
runner = dict(type='EpochBasedRunnerAmp', max_epochs=36)
|
| 428 |
+
checkpoint_config = dict(interval=1)
|
| 429 |
+
log_config = dict(interval=50, hooks=[dict(type='TextLoggerHook')])
|
| 430 |
+
custom_hooks = [dict(type='NumClassCheckHook')]
|
| 431 |
+
dist_params = dict(backend='nccl')
|
| 432 |
+
log_level = 'INFO'
|
| 433 |
+
load_from = '/root/autodl-tmp/caihaojie/mona/Swin-Transformer-Object-Detection/pretrained_model/swin_base_mona_llama_moe_8.pth'
|
| 434 |
+
resume_from = None
|
| 435 |
+
workflow = [('train', 1)]
|
| 436 |
+
fp16 = None
|
| 437 |
+
work_dir = './results/train/mona_llama_moe_5_8_1e-4/'
|
| 438 |
+
gpu_ids = range(0, 8)
|
mmdet/results/train/mona_llama_moe_distill_4_16_1e-4/20250620_180057.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
mmdet/results/train/mona_llama_moe_distill_4_16_1e-4/20250620_180057.log.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d92d5ef30b6713785effc9b0d48813c1994270b57e37fdb7d900dc3d6215adf0
|
| 3 |
+
size 186899
|
mmdet/results/train/mona_llama_moe_distill_4_16_1e-4/cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona_llama_moe_distill.py
ADDED
|
@@ -0,0 +1,438 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
model = dict(
|
| 2 |
+
type='CascadeRCNN_loss',
|
| 3 |
+
pretrained=None,
|
| 4 |
+
backbone=dict(
|
| 5 |
+
type='SwinTransformer_mona_llama_moe_distill',
|
| 6 |
+
embed_dim=128,
|
| 7 |
+
depths=[2, 2, 18, 2],
|
| 8 |
+
num_heads=[4, 8, 16, 32],
|
| 9 |
+
window_size=7,
|
| 10 |
+
mlp_ratio=4.0,
|
| 11 |
+
qkv_bias=True,
|
| 12 |
+
qk_scale=None,
|
| 13 |
+
drop_rate=0.0,
|
| 14 |
+
attn_drop_rate=0.0,
|
| 15 |
+
drop_path_rate=0.3,
|
| 16 |
+
ape=False,
|
| 17 |
+
patch_norm=True,
|
| 18 |
+
out_indices=(0, 1, 2, 3),
|
| 19 |
+
use_checkpoint=False),
|
| 20 |
+
neck=dict(
|
| 21 |
+
type='FPN',
|
| 22 |
+
in_channels=[128, 256, 512, 1024],
|
| 23 |
+
out_channels=256,
|
| 24 |
+
num_outs=5),
|
| 25 |
+
rpn_head=dict(
|
| 26 |
+
type='RPNHead',
|
| 27 |
+
in_channels=256,
|
| 28 |
+
feat_channels=256,
|
| 29 |
+
anchor_generator=dict(
|
| 30 |
+
type='AnchorGenerator',
|
| 31 |
+
scales=[8],
|
| 32 |
+
ratios=[0.5, 1.0, 2.0],
|
| 33 |
+
strides=[4, 8, 16, 32, 64]),
|
| 34 |
+
bbox_coder=dict(
|
| 35 |
+
type='DeltaXYWHBBoxCoder',
|
| 36 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 37 |
+
target_stds=[1.0, 1.0, 1.0, 1.0]),
|
| 38 |
+
loss_cls=dict(
|
| 39 |
+
type='CrossEntropyLoss', use_sigmoid=True, loss_weight=1.0),
|
| 40 |
+
loss_bbox=dict(
|
| 41 |
+
type='SmoothL1Loss', beta=0.1111111111111111, loss_weight=1.0)),
|
| 42 |
+
roi_head=dict(
|
| 43 |
+
type='CascadeRoIHead',
|
| 44 |
+
num_stages=3,
|
| 45 |
+
stage_loss_weights=[1, 0.5, 0.25],
|
| 46 |
+
bbox_roi_extractor=dict(
|
| 47 |
+
type='SingleRoIExtractor',
|
| 48 |
+
roi_layer=dict(type='RoIAlign', output_size=7, sampling_ratio=0),
|
| 49 |
+
out_channels=256,
|
| 50 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 51 |
+
bbox_head=[
|
| 52 |
+
dict(
|
| 53 |
+
type='ConvFCBBoxHead',
|
| 54 |
+
num_shared_convs=4,
|
| 55 |
+
num_shared_fcs=1,
|
| 56 |
+
in_channels=256,
|
| 57 |
+
conv_out_channels=256,
|
| 58 |
+
fc_out_channels=1024,
|
| 59 |
+
roi_feat_size=7,
|
| 60 |
+
num_classes=80,
|
| 61 |
+
bbox_coder=dict(
|
| 62 |
+
type='DeltaXYWHBBoxCoder',
|
| 63 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 64 |
+
target_stds=[0.1, 0.1, 0.2, 0.2]),
|
| 65 |
+
reg_class_agnostic=False,
|
| 66 |
+
reg_decoded_bbox=True,
|
| 67 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 68 |
+
loss_cls=dict(
|
| 69 |
+
type='CrossEntropyLoss',
|
| 70 |
+
use_sigmoid=False,
|
| 71 |
+
loss_weight=1.0),
|
| 72 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 73 |
+
dict(
|
| 74 |
+
type='ConvFCBBoxHead',
|
| 75 |
+
num_shared_convs=4,
|
| 76 |
+
num_shared_fcs=1,
|
| 77 |
+
in_channels=256,
|
| 78 |
+
conv_out_channels=256,
|
| 79 |
+
fc_out_channels=1024,
|
| 80 |
+
roi_feat_size=7,
|
| 81 |
+
num_classes=80,
|
| 82 |
+
bbox_coder=dict(
|
| 83 |
+
type='DeltaXYWHBBoxCoder',
|
| 84 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 85 |
+
target_stds=[0.05, 0.05, 0.1, 0.1]),
|
| 86 |
+
reg_class_agnostic=False,
|
| 87 |
+
reg_decoded_bbox=True,
|
| 88 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 89 |
+
loss_cls=dict(
|
| 90 |
+
type='CrossEntropyLoss',
|
| 91 |
+
use_sigmoid=False,
|
| 92 |
+
loss_weight=1.0),
|
| 93 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 94 |
+
dict(
|
| 95 |
+
type='ConvFCBBoxHead',
|
| 96 |
+
num_shared_convs=4,
|
| 97 |
+
num_shared_fcs=1,
|
| 98 |
+
in_channels=256,
|
| 99 |
+
conv_out_channels=256,
|
| 100 |
+
fc_out_channels=1024,
|
| 101 |
+
roi_feat_size=7,
|
| 102 |
+
num_classes=80,
|
| 103 |
+
bbox_coder=dict(
|
| 104 |
+
type='DeltaXYWHBBoxCoder',
|
| 105 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 106 |
+
target_stds=[0.033, 0.033, 0.067, 0.067]),
|
| 107 |
+
reg_class_agnostic=False,
|
| 108 |
+
reg_decoded_bbox=True,
|
| 109 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 110 |
+
loss_cls=dict(
|
| 111 |
+
type='CrossEntropyLoss',
|
| 112 |
+
use_sigmoid=False,
|
| 113 |
+
loss_weight=1.0),
|
| 114 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0))
|
| 115 |
+
],
|
| 116 |
+
mask_roi_extractor=dict(
|
| 117 |
+
type='SingleRoIExtractor',
|
| 118 |
+
roi_layer=dict(type='RoIAlign', output_size=14, sampling_ratio=0),
|
| 119 |
+
out_channels=256,
|
| 120 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 121 |
+
mask_head=dict(
|
| 122 |
+
type='FCNMaskHead',
|
| 123 |
+
num_convs=4,
|
| 124 |
+
in_channels=256,
|
| 125 |
+
conv_out_channels=256,
|
| 126 |
+
num_classes=80,
|
| 127 |
+
loss_mask=dict(
|
| 128 |
+
type='CrossEntropyLoss', use_mask=True, loss_weight=1.0))),
|
| 129 |
+
train_cfg=dict(
|
| 130 |
+
rpn=dict(
|
| 131 |
+
assigner=dict(
|
| 132 |
+
type='MaxIoUAssigner',
|
| 133 |
+
pos_iou_thr=0.7,
|
| 134 |
+
neg_iou_thr=0.3,
|
| 135 |
+
min_pos_iou=0.3,
|
| 136 |
+
match_low_quality=True,
|
| 137 |
+
ignore_iof_thr=-1),
|
| 138 |
+
sampler=dict(
|
| 139 |
+
type='RandomSampler',
|
| 140 |
+
num=256,
|
| 141 |
+
pos_fraction=0.5,
|
| 142 |
+
neg_pos_ub=-1,
|
| 143 |
+
add_gt_as_proposals=False),
|
| 144 |
+
allowed_border=0,
|
| 145 |
+
pos_weight=-1,
|
| 146 |
+
debug=False),
|
| 147 |
+
rpn_proposal=dict(
|
| 148 |
+
nms_across_levels=False,
|
| 149 |
+
nms_pre=2000,
|
| 150 |
+
nms_post=2000,
|
| 151 |
+
max_per_img=2000,
|
| 152 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 153 |
+
min_bbox_size=0),
|
| 154 |
+
rcnn=[
|
| 155 |
+
dict(
|
| 156 |
+
assigner=dict(
|
| 157 |
+
type='MaxIoUAssigner',
|
| 158 |
+
pos_iou_thr=0.5,
|
| 159 |
+
neg_iou_thr=0.5,
|
| 160 |
+
min_pos_iou=0.5,
|
| 161 |
+
match_low_quality=False,
|
| 162 |
+
ignore_iof_thr=-1),
|
| 163 |
+
sampler=dict(
|
| 164 |
+
type='RandomSampler',
|
| 165 |
+
num=512,
|
| 166 |
+
pos_fraction=0.25,
|
| 167 |
+
neg_pos_ub=-1,
|
| 168 |
+
add_gt_as_proposals=True),
|
| 169 |
+
mask_size=28,
|
| 170 |
+
pos_weight=-1,
|
| 171 |
+
debug=False),
|
| 172 |
+
dict(
|
| 173 |
+
assigner=dict(
|
| 174 |
+
type='MaxIoUAssigner',
|
| 175 |
+
pos_iou_thr=0.6,
|
| 176 |
+
neg_iou_thr=0.6,
|
| 177 |
+
min_pos_iou=0.6,
|
| 178 |
+
match_low_quality=False,
|
| 179 |
+
ignore_iof_thr=-1),
|
| 180 |
+
sampler=dict(
|
| 181 |
+
type='RandomSampler',
|
| 182 |
+
num=512,
|
| 183 |
+
pos_fraction=0.25,
|
| 184 |
+
neg_pos_ub=-1,
|
| 185 |
+
add_gt_as_proposals=True),
|
| 186 |
+
mask_size=28,
|
| 187 |
+
pos_weight=-1,
|
| 188 |
+
debug=False),
|
| 189 |
+
dict(
|
| 190 |
+
assigner=dict(
|
| 191 |
+
type='MaxIoUAssigner',
|
| 192 |
+
pos_iou_thr=0.7,
|
| 193 |
+
neg_iou_thr=0.7,
|
| 194 |
+
min_pos_iou=0.7,
|
| 195 |
+
match_low_quality=False,
|
| 196 |
+
ignore_iof_thr=-1),
|
| 197 |
+
sampler=dict(
|
| 198 |
+
type='RandomSampler',
|
| 199 |
+
num=512,
|
| 200 |
+
pos_fraction=0.25,
|
| 201 |
+
neg_pos_ub=-1,
|
| 202 |
+
add_gt_as_proposals=True),
|
| 203 |
+
mask_size=28,
|
| 204 |
+
pos_weight=-1,
|
| 205 |
+
debug=False)
|
| 206 |
+
]),
|
| 207 |
+
test_cfg=dict(
|
| 208 |
+
rpn=dict(
|
| 209 |
+
nms_across_levels=False,
|
| 210 |
+
nms_pre=1000,
|
| 211 |
+
nms_post=1000,
|
| 212 |
+
max_per_img=1000,
|
| 213 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 214 |
+
min_bbox_size=0),
|
| 215 |
+
rcnn=dict(
|
| 216 |
+
score_thr=0.05,
|
| 217 |
+
nms=dict(type='nms', iou_threshold=0.5),
|
| 218 |
+
max_per_img=100,
|
| 219 |
+
mask_thr_binary=0.5)))
|
| 220 |
+
dataset_type = 'CocoDataset'
|
| 221 |
+
data_root = '/root/autodl-tmp/COCO2017/'
|
| 222 |
+
img_norm_cfg = dict(
|
| 223 |
+
mean=[123.675, 116.28, 103.53], std=[58.395, 57.12, 57.375], to_rgb=True)
|
| 224 |
+
train_pipeline = [
|
| 225 |
+
dict(type='LoadImageFromFile'),
|
| 226 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 227 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 228 |
+
dict(
|
| 229 |
+
type='AutoAugment',
|
| 230 |
+
policies=[[{
|
| 231 |
+
'type':
|
| 232 |
+
'Resize',
|
| 233 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333), (576, 1333),
|
| 234 |
+
(608, 1333), (640, 1333), (672, 1333), (704, 1333),
|
| 235 |
+
(736, 1333), (768, 1333), (800, 1333)],
|
| 236 |
+
'multiscale_mode':
|
| 237 |
+
'value',
|
| 238 |
+
'keep_ratio':
|
| 239 |
+
True
|
| 240 |
+
}],
|
| 241 |
+
[{
|
| 242 |
+
'type': 'Resize',
|
| 243 |
+
'img_scale': [(400, 1333), (500, 1333), (600, 1333)],
|
| 244 |
+
'multiscale_mode': 'value',
|
| 245 |
+
'keep_ratio': True
|
| 246 |
+
}, {
|
| 247 |
+
'type': 'RandomCrop',
|
| 248 |
+
'crop_type': 'absolute_range',
|
| 249 |
+
'crop_size': (384, 600),
|
| 250 |
+
'allow_negative_crop': True
|
| 251 |
+
}, {
|
| 252 |
+
'type':
|
| 253 |
+
'Resize',
|
| 254 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 255 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 256 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 257 |
+
(768, 1333), (800, 1333)],
|
| 258 |
+
'multiscale_mode':
|
| 259 |
+
'value',
|
| 260 |
+
'override':
|
| 261 |
+
True,
|
| 262 |
+
'keep_ratio':
|
| 263 |
+
True
|
| 264 |
+
}]]),
|
| 265 |
+
dict(
|
| 266 |
+
type='Normalize',
|
| 267 |
+
mean=[123.675, 116.28, 103.53],
|
| 268 |
+
std=[58.395, 57.12, 57.375],
|
| 269 |
+
to_rgb=True),
|
| 270 |
+
dict(type='Pad', size_divisor=32),
|
| 271 |
+
dict(type='DefaultFormatBundle'),
|
| 272 |
+
dict(type='Collect', keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 273 |
+
]
|
| 274 |
+
test_pipeline = [
|
| 275 |
+
dict(type='LoadImageFromFile'),
|
| 276 |
+
dict(
|
| 277 |
+
type='MultiScaleFlipAug',
|
| 278 |
+
img_scale=(1333, 800),
|
| 279 |
+
flip=False,
|
| 280 |
+
transforms=[
|
| 281 |
+
dict(type='Resize', keep_ratio=True),
|
| 282 |
+
dict(type='RandomFlip'),
|
| 283 |
+
dict(
|
| 284 |
+
type='Normalize',
|
| 285 |
+
mean=[123.675, 116.28, 103.53],
|
| 286 |
+
std=[58.395, 57.12, 57.375],
|
| 287 |
+
to_rgb=True),
|
| 288 |
+
dict(type='Pad', size_divisor=32),
|
| 289 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 290 |
+
dict(type='Collect', keys=['img'])
|
| 291 |
+
])
|
| 292 |
+
]
|
| 293 |
+
data = dict(
|
| 294 |
+
samples_per_gpu=1,
|
| 295 |
+
workers_per_gpu=4,
|
| 296 |
+
train=dict(
|
| 297 |
+
type='CocoDataset',
|
| 298 |
+
ann_file=
|
| 299 |
+
'/root/autodl-tmp/COCO2017/annotations/instances_train2017.json',
|
| 300 |
+
img_prefix='/root/autodl-tmp/COCO2017/train2017/',
|
| 301 |
+
pipeline=[
|
| 302 |
+
dict(type='LoadImageFromFile'),
|
| 303 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 304 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 305 |
+
dict(
|
| 306 |
+
type='AutoAugment',
|
| 307 |
+
policies=[[{
|
| 308 |
+
'type':
|
| 309 |
+
'Resize',
|
| 310 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 311 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 312 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 313 |
+
(768, 1333), (800, 1333)],
|
| 314 |
+
'multiscale_mode':
|
| 315 |
+
'value',
|
| 316 |
+
'keep_ratio':
|
| 317 |
+
True
|
| 318 |
+
}],
|
| 319 |
+
[{
|
| 320 |
+
'type': 'Resize',
|
| 321 |
+
'img_scale': [(400, 1333), (500, 1333),
|
| 322 |
+
(600, 1333)],
|
| 323 |
+
'multiscale_mode': 'value',
|
| 324 |
+
'keep_ratio': True
|
| 325 |
+
}, {
|
| 326 |
+
'type': 'RandomCrop',
|
| 327 |
+
'crop_type': 'absolute_range',
|
| 328 |
+
'crop_size': (384, 600),
|
| 329 |
+
'allow_negative_crop': True
|
| 330 |
+
}, {
|
| 331 |
+
'type':
|
| 332 |
+
'Resize',
|
| 333 |
+
'img_scale': [(480, 1333), (512, 1333),
|
| 334 |
+
(544, 1333), (576, 1333),
|
| 335 |
+
(608, 1333), (640, 1333),
|
| 336 |
+
(672, 1333), (704, 1333),
|
| 337 |
+
(736, 1333), (768, 1333),
|
| 338 |
+
(800, 1333)],
|
| 339 |
+
'multiscale_mode':
|
| 340 |
+
'value',
|
| 341 |
+
'override':
|
| 342 |
+
True,
|
| 343 |
+
'keep_ratio':
|
| 344 |
+
True
|
| 345 |
+
}]]),
|
| 346 |
+
dict(
|
| 347 |
+
type='Normalize',
|
| 348 |
+
mean=[123.675, 116.28, 103.53],
|
| 349 |
+
std=[58.395, 57.12, 57.375],
|
| 350 |
+
to_rgb=True),
|
| 351 |
+
dict(type='Pad', size_divisor=32),
|
| 352 |
+
dict(type='DefaultFormatBundle'),
|
| 353 |
+
dict(
|
| 354 |
+
type='Collect',
|
| 355 |
+
keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 356 |
+
]),
|
| 357 |
+
val=dict(
|
| 358 |
+
type='CocoDataset',
|
| 359 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 360 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 361 |
+
pipeline=[
|
| 362 |
+
dict(type='LoadImageFromFile'),
|
| 363 |
+
dict(
|
| 364 |
+
type='MultiScaleFlipAug',
|
| 365 |
+
img_scale=(1333, 800),
|
| 366 |
+
flip=False,
|
| 367 |
+
transforms=[
|
| 368 |
+
dict(type='Resize', keep_ratio=True),
|
| 369 |
+
dict(type='RandomFlip'),
|
| 370 |
+
dict(
|
| 371 |
+
type='Normalize',
|
| 372 |
+
mean=[123.675, 116.28, 103.53],
|
| 373 |
+
std=[58.395, 57.12, 57.375],
|
| 374 |
+
to_rgb=True),
|
| 375 |
+
dict(type='Pad', size_divisor=32),
|
| 376 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 377 |
+
dict(type='Collect', keys=['img'])
|
| 378 |
+
])
|
| 379 |
+
]),
|
| 380 |
+
test=dict(
|
| 381 |
+
type='CocoDataset',
|
| 382 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 383 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 384 |
+
pipeline=[
|
| 385 |
+
dict(type='LoadImageFromFile'),
|
| 386 |
+
dict(
|
| 387 |
+
type='MultiScaleFlipAug',
|
| 388 |
+
img_scale=(1333, 800),
|
| 389 |
+
flip=False,
|
| 390 |
+
transforms=[
|
| 391 |
+
dict(type='Resize', keep_ratio=True),
|
| 392 |
+
dict(type='RandomFlip'),
|
| 393 |
+
dict(
|
| 394 |
+
type='Normalize',
|
| 395 |
+
mean=[123.675, 116.28, 103.53],
|
| 396 |
+
std=[58.395, 57.12, 57.375],
|
| 397 |
+
to_rgb=True),
|
| 398 |
+
dict(type='Pad', size_divisor=32),
|
| 399 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 400 |
+
dict(type='Collect', keys=['img'])
|
| 401 |
+
])
|
| 402 |
+
]))
|
| 403 |
+
evaluation = dict(metric=['bbox', 'segm'], gpu_collect=True)
|
| 404 |
+
optimizer = dict(
|
| 405 |
+
type='AdamW',
|
| 406 |
+
lr=5e-05,
|
| 407 |
+
betas=(0.9, 0.999),
|
| 408 |
+
weight_decay=0.05,
|
| 409 |
+
paramwise_cfg=dict(
|
| 410 |
+
custom_keys=dict(
|
| 411 |
+
absolute_pos_embed=dict(decay_mult=0.0),
|
| 412 |
+
relative_position_bias_table=dict(decay_mult=0.0),
|
| 413 |
+
norm=dict(decay_mult=0.0))))
|
| 414 |
+
optimizer_config = dict(
|
| 415 |
+
grad_clip=None,
|
| 416 |
+
type='DistOptimizerHook',
|
| 417 |
+
update_interval=1,
|
| 418 |
+
coalesce=True,
|
| 419 |
+
bucket_size_mb=-1,
|
| 420 |
+
use_fp16=True)
|
| 421 |
+
lr_config = dict(
|
| 422 |
+
policy='step',
|
| 423 |
+
warmup='linear',
|
| 424 |
+
warmup_iters=500,
|
| 425 |
+
warmup_ratio=0.001,
|
| 426 |
+
step=[27, 33])
|
| 427 |
+
runner = dict(type='EpochBasedRunnerAmp', max_epochs=36)
|
| 428 |
+
checkpoint_config = dict(interval=1)
|
| 429 |
+
log_config = dict(interval=50, hooks=[dict(type='TextLoggerHook')])
|
| 430 |
+
custom_hooks = [dict(type='NumClassCheckHook')]
|
| 431 |
+
dist_params = dict(backend='nccl')
|
| 432 |
+
log_level = 'INFO'
|
| 433 |
+
load_from = '/root/autodl-tmp/caihaojie/mona/Swin-Transformer-Object-Detection/pretrained_model/swin_base_mona_llama_moe_distill_16.pth'
|
| 434 |
+
resume_from = None
|
| 435 |
+
workflow = [('train', 1)]
|
| 436 |
+
fp16 = None
|
| 437 |
+
work_dir = './results/train/mona_llama_moe_distill_4_16_1e-4/'
|
| 438 |
+
gpu_ids = range(0, 8)
|
mmdet/results/train/mona_llama_moe_distill_4_16_1e-4/epoch_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fc2cb92fdcb1e2431fdb251f9f7ddecc2cf3d661fd9f5a453f4adad43e31f271
|
| 3 |
+
size 2075183216
|
mmdet/results/train/mona_llama_moe_distill_4_16_1e-4/latest.pth
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
epoch_1.pth
|
mmdet/results/train/mona_moe_4_16_1e-4_balance/20250619_111115.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
mmdet/results/train/mona_moe_4_16_1e-4_balance/20250619_111115.log.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fabb30cd2bc8e09aa912a92d4d408f467bc0ca5a516da8a4698ce6a1ccc68675
|
| 3 |
+
size 160512
|
mmdet/results/train/mona_moe_4_16_1e-4_balance/cascade_mask_swin_base_3x_coco_sample_1_bs_16_mona_moe.py
ADDED
|
@@ -0,0 +1,438 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
model = dict(
|
| 2 |
+
type='CascadeRCNN_loss',
|
| 3 |
+
pretrained=None,
|
| 4 |
+
backbone=dict(
|
| 5 |
+
type='SwinTransformer_mona_moe',
|
| 6 |
+
embed_dim=128,
|
| 7 |
+
depths=[2, 2, 18, 2],
|
| 8 |
+
num_heads=[4, 8, 16, 32],
|
| 9 |
+
window_size=7,
|
| 10 |
+
mlp_ratio=4.0,
|
| 11 |
+
qkv_bias=True,
|
| 12 |
+
qk_scale=None,
|
| 13 |
+
drop_rate=0.0,
|
| 14 |
+
attn_drop_rate=0.0,
|
| 15 |
+
drop_path_rate=0.3,
|
| 16 |
+
ape=False,
|
| 17 |
+
patch_norm=True,
|
| 18 |
+
out_indices=(0, 1, 2, 3),
|
| 19 |
+
use_checkpoint=False),
|
| 20 |
+
neck=dict(
|
| 21 |
+
type='FPN',
|
| 22 |
+
in_channels=[128, 256, 512, 1024],
|
| 23 |
+
out_channels=256,
|
| 24 |
+
num_outs=5),
|
| 25 |
+
rpn_head=dict(
|
| 26 |
+
type='RPNHead',
|
| 27 |
+
in_channels=256,
|
| 28 |
+
feat_channels=256,
|
| 29 |
+
anchor_generator=dict(
|
| 30 |
+
type='AnchorGenerator',
|
| 31 |
+
scales=[8],
|
| 32 |
+
ratios=[0.5, 1.0, 2.0],
|
| 33 |
+
strides=[4, 8, 16, 32, 64]),
|
| 34 |
+
bbox_coder=dict(
|
| 35 |
+
type='DeltaXYWHBBoxCoder',
|
| 36 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 37 |
+
target_stds=[1.0, 1.0, 1.0, 1.0]),
|
| 38 |
+
loss_cls=dict(
|
| 39 |
+
type='CrossEntropyLoss', use_sigmoid=True, loss_weight=1.0),
|
| 40 |
+
loss_bbox=dict(
|
| 41 |
+
type='SmoothL1Loss', beta=0.1111111111111111, loss_weight=1.0)),
|
| 42 |
+
roi_head=dict(
|
| 43 |
+
type='CascadeRoIHead',
|
| 44 |
+
num_stages=3,
|
| 45 |
+
stage_loss_weights=[1, 0.5, 0.25],
|
| 46 |
+
bbox_roi_extractor=dict(
|
| 47 |
+
type='SingleRoIExtractor',
|
| 48 |
+
roi_layer=dict(type='RoIAlign', output_size=7, sampling_ratio=0),
|
| 49 |
+
out_channels=256,
|
| 50 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 51 |
+
bbox_head=[
|
| 52 |
+
dict(
|
| 53 |
+
type='ConvFCBBoxHead',
|
| 54 |
+
num_shared_convs=4,
|
| 55 |
+
num_shared_fcs=1,
|
| 56 |
+
in_channels=256,
|
| 57 |
+
conv_out_channels=256,
|
| 58 |
+
fc_out_channels=1024,
|
| 59 |
+
roi_feat_size=7,
|
| 60 |
+
num_classes=80,
|
| 61 |
+
bbox_coder=dict(
|
| 62 |
+
type='DeltaXYWHBBoxCoder',
|
| 63 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 64 |
+
target_stds=[0.1, 0.1, 0.2, 0.2]),
|
| 65 |
+
reg_class_agnostic=False,
|
| 66 |
+
reg_decoded_bbox=True,
|
| 67 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 68 |
+
loss_cls=dict(
|
| 69 |
+
type='CrossEntropyLoss',
|
| 70 |
+
use_sigmoid=False,
|
| 71 |
+
loss_weight=1.0),
|
| 72 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 73 |
+
dict(
|
| 74 |
+
type='ConvFCBBoxHead',
|
| 75 |
+
num_shared_convs=4,
|
| 76 |
+
num_shared_fcs=1,
|
| 77 |
+
in_channels=256,
|
| 78 |
+
conv_out_channels=256,
|
| 79 |
+
fc_out_channels=1024,
|
| 80 |
+
roi_feat_size=7,
|
| 81 |
+
num_classes=80,
|
| 82 |
+
bbox_coder=dict(
|
| 83 |
+
type='DeltaXYWHBBoxCoder',
|
| 84 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 85 |
+
target_stds=[0.05, 0.05, 0.1, 0.1]),
|
| 86 |
+
reg_class_agnostic=False,
|
| 87 |
+
reg_decoded_bbox=True,
|
| 88 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 89 |
+
loss_cls=dict(
|
| 90 |
+
type='CrossEntropyLoss',
|
| 91 |
+
use_sigmoid=False,
|
| 92 |
+
loss_weight=1.0),
|
| 93 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0)),
|
| 94 |
+
dict(
|
| 95 |
+
type='ConvFCBBoxHead',
|
| 96 |
+
num_shared_convs=4,
|
| 97 |
+
num_shared_fcs=1,
|
| 98 |
+
in_channels=256,
|
| 99 |
+
conv_out_channels=256,
|
| 100 |
+
fc_out_channels=1024,
|
| 101 |
+
roi_feat_size=7,
|
| 102 |
+
num_classes=80,
|
| 103 |
+
bbox_coder=dict(
|
| 104 |
+
type='DeltaXYWHBBoxCoder',
|
| 105 |
+
target_means=[0.0, 0.0, 0.0, 0.0],
|
| 106 |
+
target_stds=[0.033, 0.033, 0.067, 0.067]),
|
| 107 |
+
reg_class_agnostic=False,
|
| 108 |
+
reg_decoded_bbox=True,
|
| 109 |
+
norm_cfg=dict(type='SyncBN', requires_grad=True),
|
| 110 |
+
loss_cls=dict(
|
| 111 |
+
type='CrossEntropyLoss',
|
| 112 |
+
use_sigmoid=False,
|
| 113 |
+
loss_weight=1.0),
|
| 114 |
+
loss_bbox=dict(type='GIoULoss', loss_weight=10.0))
|
| 115 |
+
],
|
| 116 |
+
mask_roi_extractor=dict(
|
| 117 |
+
type='SingleRoIExtractor',
|
| 118 |
+
roi_layer=dict(type='RoIAlign', output_size=14, sampling_ratio=0),
|
| 119 |
+
out_channels=256,
|
| 120 |
+
featmap_strides=[4, 8, 16, 32]),
|
| 121 |
+
mask_head=dict(
|
| 122 |
+
type='FCNMaskHead',
|
| 123 |
+
num_convs=4,
|
| 124 |
+
in_channels=256,
|
| 125 |
+
conv_out_channels=256,
|
| 126 |
+
num_classes=80,
|
| 127 |
+
loss_mask=dict(
|
| 128 |
+
type='CrossEntropyLoss', use_mask=True, loss_weight=1.0))),
|
| 129 |
+
train_cfg=dict(
|
| 130 |
+
rpn=dict(
|
| 131 |
+
assigner=dict(
|
| 132 |
+
type='MaxIoUAssigner',
|
| 133 |
+
pos_iou_thr=0.7,
|
| 134 |
+
neg_iou_thr=0.3,
|
| 135 |
+
min_pos_iou=0.3,
|
| 136 |
+
match_low_quality=True,
|
| 137 |
+
ignore_iof_thr=-1),
|
| 138 |
+
sampler=dict(
|
| 139 |
+
type='RandomSampler',
|
| 140 |
+
num=256,
|
| 141 |
+
pos_fraction=0.5,
|
| 142 |
+
neg_pos_ub=-1,
|
| 143 |
+
add_gt_as_proposals=False),
|
| 144 |
+
allowed_border=0,
|
| 145 |
+
pos_weight=-1,
|
| 146 |
+
debug=False),
|
| 147 |
+
rpn_proposal=dict(
|
| 148 |
+
nms_across_levels=False,
|
| 149 |
+
nms_pre=2000,
|
| 150 |
+
nms_post=2000,
|
| 151 |
+
max_per_img=2000,
|
| 152 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 153 |
+
min_bbox_size=0),
|
| 154 |
+
rcnn=[
|
| 155 |
+
dict(
|
| 156 |
+
assigner=dict(
|
| 157 |
+
type='MaxIoUAssigner',
|
| 158 |
+
pos_iou_thr=0.5,
|
| 159 |
+
neg_iou_thr=0.5,
|
| 160 |
+
min_pos_iou=0.5,
|
| 161 |
+
match_low_quality=False,
|
| 162 |
+
ignore_iof_thr=-1),
|
| 163 |
+
sampler=dict(
|
| 164 |
+
type='RandomSampler',
|
| 165 |
+
num=512,
|
| 166 |
+
pos_fraction=0.25,
|
| 167 |
+
neg_pos_ub=-1,
|
| 168 |
+
add_gt_as_proposals=True),
|
| 169 |
+
mask_size=28,
|
| 170 |
+
pos_weight=-1,
|
| 171 |
+
debug=False),
|
| 172 |
+
dict(
|
| 173 |
+
assigner=dict(
|
| 174 |
+
type='MaxIoUAssigner',
|
| 175 |
+
pos_iou_thr=0.6,
|
| 176 |
+
neg_iou_thr=0.6,
|
| 177 |
+
min_pos_iou=0.6,
|
| 178 |
+
match_low_quality=False,
|
| 179 |
+
ignore_iof_thr=-1),
|
| 180 |
+
sampler=dict(
|
| 181 |
+
type='RandomSampler',
|
| 182 |
+
num=512,
|
| 183 |
+
pos_fraction=0.25,
|
| 184 |
+
neg_pos_ub=-1,
|
| 185 |
+
add_gt_as_proposals=True),
|
| 186 |
+
mask_size=28,
|
| 187 |
+
pos_weight=-1,
|
| 188 |
+
debug=False),
|
| 189 |
+
dict(
|
| 190 |
+
assigner=dict(
|
| 191 |
+
type='MaxIoUAssigner',
|
| 192 |
+
pos_iou_thr=0.7,
|
| 193 |
+
neg_iou_thr=0.7,
|
| 194 |
+
min_pos_iou=0.7,
|
| 195 |
+
match_low_quality=False,
|
| 196 |
+
ignore_iof_thr=-1),
|
| 197 |
+
sampler=dict(
|
| 198 |
+
type='RandomSampler',
|
| 199 |
+
num=512,
|
| 200 |
+
pos_fraction=0.25,
|
| 201 |
+
neg_pos_ub=-1,
|
| 202 |
+
add_gt_as_proposals=True),
|
| 203 |
+
mask_size=28,
|
| 204 |
+
pos_weight=-1,
|
| 205 |
+
debug=False)
|
| 206 |
+
]),
|
| 207 |
+
test_cfg=dict(
|
| 208 |
+
rpn=dict(
|
| 209 |
+
nms_across_levels=False,
|
| 210 |
+
nms_pre=1000,
|
| 211 |
+
nms_post=1000,
|
| 212 |
+
max_per_img=1000,
|
| 213 |
+
nms=dict(type='nms', iou_threshold=0.7),
|
| 214 |
+
min_bbox_size=0),
|
| 215 |
+
rcnn=dict(
|
| 216 |
+
score_thr=0.05,
|
| 217 |
+
nms=dict(type='nms', iou_threshold=0.5),
|
| 218 |
+
max_per_img=100,
|
| 219 |
+
mask_thr_binary=0.5)))
|
| 220 |
+
dataset_type = 'CocoDataset'
|
| 221 |
+
data_root = '/root/autodl-tmp/COCO2017/'
|
| 222 |
+
img_norm_cfg = dict(
|
| 223 |
+
mean=[123.675, 116.28, 103.53], std=[58.395, 57.12, 57.375], to_rgb=True)
|
| 224 |
+
train_pipeline = [
|
| 225 |
+
dict(type='LoadImageFromFile'),
|
| 226 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 227 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 228 |
+
dict(
|
| 229 |
+
type='AutoAugment',
|
| 230 |
+
policies=[[{
|
| 231 |
+
'type':
|
| 232 |
+
'Resize',
|
| 233 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333), (576, 1333),
|
| 234 |
+
(608, 1333), (640, 1333), (672, 1333), (704, 1333),
|
| 235 |
+
(736, 1333), (768, 1333), (800, 1333)],
|
| 236 |
+
'multiscale_mode':
|
| 237 |
+
'value',
|
| 238 |
+
'keep_ratio':
|
| 239 |
+
True
|
| 240 |
+
}],
|
| 241 |
+
[{
|
| 242 |
+
'type': 'Resize',
|
| 243 |
+
'img_scale': [(400, 1333), (500, 1333), (600, 1333)],
|
| 244 |
+
'multiscale_mode': 'value',
|
| 245 |
+
'keep_ratio': True
|
| 246 |
+
}, {
|
| 247 |
+
'type': 'RandomCrop',
|
| 248 |
+
'crop_type': 'absolute_range',
|
| 249 |
+
'crop_size': (384, 600),
|
| 250 |
+
'allow_negative_crop': True
|
| 251 |
+
}, {
|
| 252 |
+
'type':
|
| 253 |
+
'Resize',
|
| 254 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 255 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 256 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 257 |
+
(768, 1333), (800, 1333)],
|
| 258 |
+
'multiscale_mode':
|
| 259 |
+
'value',
|
| 260 |
+
'override':
|
| 261 |
+
True,
|
| 262 |
+
'keep_ratio':
|
| 263 |
+
True
|
| 264 |
+
}]]),
|
| 265 |
+
dict(
|
| 266 |
+
type='Normalize',
|
| 267 |
+
mean=[123.675, 116.28, 103.53],
|
| 268 |
+
std=[58.395, 57.12, 57.375],
|
| 269 |
+
to_rgb=True),
|
| 270 |
+
dict(type='Pad', size_divisor=32),
|
| 271 |
+
dict(type='DefaultFormatBundle'),
|
| 272 |
+
dict(type='Collect', keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 273 |
+
]
|
| 274 |
+
test_pipeline = [
|
| 275 |
+
dict(type='LoadImageFromFile'),
|
| 276 |
+
dict(
|
| 277 |
+
type='MultiScaleFlipAug',
|
| 278 |
+
img_scale=(1333, 800),
|
| 279 |
+
flip=False,
|
| 280 |
+
transforms=[
|
| 281 |
+
dict(type='Resize', keep_ratio=True),
|
| 282 |
+
dict(type='RandomFlip'),
|
| 283 |
+
dict(
|
| 284 |
+
type='Normalize',
|
| 285 |
+
mean=[123.675, 116.28, 103.53],
|
| 286 |
+
std=[58.395, 57.12, 57.375],
|
| 287 |
+
to_rgb=True),
|
| 288 |
+
dict(type='Pad', size_divisor=32),
|
| 289 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 290 |
+
dict(type='Collect', keys=['img'])
|
| 291 |
+
])
|
| 292 |
+
]
|
| 293 |
+
data = dict(
|
| 294 |
+
samples_per_gpu=2,
|
| 295 |
+
workers_per_gpu=4,
|
| 296 |
+
train=dict(
|
| 297 |
+
type='CocoDataset',
|
| 298 |
+
ann_file=
|
| 299 |
+
'/root/autodl-tmp/COCO2017/annotations/instances_train2017.json',
|
| 300 |
+
img_prefix='/root/autodl-tmp/COCO2017/train2017/',
|
| 301 |
+
pipeline=[
|
| 302 |
+
dict(type='LoadImageFromFile'),
|
| 303 |
+
dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
|
| 304 |
+
dict(type='RandomFlip', flip_ratio=0.5),
|
| 305 |
+
dict(
|
| 306 |
+
type='AutoAugment',
|
| 307 |
+
policies=[[{
|
| 308 |
+
'type':
|
| 309 |
+
'Resize',
|
| 310 |
+
'img_scale': [(480, 1333), (512, 1333), (544, 1333),
|
| 311 |
+
(576, 1333), (608, 1333), (640, 1333),
|
| 312 |
+
(672, 1333), (704, 1333), (736, 1333),
|
| 313 |
+
(768, 1333), (800, 1333)],
|
| 314 |
+
'multiscale_mode':
|
| 315 |
+
'value',
|
| 316 |
+
'keep_ratio':
|
| 317 |
+
True
|
| 318 |
+
}],
|
| 319 |
+
[{
|
| 320 |
+
'type': 'Resize',
|
| 321 |
+
'img_scale': [(400, 1333), (500, 1333),
|
| 322 |
+
(600, 1333)],
|
| 323 |
+
'multiscale_mode': 'value',
|
| 324 |
+
'keep_ratio': True
|
| 325 |
+
}, {
|
| 326 |
+
'type': 'RandomCrop',
|
| 327 |
+
'crop_type': 'absolute_range',
|
| 328 |
+
'crop_size': (384, 600),
|
| 329 |
+
'allow_negative_crop': True
|
| 330 |
+
}, {
|
| 331 |
+
'type':
|
| 332 |
+
'Resize',
|
| 333 |
+
'img_scale': [(480, 1333), (512, 1333),
|
| 334 |
+
(544, 1333), (576, 1333),
|
| 335 |
+
(608, 1333), (640, 1333),
|
| 336 |
+
(672, 1333), (704, 1333),
|
| 337 |
+
(736, 1333), (768, 1333),
|
| 338 |
+
(800, 1333)],
|
| 339 |
+
'multiscale_mode':
|
| 340 |
+
'value',
|
| 341 |
+
'override':
|
| 342 |
+
True,
|
| 343 |
+
'keep_ratio':
|
| 344 |
+
True
|
| 345 |
+
}]]),
|
| 346 |
+
dict(
|
| 347 |
+
type='Normalize',
|
| 348 |
+
mean=[123.675, 116.28, 103.53],
|
| 349 |
+
std=[58.395, 57.12, 57.375],
|
| 350 |
+
to_rgb=True),
|
| 351 |
+
dict(type='Pad', size_divisor=32),
|
| 352 |
+
dict(type='DefaultFormatBundle'),
|
| 353 |
+
dict(
|
| 354 |
+
type='Collect',
|
| 355 |
+
keys=['img', 'gt_bboxes', 'gt_labels', 'gt_masks'])
|
| 356 |
+
]),
|
| 357 |
+
val=dict(
|
| 358 |
+
type='CocoDataset',
|
| 359 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 360 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 361 |
+
pipeline=[
|
| 362 |
+
dict(type='LoadImageFromFile'),
|
| 363 |
+
dict(
|
| 364 |
+
type='MultiScaleFlipAug',
|
| 365 |
+
img_scale=(1333, 800),
|
| 366 |
+
flip=False,
|
| 367 |
+
transforms=[
|
| 368 |
+
dict(type='Resize', keep_ratio=True),
|
| 369 |
+
dict(type='RandomFlip'),
|
| 370 |
+
dict(
|
| 371 |
+
type='Normalize',
|
| 372 |
+
mean=[123.675, 116.28, 103.53],
|
| 373 |
+
std=[58.395, 57.12, 57.375],
|
| 374 |
+
to_rgb=True),
|
| 375 |
+
dict(type='Pad', size_divisor=32),
|
| 376 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 377 |
+
dict(type='Collect', keys=['img'])
|
| 378 |
+
])
|
| 379 |
+
]),
|
| 380 |
+
test=dict(
|
| 381 |
+
type='CocoDataset',
|
| 382 |
+
ann_file='/root/autodl-tmp/COCO2017/annotations/instances_val2017.json',
|
| 383 |
+
img_prefix='/root/autodl-tmp/COCO2017/val2017/',
|
| 384 |
+
pipeline=[
|
| 385 |
+
dict(type='LoadImageFromFile'),
|
| 386 |
+
dict(
|
| 387 |
+
type='MultiScaleFlipAug',
|
| 388 |
+
img_scale=(1333, 800),
|
| 389 |
+
flip=False,
|
| 390 |
+
transforms=[
|
| 391 |
+
dict(type='Resize', keep_ratio=True),
|
| 392 |
+
dict(type='RandomFlip'),
|
| 393 |
+
dict(
|
| 394 |
+
type='Normalize',
|
| 395 |
+
mean=[123.675, 116.28, 103.53],
|
| 396 |
+
std=[58.395, 57.12, 57.375],
|
| 397 |
+
to_rgb=True),
|
| 398 |
+
dict(type='Pad', size_divisor=32),
|
| 399 |
+
dict(type='ImageToTensor', keys=['img']),
|
| 400 |
+
dict(type='Collect', keys=['img'])
|
| 401 |
+
])
|
| 402 |
+
]))
|
| 403 |
+
evaluation = dict(metric=['bbox', 'segm'], gpu_collect=True)
|
| 404 |
+
optimizer = dict(
|
| 405 |
+
type='AdamW',
|
| 406 |
+
lr=0.0001,
|
| 407 |
+
betas=(0.9, 0.999),
|
| 408 |
+
weight_decay=0.05,
|
| 409 |
+
paramwise_cfg=dict(
|
| 410 |
+
custom_keys=dict(
|
| 411 |
+
absolute_pos_embed=dict(decay_mult=0.0),
|
| 412 |
+
relative_position_bias_table=dict(decay_mult=0.0),
|
| 413 |
+
norm=dict(decay_mult=0.0))))
|
| 414 |
+
optimizer_config = dict(
|
| 415 |
+
grad_clip=None,
|
| 416 |
+
type='DistOptimizerHook',
|
| 417 |
+
update_interval=1,
|
| 418 |
+
coalesce=True,
|
| 419 |
+
bucket_size_mb=-1,
|
| 420 |
+
use_fp16=True)
|
| 421 |
+
lr_config = dict(
|
| 422 |
+
policy='step',
|
| 423 |
+
warmup='linear',
|
| 424 |
+
warmup_iters=500,
|
| 425 |
+
warmup_ratio=0.001,
|
| 426 |
+
step=[27, 33])
|
| 427 |
+
runner = dict(type='EpochBasedRunnerAmp', max_epochs=36)
|
| 428 |
+
checkpoint_config = dict(interval=1)
|
| 429 |
+
log_config = dict(interval=50, hooks=[dict(type='TextLoggerHook')])
|
| 430 |
+
custom_hooks = [dict(type='NumClassCheckHook')]
|
| 431 |
+
dist_params = dict(backend='nccl')
|
| 432 |
+
log_level = 'INFO'
|
| 433 |
+
load_from = '/root/autodl-tmp/caihaojie/mona/Swin-Transformer-Object-Detection/pretrained_model/swin_base_mona_moe_16.pth'
|
| 434 |
+
resume_from = None
|
| 435 |
+
workflow = [('train', 1)]
|
| 436 |
+
fp16 = None
|
| 437 |
+
work_dir = './results/train/mona_moe_4_16_1e-4_balance/'
|
| 438 |
+
gpu_ids = range(0, 8)
|
mmdet/results/train/mona_moe_4_16_1e-4_balance/epoch_1.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa684495d3d42db79db33c0fa006545da2fddb8817b463aba4dbba7ad76cf616
|
| 3 |
+
size 1517228592
|
mmdet/{checkpoints/swin_base_mona_moe_4_16_epoch_4.pth → results/train/mona_moe_4_16_1e-4_balance/epoch_2.pth}
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1517228720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1a24272473556393087e0bf9c8a39fc192cc0c64e589091613221391826ec6c4
|
| 3 |
size 1517228720
|
mmdet/results/train/mona_moe_4_16_1e-4_balance/latest.pth
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
epoch_2.pth
|
mmdet/results/train/mona_moe_4_16_1e-4_gate/20250618_110426.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
mmdet/results/train/mona_moe_4_16_1e-4_gate/20250618_110426.log.json
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14eb75b182e65d6da64bd2a44f1d6d959815bdfc7e58297910472c65c0612cdb
|
| 3 |
+
size 187274
|