Chikap421 committed on
Commit
597a85a
·
verified ·
1 Parent(s): de7c24f

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. experiment/thermal_run1/checkpoints/checkpoint.pt +3 -0
  2. experiment/thermal_run1/checkpoints/checkpoint_1.pt +3 -0
  3. experiment/thermal_run1/checkpoints/checkpoint_10.pt +3 -0
  4. experiment/thermal_run1/checkpoints/checkpoint_11.pt +3 -0
  5. experiment/thermal_run1/checkpoints/checkpoint_12.pt +3 -0
  6. experiment/thermal_run1/checkpoints/checkpoint_13.pt +3 -0
  7. experiment/thermal_run1/checkpoints/checkpoint_14.pt +3 -0
  8. experiment/thermal_run1/checkpoints/checkpoint_15.pt +3 -0
  9. experiment/thermal_run1/checkpoints/checkpoint_16.pt +3 -0
  10. experiment/thermal_run1/checkpoints/checkpoint_17.pt +3 -0
  11. experiment/thermal_run1/checkpoints/checkpoint_18.pt +3 -0
  12. experiment/thermal_run1/checkpoints/checkpoint_19.pt +3 -0
  13. experiment/thermal_run1/checkpoints/checkpoint_2.pt +3 -0
  14. experiment/thermal_run1/checkpoints/checkpoint_20.pt +3 -0
  15. experiment/thermal_run1/checkpoints/checkpoint_21.pt +3 -0
  16. experiment/thermal_run1/checkpoints/checkpoint_22.pt +3 -0
  17. experiment/thermal_run1/checkpoints/checkpoint_23.pt +3 -0
  18. experiment/thermal_run1/checkpoints/checkpoint_24.pt +3 -0
  19. experiment/thermal_run1/checkpoints/checkpoint_25.pt +3 -0
  20. experiment/thermal_run1/checkpoints/checkpoint_26.pt +3 -0
  21. experiment/thermal_run1/checkpoints/checkpoint_27.pt +3 -0
  22. experiment/thermal_run1/checkpoints/checkpoint_28.pt +3 -0
  23. experiment/thermal_run1/checkpoints/checkpoint_29.pt +3 -0
  24. experiment/thermal_run1/checkpoints/checkpoint_3.pt +3 -0
  25. experiment/thermal_run1/checkpoints/checkpoint_30.pt +3 -0
  26. experiment/thermal_run1/checkpoints/checkpoint_31.pt +3 -0
  27. experiment/thermal_run1/checkpoints/checkpoint_32.pt +3 -0
  28. experiment/thermal_run1/checkpoints/checkpoint_33.pt +3 -0
  29. experiment/thermal_run1/checkpoints/checkpoint_34.pt +3 -0
  30. experiment/thermal_run1/checkpoints/checkpoint_35.pt +3 -0
  31. experiment/thermal_run1/checkpoints/checkpoint_36.pt +3 -0
  32. experiment/thermal_run1/checkpoints/checkpoint_37.pt +3 -0
  33. experiment/thermal_run1/checkpoints/checkpoint_38.pt +3 -0
  34. experiment/thermal_run1/checkpoints/checkpoint_39.pt +3 -0
  35. experiment/thermal_run1/checkpoints/checkpoint_4.pt +3 -0
  36. experiment/thermal_run1/checkpoints/checkpoint_40.pt +3 -0
  37. experiment/thermal_run1/checkpoints/checkpoint_5.pt +3 -0
  38. experiment/thermal_run1/checkpoints/checkpoint_6.pt +3 -0
  39. experiment/thermal_run1/checkpoints/checkpoint_7.pt +3 -0
  40. experiment/thermal_run1/checkpoints/checkpoint_8.pt +3 -0
  41. experiment/thermal_run1/checkpoints/checkpoint_9.pt +3 -0
  42. experiment/thermal_run1/config.yaml +313 -0
  43. experiment/thermal_run1/config_resolved.yaml +351 -0
  44. experiment/thermal_run1/logs/best_stats.json +40 -0
  45. experiment/thermal_run1/logs/log.txt +732 -0
  46. experiment/thermal_run1/logs/train_stats.json +40 -0
  47. experiment/thermal_run1/tensorboard/events.out.tfevents.1759750510.gpub060.delta.ncsa.illinois.edu.921762.0c94822e4-1523-4465-a797-8a6fd58b2af0 +3 -0
  48. sam2.1_hiera_base_plus.pt +3 -0
  49. sam2.1_hiera_large.pt +3 -0
  50. sam2.1_hiera_small.pt +3 -0
experiment/thermal_run1/checkpoints/checkpoint.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a08cacd09cd24a7afa1704b1b728229b0c2d26f85b8b8bc71c4c938816f3cddd
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_1.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8be8e0e9be5d1bd7f16e7bdd5dde033a23e380a7f8f35b605db755ee6fe6c935
3
+ size 910662430
experiment/thermal_run1/checkpoints/checkpoint_10.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf4aed853f9a17594becbb8e5be9083aede7dee0f1a8a925bdaf5fea34556113
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_11.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e988c851be054f9c9358b0e7898962705ec7dbf66b9c6b6ecd17eee53d2e7ef7
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_12.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:741638750ae87f08f11310a62b6629b0621742e260e2379b39568f2d450c26c6
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_13.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7127b6697fdc6af359133b1f581f8e02bc991bdc208de84dffc1ef5fb71a43f0
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_14.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65557d72abed4de1571980f2a8a1f209479bead51c8586e347ff5414c2983689
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_15.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:154609c3c910e5328c62ddb7a7a69cffb8ac3c808558296192852c1abcce1211
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_16.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28a5f59da4849fa333917f55c52b1b6a25d7b4732d6714fb5c8c066d93a03ab1
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_17.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97b9f700b06a797f06049f86294bffb405fc2bdba2249bf2ab34e5f836a6ab4a
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_18.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e90e450f66a8181bead198544fd60de5f37e40d474a402b6cafa3c10dd923725
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_19.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18141f1ba0926e7e3f013313f04d7ea6d7e925a46c0e1b9b83f5dd2aa11dfaaa
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_2.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ce4f830aea93cf1923ba745483ea278063876bc4427650d095a8bf2e397d035
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_20.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5723da2d8804c7bc5e6c52ae85faa90fc81e6eaa5c8aa7ccf82fc15dba07581b
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_21.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a16f8b06bdc8d228f1b465aede71197ad4a3e33eba292550bc94b3025c47f96d
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_22.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8913122ef939840271327177ddbee90bec6ccd1d4598030d479117dd4676139b
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_23.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c897512fbc9533c6ae0171af2f735cc6618e9f2af5c69d761c26123efe82f158
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_24.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c4e754eee30de9285b3e59c6b953eae6423d0d0938139b3ba29f1a76aee04a5
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_25.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a58e92dd643fc840ac89e729580cb3caa78f6747725bae72a602934c07d64af6
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_26.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94d51b6043964ee7ff657ecb0d3aa3fc811ce72806141469982ec46eefcbcd54
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_27.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:deb0f245104633753716ceebdd899ef41b62dea134e50815b3d2fdc2bd83a30f
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_28.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5615b19809b17430a340ea91456ea928010b3fe40c0ae599d51d09e3d4ed7e7e
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_29.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9c1198b55bb8a39cb9d5adf80306a9a79508b541e48252a2ed1a3e6263d0566
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_3.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab49e18e7cf1dbb6bcda0c8769cb1f7c29be04e1db72552a9ac12cb1eb502fe6
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_30.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:121f13583903cc30bc200fa77eacb0c0d0cec5302d9612055b046e0b1f787fe8
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_31.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b87ed7ead47522fe96481d9f140aa56365b5633a00cd4ff28473d03aa366a3e
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_32.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c972da36a8eb74204a8c2aaa24dbf108ba470e94e1996e2925d2ed78fd83115
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_33.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:559dcdb27c480d5a437fc1495ff01756822150051ea82364a6b3ad9b2bd4194a
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_34.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fe3db97948547e415a25243ba68263b26a51ac0266cf8ba5cbbbcbdcf78cc88
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_35.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:535c531bfefc6ca4cd50d387f961b303232a3c2fa218399ab5e77ac7328355ae
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_36.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6296c062a7b607dd86dc000b9857bee0eb04cc3362922652818f16b45e2d866d
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_37.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0e196e40a20f07a7356a4cde873430988e4131e587a65ad7883977e611302fa
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_38.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5370354b5e917526695cb893303d3b2ff55ed11ff4c7a395c8c5c49da4bfc1ee
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_39.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ab630fa6bd6535ee263f5aa584281f268b9ece7d5501e8564bba7696fac07f1
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_4.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4173e21af1808616ece284564e2d8ba44ade31ccec5ecb457b46d172bc2e6d73
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_40.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a08cacd09cd24a7afa1704b1b728229b0c2d26f85b8b8bc71c4c938816f3cddd
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_5.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2cda5c769cdb24325396bf8fa9601a1adc277ffdeb9a4bc2ae4ca2c8a92e879d
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_6.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a772cd7044f36d52d9a96ea314f7a09590f85f42d2c3534d86ae0f8ddc2ffa3d
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_7.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53ebacbd40cf8a0855fbdedb7f9795d80f169f18ae02aa2b146a065c521d8a97
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_8.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c24089637368598c6ae5302fbf61c1ef46994a950cbd4c5f3c114a82e925f6a1
3
+ size 910662494
experiment/thermal_run1/checkpoints/checkpoint_9.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e2f521f3db0b6438a03e61df33d1339ca910a8c89f9a8fe222b1481bb5a8a384
3
+ size 910662494
experiment/thermal_run1/config.yaml ADDED
@@ -0,0 +1,313 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ scratch:
2
+ resolution: 1024
3
+ train_batch_size: 1
4
+ num_train_workers: 10
5
+ num_frames: 1
6
+ max_num_objects: 3
7
+ base_lr: 5.0e-06
8
+ vision_lr: 3.0e-06
9
+ phases_per_epoch: 1
10
+ num_epochs: 40
11
+ dataset:
12
+ img_folder: /work/nvme/bfgd/cmaduabuchi/DATA/thermal_video/thriveseg/train/images
13
+ gt_folder: /work/nvme/bfgd/cmaduabuchi/DATA/thermal_video/thriveseg/train/masks
14
+ file_list_txt: null
15
+ multiplier: 2
16
+ vos:
17
+ train_transforms:
18
+ - _target_: training.dataset.transforms.ComposeAPI
19
+ transforms:
20
+ - _target_: training.dataset.transforms.RandomHorizontalFlip
21
+ consistent_transform: true
22
+ - _target_: training.dataset.transforms.RandomAffine
23
+ degrees: 25
24
+ shear: 20
25
+ image_interpolation: bilinear
26
+ consistent_transform: true
27
+ - _target_: training.dataset.transforms.RandomResizeAPI
28
+ sizes: ${scratch.resolution}
29
+ square: true
30
+ consistent_transform: true
31
+ - _target_: training.dataset.transforms.ColorJitter
32
+ consistent_transform: true
33
+ brightness: 0.1
34
+ contrast: 0.03
35
+ saturation: 0.03
36
+ hue: null
37
+ - _target_: training.dataset.transforms.RandomGrayscale
38
+ p: 0.05
39
+ consistent_transform: true
40
+ - _target_: training.dataset.transforms.ColorJitter
41
+ consistent_transform: false
42
+ brightness: 0.1
43
+ contrast: 0.05
44
+ saturation: 0.05
45
+ hue: null
46
+ - _target_: training.dataset.transforms.ToTensorAPI
47
+ - _target_: training.dataset.transforms.NormalizeAPI
48
+ mean:
49
+ - 0.485
50
+ - 0.456
51
+ - 0.406
52
+ std:
53
+ - 0.229
54
+ - 0.224
55
+ - 0.225
56
+ trainer:
57
+ _target_: training.trainer.Trainer
58
+ mode: train_only
59
+ max_epochs: ${times:${scratch.num_epochs},${scratch.phases_per_epoch}}
60
+ accelerator: cuda
61
+ seed_value: 123
62
+ model:
63
+ _target_: training.model.sam2.SAM2Train
64
+ image_encoder:
65
+ _target_: sam2.modeling.backbones.image_encoder.ImageEncoder
66
+ scalp: 1
67
+ trunk:
68
+ _target_: sam2.modeling.backbones.hieradet.Hiera
69
+ embed_dim: 112
70
+ num_heads: 2
71
+ drop_path_rate: 0.1
72
+ neck:
73
+ _target_: sam2.modeling.backbones.image_encoder.FpnNeck
74
+ position_encoding:
75
+ _target_: sam2.modeling.position_encoding.PositionEmbeddingSine
76
+ num_pos_feats: 256
77
+ normalize: true
78
+ scale: null
79
+ temperature: 10000
80
+ d_model: 256
81
+ backbone_channel_list:
82
+ - 896
83
+ - 448
84
+ - 224
85
+ - 112
86
+ fpn_top_down_levels:
87
+ - 2
88
+ - 3
89
+ fpn_interp_model: nearest
90
+ memory_attention:
91
+ _target_: sam2.modeling.memory_attention.MemoryAttention
92
+ d_model: 256
93
+ pos_enc_at_input: true
94
+ layer:
95
+ _target_: sam2.modeling.memory_attention.MemoryAttentionLayer
96
+ activation: relu
97
+ dim_feedforward: 2048
98
+ dropout: 0.1
99
+ pos_enc_at_attn: false
100
+ self_attention:
101
+ _target_: sam2.modeling.sam.transformer.RoPEAttention
102
+ rope_theta: 10000.0
103
+ feat_sizes:
104
+ - 64
105
+ - 64
106
+ embedding_dim: 256
107
+ num_heads: 1
108
+ downsample_rate: 1
109
+ dropout: 0.1
110
+ d_model: 256
111
+ pos_enc_at_cross_attn_keys: true
112
+ pos_enc_at_cross_attn_queries: false
113
+ cross_attention:
114
+ _target_: sam2.modeling.sam.transformer.RoPEAttention
115
+ rope_theta: 10000.0
116
+ feat_sizes:
117
+ - 64
118
+ - 64
119
+ rope_k_repeat: true
120
+ embedding_dim: 256
121
+ num_heads: 1
122
+ downsample_rate: 1
123
+ dropout: 0.1
124
+ kv_in_dim: 64
125
+ num_layers: 4
126
+ memory_encoder:
127
+ _target_: sam2.modeling.memory_encoder.MemoryEncoder
128
+ out_dim: 64
129
+ position_encoding:
130
+ _target_: sam2.modeling.position_encoding.PositionEmbeddingSine
131
+ num_pos_feats: 64
132
+ normalize: true
133
+ scale: null
134
+ temperature: 10000
135
+ mask_downsampler:
136
+ _target_: sam2.modeling.memory_encoder.MaskDownSampler
137
+ kernel_size: 3
138
+ stride: 2
139
+ padding: 1
140
+ fuser:
141
+ _target_: sam2.modeling.memory_encoder.Fuser
142
+ layer:
143
+ _target_: sam2.modeling.memory_encoder.CXBlock
144
+ dim: 256
145
+ kernel_size: 7
146
+ padding: 3
147
+ layer_scale_init_value: 1.0e-06
148
+ use_dwconv: true
149
+ num_layers: 2
150
+ num_maskmem: 7
151
+ image_size: ${scratch.resolution}
152
+ sigmoid_scale_for_mem_enc: 20.0
153
+ sigmoid_bias_for_mem_enc: -10.0
154
+ use_mask_input_as_output_without_sam: true
155
+ directly_add_no_mem_embed: true
156
+ no_obj_embed_spatial: true
157
+ use_high_res_features_in_sam: true
158
+ multimask_output_in_sam: true
159
+ iou_prediction_use_sigmoid: true
160
+ use_obj_ptrs_in_encoder: true
161
+ add_tpos_enc_to_obj_ptrs: true
162
+ proj_tpos_enc_in_obj_ptrs: true
163
+ use_signed_tpos_enc_to_obj_ptrs: true
164
+ only_obj_ptrs_in_the_past_for_eval: true
165
+ pred_obj_scores: true
166
+ pred_obj_scores_mlp: true
167
+ fixed_no_obj_ptr: true
168
+ multimask_output_for_tracking: true
169
+ use_multimask_token_for_obj_ptr: true
170
+ multimask_min_pt_num: 0
171
+ multimask_max_pt_num: 1
172
+ use_mlp_for_obj_ptr_proj: true
173
+ prob_to_use_pt_input_for_train: 0.5
174
+ prob_to_use_pt_input_for_eval: 0.0
175
+ prob_to_use_box_input_for_train: 0.5
176
+ prob_to_use_box_input_for_eval: 0.0
177
+ prob_to_sample_from_gt_for_train: 0.1
178
+ num_frames_to_correct_for_train: 2
179
+ num_frames_to_correct_for_eval: 1
180
+ rand_frames_to_correct_for_train: true
181
+ add_all_frames_to_correct_as_cond: true
182
+ num_init_cond_frames_for_train: 2
183
+ rand_init_cond_frames_for_train: true
184
+ num_correction_pt_per_frame: 7
185
+ use_act_ckpt_iterative_pt_sampling: false
186
+ num_init_cond_frames_for_eval: 1
187
+ forward_backbone_per_frame_for_eval: true
188
+ data:
189
+ train:
190
+ _target_: training.dataset.sam2_datasets.TorchTrainMixedDataset
191
+ phases_per_epoch: ${scratch.phases_per_epoch}
192
+ batch_sizes:
193
+ - ${scratch.train_batch_size}
194
+ datasets:
195
+ - _target_: training.dataset.utils.RepeatFactorWrapper
196
+ dataset:
197
+ _target_: training.dataset.utils.ConcatDataset
198
+ datasets:
199
+ - _target_: training.dataset.vos_dataset.VOSDataset
200
+ transforms: ${vos.train_transforms}
201
+ training: true
202
+ video_dataset:
203
+ _target_: training.dataset.binary_png_raw_dataset.BinaryPNGRawDataset
204
+ img_folder: ${dataset.img_folder}
205
+ gt_folder: ${dataset.gt_folder}
206
+ file_list_txt: ${dataset.file_list_txt}
207
+ sampler:
208
+ _target_: training.dataset.vos_sampler.RandomUniformSampler
209
+ num_frames: ${scratch.num_frames}
210
+ max_num_objects: ${scratch.max_num_objects}
211
+ multiplier: ${dataset.multiplier}
212
+ shuffle: true
213
+ num_workers: ${scratch.num_train_workers}
214
+ pin_memory: true
215
+ drop_last: true
216
+ collate_fn:
217
+ _target_: training.utils.data_utils.collate_fn
218
+ _partial_: true
219
+ dict_key: all
220
+ optim:
221
+ amp:
222
+ enabled: true
223
+ amp_dtype: bfloat16
224
+ optimizer:
225
+ _target_: torch.optim.AdamW
226
+ gradient_clip:
227
+ _target_: training.optimizer.GradientClipper
228
+ max_norm: 0.1
229
+ norm_type: 2
230
+ param_group_modifiers:
231
+ - _target_: training.optimizer.layer_decay_param_modifier
232
+ _partial_: true
233
+ layer_decay_value: 0.9
234
+ apply_to: image_encoder.trunk
235
+ overrides:
236
+ - pattern: '*pos_embed*'
237
+ value: 1.0
238
+ options:
239
+ lr:
240
+ - scheduler:
241
+ _target_: fvcore.common.param_scheduler.CosineParamScheduler
242
+ start_value: ${scratch.base_lr}
243
+ end_value: ${divide:${scratch.base_lr},10}
244
+ - scheduler:
245
+ _target_: fvcore.common.param_scheduler.CosineParamScheduler
246
+ start_value: ${scratch.vision_lr}
247
+ end_value: ${divide:${scratch.vision_lr},10}
248
+ param_names:
249
+ - image_encoder.*
250
+ weight_decay:
251
+ - scheduler:
252
+ _target_: fvcore.common.param_scheduler.ConstantParamScheduler
253
+ value: 0.1
254
+ - scheduler:
255
+ _target_: fvcore.common.param_scheduler.ConstantParamScheduler
256
+ value: 0.0
257
+ param_names:
258
+ - '*bias*'
259
+ module_cls_names:
260
+ - torch.nn.LayerNorm
261
+ loss:
262
+ all:
263
+ _target_: training.loss_fns.MultiStepMultiMasksAndIous
264
+ weight_dict:
265
+ loss_mask: 20
266
+ loss_dice: 1
267
+ loss_iou: 1
268
+ loss_class: 1
269
+ supervise_all_iou: true
270
+ iou_use_l1_loss: true
271
+ pred_obj_scores: true
272
+ focal_gamma_obj_score: 0.0
273
+ focal_alpha_obj_score: -1.0
274
+ distributed:
275
+ backend: nccl
276
+ find_unused_parameters: true
277
+ logging:
278
+ tensorboard_writer:
279
+ _target_: training.utils.logger.make_tensorboard_logger
280
+ log_dir: ${launcher.experiment_log_dir}/tensorboard
281
+ flush_secs: 120
282
+ should_log: true
283
+ log_dir: ${launcher.experiment_log_dir}/logs
284
+ log_freq: 10
285
+ checkpoint:
286
+ save_dir: ${launcher.experiment_log_dir}/checkpoints
287
+ save_freq: 1
288
+ model_weight_initializer:
289
+ _partial_: true
290
+ _target_: training.utils.checkpoint_utils.load_state_dict_into_model
291
+ strict: true
292
+ ignore_unexpected_keys: null
293
+ ignore_missing_keys: null
294
+ state_dict:
295
+ _target_: training.utils.checkpoint_utils.load_checkpoint_and_apply_kernels
296
+ checkpoint_path: /work/nvme/bfgd/cmaduabuchi/MODELS/THRIVESEG/sam2.1_hiera_base_plus.pt
297
+ ckpt_state_dict_keys:
298
+ - model
299
+ launcher:
300
+ num_nodes: 1
301
+ gpus_per_node: 8
302
+ experiment_log_dir: /work/nvme/bfgd/cmaduabuchi/MODELS/THRIVESEG/experiment/thermal_run1
303
+ submitit:
304
+ partition: null
305
+ account: null
306
+ qos: null
307
+ cpus_per_task: 10
308
+ use_cluster: false
309
+ timeout_hour: 24
310
+ name: null
311
+ port_range:
312
+ - 10000
313
+ - 65000
experiment/thermal_run1/config_resolved.yaml ADDED
@@ -0,0 +1,351 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ scratch:
2
+ resolution: 1024
3
+ train_batch_size: 1
4
+ num_train_workers: 10
5
+ num_frames: 1
6
+ max_num_objects: 3
7
+ base_lr: 5.0e-06
8
+ vision_lr: 3.0e-06
9
+ phases_per_epoch: 1
10
+ num_epochs: 40
11
+ dataset:
12
+ img_folder: /work/nvme/bfgd/cmaduabuchi/DATA/thermal_video/thriveseg/train/images
13
+ gt_folder: /work/nvme/bfgd/cmaduabuchi/DATA/thermal_video/thriveseg/train/masks
14
+ file_list_txt: null
15
+ multiplier: 2
16
+ vos:
17
+ train_transforms:
18
+ - _target_: training.dataset.transforms.ComposeAPI
19
+ transforms:
20
+ - _target_: training.dataset.transforms.RandomHorizontalFlip
21
+ consistent_transform: true
22
+ - _target_: training.dataset.transforms.RandomAffine
23
+ degrees: 25
24
+ shear: 20
25
+ image_interpolation: bilinear
26
+ consistent_transform: true
27
+ - _target_: training.dataset.transforms.RandomResizeAPI
28
+ sizes: 1024
29
+ square: true
30
+ consistent_transform: true
31
+ - _target_: training.dataset.transforms.ColorJitter
32
+ consistent_transform: true
33
+ brightness: 0.1
34
+ contrast: 0.03
35
+ saturation: 0.03
36
+ hue: null
37
+ - _target_: training.dataset.transforms.RandomGrayscale
38
+ p: 0.05
39
+ consistent_transform: true
40
+ - _target_: training.dataset.transforms.ColorJitter
41
+ consistent_transform: false
42
+ brightness: 0.1
43
+ contrast: 0.05
44
+ saturation: 0.05
45
+ hue: null
46
+ - _target_: training.dataset.transforms.ToTensorAPI
47
+ - _target_: training.dataset.transforms.NormalizeAPI
48
+ mean:
49
+ - 0.485
50
+ - 0.456
51
+ - 0.406
52
+ std:
53
+ - 0.229
54
+ - 0.224
55
+ - 0.225
56
+ trainer:
57
+ _target_: training.trainer.Trainer
58
+ mode: train_only
59
+ max_epochs: 40
60
+ accelerator: cuda
61
+ seed_value: 123
62
+ model:
63
+ _target_: training.model.sam2.SAM2Train
64
+ image_encoder:
65
+ _target_: sam2.modeling.backbones.image_encoder.ImageEncoder
66
+ scalp: 1
67
+ trunk:
68
+ _target_: sam2.modeling.backbones.hieradet.Hiera
69
+ embed_dim: 112
70
+ num_heads: 2
71
+ drop_path_rate: 0.1
72
+ neck:
73
+ _target_: sam2.modeling.backbones.image_encoder.FpnNeck
74
+ position_encoding:
75
+ _target_: sam2.modeling.position_encoding.PositionEmbeddingSine
76
+ num_pos_feats: 256
77
+ normalize: true
78
+ scale: null
79
+ temperature: 10000
80
+ d_model: 256
81
+ backbone_channel_list:
82
+ - 896
83
+ - 448
84
+ - 224
85
+ - 112
86
+ fpn_top_down_levels:
87
+ - 2
88
+ - 3
89
+ fpn_interp_model: nearest
90
+ memory_attention:
91
+ _target_: sam2.modeling.memory_attention.MemoryAttention
92
+ d_model: 256
93
+ pos_enc_at_input: true
94
+ layer:
95
+ _target_: sam2.modeling.memory_attention.MemoryAttentionLayer
96
+ activation: relu
97
+ dim_feedforward: 2048
98
+ dropout: 0.1
99
+ pos_enc_at_attn: false
100
+ self_attention:
101
+ _target_: sam2.modeling.sam.transformer.RoPEAttention
102
+ rope_theta: 10000.0
103
+ feat_sizes:
104
+ - 64
105
+ - 64
106
+ embedding_dim: 256
107
+ num_heads: 1
108
+ downsample_rate: 1
109
+ dropout: 0.1
110
+ d_model: 256
111
+ pos_enc_at_cross_attn_keys: true
112
+ pos_enc_at_cross_attn_queries: false
113
+ cross_attention:
114
+ _target_: sam2.modeling.sam.transformer.RoPEAttention
115
+ rope_theta: 10000.0
116
+ feat_sizes:
117
+ - 64
118
+ - 64
119
+ rope_k_repeat: true
120
+ embedding_dim: 256
121
+ num_heads: 1
122
+ downsample_rate: 1
123
+ dropout: 0.1
124
+ kv_in_dim: 64
125
+ num_layers: 4
126
+ memory_encoder:
127
+ _target_: sam2.modeling.memory_encoder.MemoryEncoder
128
+ out_dim: 64
129
+ position_encoding:
130
+ _target_: sam2.modeling.position_encoding.PositionEmbeddingSine
131
+ num_pos_feats: 64
132
+ normalize: true
133
+ scale: null
134
+ temperature: 10000
135
+ mask_downsampler:
136
+ _target_: sam2.modeling.memory_encoder.MaskDownSampler
137
+ kernel_size: 3
138
+ stride: 2
139
+ padding: 1
140
+ fuser:
141
+ _target_: sam2.modeling.memory_encoder.Fuser
142
+ layer:
143
+ _target_: sam2.modeling.memory_encoder.CXBlock
144
+ dim: 256
145
+ kernel_size: 7
146
+ padding: 3
147
+ layer_scale_init_value: 1.0e-06
148
+ use_dwconv: true
149
+ num_layers: 2
150
+ num_maskmem: 7
151
+ image_size: 1024
152
+ sigmoid_scale_for_mem_enc: 20.0
153
+ sigmoid_bias_for_mem_enc: -10.0
154
+ use_mask_input_as_output_without_sam: true
155
+ directly_add_no_mem_embed: true
156
+ no_obj_embed_spatial: true
157
+ use_high_res_features_in_sam: true
158
+ multimask_output_in_sam: true
159
+ iou_prediction_use_sigmoid: true
160
+ use_obj_ptrs_in_encoder: true
161
+ add_tpos_enc_to_obj_ptrs: true
162
+ proj_tpos_enc_in_obj_ptrs: true
163
+ use_signed_tpos_enc_to_obj_ptrs: true
164
+ only_obj_ptrs_in_the_past_for_eval: true
165
+ pred_obj_scores: true
166
+ pred_obj_scores_mlp: true
167
+ fixed_no_obj_ptr: true
168
+ multimask_output_for_tracking: true
169
+ use_multimask_token_for_obj_ptr: true
170
+ multimask_min_pt_num: 0
171
+ multimask_max_pt_num: 1
172
+ use_mlp_for_obj_ptr_proj: true
173
+ prob_to_use_pt_input_for_train: 0.5
174
+ prob_to_use_pt_input_for_eval: 0.0
175
+ prob_to_use_box_input_for_train: 0.5
176
+ prob_to_use_box_input_for_eval: 0.0
177
+ prob_to_sample_from_gt_for_train: 0.1
178
+ num_frames_to_correct_for_train: 2
179
+ num_frames_to_correct_for_eval: 1
180
+ rand_frames_to_correct_for_train: true
181
+ add_all_frames_to_correct_as_cond: true
182
+ num_init_cond_frames_for_train: 2
183
+ rand_init_cond_frames_for_train: true
184
+ num_correction_pt_per_frame: 7
185
+ use_act_ckpt_iterative_pt_sampling: false
186
+ num_init_cond_frames_for_eval: 1
187
+ forward_backbone_per_frame_for_eval: true
188
+ data:
189
+ train:
190
+ _target_: training.dataset.sam2_datasets.TorchTrainMixedDataset
191
+ phases_per_epoch: 1
192
+ batch_sizes:
193
+ - 1
194
+ datasets:
195
+ - _target_: training.dataset.utils.RepeatFactorWrapper
196
+ dataset:
197
+ _target_: training.dataset.utils.ConcatDataset
198
+ datasets:
199
+ - _target_: training.dataset.vos_dataset.VOSDataset
200
+ transforms:
201
+ - _target_: training.dataset.transforms.ComposeAPI
202
+ transforms:
203
+ - _target_: training.dataset.transforms.RandomHorizontalFlip
204
+ consistent_transform: true
205
+ - _target_: training.dataset.transforms.RandomAffine
206
+ degrees: 25
207
+ shear: 20
208
+ image_interpolation: bilinear
209
+ consistent_transform: true
210
+ - _target_: training.dataset.transforms.RandomResizeAPI
211
+ sizes: 1024
212
+ square: true
213
+ consistent_transform: true
214
+ - _target_: training.dataset.transforms.ColorJitter
215
+ consistent_transform: true
216
+ brightness: 0.1
217
+ contrast: 0.03
218
+ saturation: 0.03
219
+ hue: null
220
+ - _target_: training.dataset.transforms.RandomGrayscale
221
+ p: 0.05
222
+ consistent_transform: true
223
+ - _target_: training.dataset.transforms.ColorJitter
224
+ consistent_transform: false
225
+ brightness: 0.1
226
+ contrast: 0.05
227
+ saturation: 0.05
228
+ hue: null
229
+ - _target_: training.dataset.transforms.ToTensorAPI
230
+ - _target_: training.dataset.transforms.NormalizeAPI
231
+ mean:
232
+ - 0.485
233
+ - 0.456
234
+ - 0.406
235
+ std:
236
+ - 0.229
237
+ - 0.224
238
+ - 0.225
239
+ training: true
240
+ video_dataset:
241
+ _target_: training.dataset.binary_png_raw_dataset.BinaryPNGRawDataset
242
+ img_folder: /work/nvme/bfgd/cmaduabuchi/DATA/thermal_video/thriveseg/train/images
243
+ gt_folder: /work/nvme/bfgd/cmaduabuchi/DATA/thermal_video/thriveseg/train/masks
244
+ file_list_txt: null
245
+ sampler:
246
+ _target_: training.dataset.vos_sampler.RandomUniformSampler
247
+ num_frames: 1
248
+ max_num_objects: 3
249
+ multiplier: 2
250
+ shuffle: true
251
+ num_workers: 10
252
+ pin_memory: true
253
+ drop_last: true
254
+ collate_fn:
255
+ _target_: training.utils.data_utils.collate_fn
256
+ _partial_: true
257
+ dict_key: all
258
+ optim:
259
+ amp:
260
+ enabled: true
261
+ amp_dtype: bfloat16
262
+ optimizer:
263
+ _target_: torch.optim.AdamW
264
+ gradient_clip:
265
+ _target_: training.optimizer.GradientClipper
266
+ max_norm: 0.1
267
+ norm_type: 2
268
+ param_group_modifiers:
269
+ - _target_: training.optimizer.layer_decay_param_modifier
270
+ _partial_: true
271
+ layer_decay_value: 0.9
272
+ apply_to: image_encoder.trunk
273
+ overrides:
274
+ - pattern: '*pos_embed*'
275
+ value: 1.0
276
+ options:
277
+ lr:
278
+ - scheduler:
279
+ _target_: fvcore.common.param_scheduler.CosineParamScheduler
280
+ start_value: 5.0e-06
281
+ end_value: 5.000000000000001e-07
282
+ - scheduler:
283
+ _target_: fvcore.common.param_scheduler.CosineParamScheduler
284
+ start_value: 3.0e-06
285
+ end_value: 3.0e-07
286
+ param_names:
287
+ - image_encoder.*
288
+ weight_decay:
289
+ - scheduler:
290
+ _target_: fvcore.common.param_scheduler.ConstantParamScheduler
291
+ value: 0.1
292
+ - scheduler:
293
+ _target_: fvcore.common.param_scheduler.ConstantParamScheduler
294
+ value: 0.0
295
+ param_names:
296
+ - '*bias*'
297
+ module_cls_names:
298
+ - torch.nn.LayerNorm
299
+ loss:
300
+ all:
301
+ _target_: training.loss_fns.MultiStepMultiMasksAndIous
302
+ weight_dict:
303
+ loss_mask: 20
304
+ loss_dice: 1
305
+ loss_iou: 1
306
+ loss_class: 1
307
+ supervise_all_iou: true
308
+ iou_use_l1_loss: true
309
+ pred_obj_scores: true
310
+ focal_gamma_obj_score: 0.0
311
+ focal_alpha_obj_score: -1.0
312
+ distributed:
313
+ backend: nccl
314
+ find_unused_parameters: true
315
+ logging:
316
+ tensorboard_writer:
317
+ _target_: training.utils.logger.make_tensorboard_logger
318
+ log_dir: /work/nvme/bfgd/cmaduabuchi/MODELS/THRIVESEG/experiment/thermal_run1/tensorboard
319
+ flush_secs: 120
320
+ should_log: true
321
+ log_dir: /work/nvme/bfgd/cmaduabuchi/MODELS/THRIVESEG/experiment/thermal_run1/logs
322
+ log_freq: 10
323
+ checkpoint:
324
+ save_dir: /work/nvme/bfgd/cmaduabuchi/MODELS/THRIVESEG/experiment/thermal_run1/checkpoints
325
+ save_freq: 1
326
+ model_weight_initializer:
327
+ _partial_: true
328
+ _target_: training.utils.checkpoint_utils.load_state_dict_into_model
329
+ strict: true
330
+ ignore_unexpected_keys: null
331
+ ignore_missing_keys: null
332
+ state_dict:
333
+ _target_: training.utils.checkpoint_utils.load_checkpoint_and_apply_kernels
334
+ checkpoint_path: /work/nvme/bfgd/cmaduabuchi/MODELS/THRIVESEG/sam2.1_hiera_base_plus.pt
335
+ ckpt_state_dict_keys:
336
+ - model
337
+ launcher:
338
+ num_nodes: 1
339
+ gpus_per_node: 8
340
+ experiment_log_dir: /work/nvme/bfgd/cmaduabuchi/MODELS/THRIVESEG/experiment/thermal_run1
341
+ submitit:
342
+ partition: null
343
+ account: null
344
+ qos: null
345
+ cpus_per_task: 10
346
+ use_cluster: false
347
+ timeout_hour: 24
348
+ name: null
349
+ port_range:
350
+ - 10000
351
+ - 65000
experiment/thermal_run1/logs/best_stats.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"Trainer/where": 0.0249937374749499, "Trainer/epoch": 0, "Trainer/steps_train": 3992}
2
+ {"Trainer/where": 0.0499937374749499, "Trainer/epoch": 1, "Trainer/steps_train": 7984}
3
+ {"Trainer/where": 0.0749937374749499, "Trainer/epoch": 2, "Trainer/steps_train": 11976}
4
+ {"Trainer/where": 0.09999373747494991, "Trainer/epoch": 3, "Trainer/steps_train": 15968}
5
+ {"Trainer/where": 0.1249937374749499, "Trainer/epoch": 4, "Trainer/steps_train": 19960}
6
+ {"Trainer/where": 0.1499937374749499, "Trainer/epoch": 5, "Trainer/steps_train": 23952}
7
+ {"Trainer/where": 0.1749937374749499, "Trainer/epoch": 6, "Trainer/steps_train": 27944}
8
+ {"Trainer/where": 0.19999373747494992, "Trainer/epoch": 7, "Trainer/steps_train": 31936}
9
+ {"Trainer/where": 0.2249937374749499, "Trainer/epoch": 8, "Trainer/steps_train": 35928}
10
+ {"Trainer/where": 0.2499937374749499, "Trainer/epoch": 9, "Trainer/steps_train": 39920}
11
+ {"Trainer/where": 0.27499373747494993, "Trainer/epoch": 10, "Trainer/steps_train": 43912}
12
+ {"Trainer/where": 0.2999937374749499, "Trainer/epoch": 11, "Trainer/steps_train": 47904}
13
+ {"Trainer/where": 0.3249937374749499, "Trainer/epoch": 12, "Trainer/steps_train": 51896}
14
+ {"Trainer/where": 0.3499937374749499, "Trainer/epoch": 13, "Trainer/steps_train": 55888}
15
+ {"Trainer/where": 0.3749937374749499, "Trainer/epoch": 14, "Trainer/steps_train": 59880}
16
+ {"Trainer/where": 0.39999373747494993, "Trainer/epoch": 15, "Trainer/steps_train": 63872}
17
+ {"Trainer/where": 0.4249937374749499, "Trainer/epoch": 16, "Trainer/steps_train": 67864}
18
+ {"Trainer/where": 0.4499937374749499, "Trainer/epoch": 17, "Trainer/steps_train": 71856}
19
+ {"Trainer/where": 0.4749937374749499, "Trainer/epoch": 18, "Trainer/steps_train": 75848}
20
+ {"Trainer/where": 0.4999937374749499, "Trainer/epoch": 19, "Trainer/steps_train": 79840}
21
+ {"Trainer/where": 0.5249937374749499, "Trainer/epoch": 20, "Trainer/steps_train": 83832}
22
+ {"Trainer/where": 0.54999373747495, "Trainer/epoch": 21, "Trainer/steps_train": 87824}
23
+ {"Trainer/where": 0.5749937374749499, "Trainer/epoch": 22, "Trainer/steps_train": 91816}
24
+ {"Trainer/where": 0.5999937374749499, "Trainer/epoch": 23, "Trainer/steps_train": 95808}
25
+ {"Trainer/where": 0.6249937374749499, "Trainer/epoch": 24, "Trainer/steps_train": 99800}
26
+ {"Trainer/where": 0.6499937374749499, "Trainer/epoch": 25, "Trainer/steps_train": 103792}
27
+ {"Trainer/where": 0.67499373747495, "Trainer/epoch": 26, "Trainer/steps_train": 107784}
28
+ {"Trainer/where": 0.6999937374749499, "Trainer/epoch": 27, "Trainer/steps_train": 111776}
29
+ {"Trainer/where": 0.7249937374749499, "Trainer/epoch": 28, "Trainer/steps_train": 115768}
30
+ {"Trainer/where": 0.7499937374749499, "Trainer/epoch": 29, "Trainer/steps_train": 119760}
31
+ {"Trainer/where": 0.7749937374749499, "Trainer/epoch": 30, "Trainer/steps_train": 123752}
32
+ {"Trainer/where": 0.79999373747495, "Trainer/epoch": 31, "Trainer/steps_train": 127744}
33
+ {"Trainer/where": 0.8249937374749499, "Trainer/epoch": 32, "Trainer/steps_train": 131736}
34
+ {"Trainer/where": 0.8499937374749498, "Trainer/epoch": 33, "Trainer/steps_train": 135728}
35
+ {"Trainer/where": 0.8749937374749498, "Trainer/epoch": 34, "Trainer/steps_train": 139720}
36
+ {"Trainer/where": 0.8999937374749498, "Trainer/epoch": 35, "Trainer/steps_train": 143712}
37
+ {"Trainer/where": 0.9249937374749498, "Trainer/epoch": 36, "Trainer/steps_train": 147704}
38
+ {"Trainer/where": 0.9499937374749499, "Trainer/epoch": 37, "Trainer/steps_train": 151696}
39
+ {"Trainer/where": 0.9749937374749498, "Trainer/epoch": 38, "Trainer/steps_train": 155688}
40
+ {"Trainer/where": 0.9999937374749498, "Trainer/epoch": 39, "Trainer/steps_train": 159680}
experiment/thermal_run1/logs/log.txt ADDED
@@ -0,0 +1,732 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ INFO 2025-10-06 06:35:10,376 train_utils.py: 109: MACHINE SEED: 4920
2
+ INFO 2025-10-06 06:35:10,389 train_utils.py: 155: Logging ENV_VARIABLES
3
+ INFO 2025-10-06 06:35:10,389 train_utils.py: 156: BASH_ENV=/usr/share/lmod/lmod/init/bash
4
+ BASH_FUNC_ml%%=() { eval "$($LMOD_DIR/ml_cmd "$@")"
5
+ }
6
+ BASH_FUNC_module%%=() { if [ -z "${LMOD_SH_DBG_ON+x}" ]; then
7
+ case "$-" in
8
+ *v*x*)
9
+ __lmod_sh_dbg='vx'
10
+ ;;
11
+ *v*)
12
+ __lmod_sh_dbg='v'
13
+ ;;
14
+ *x*)
15
+ __lmod_sh_dbg='x'
16
+ ;;
17
+ esac;
18
+ fi;
19
+ if [ -n "${__lmod_sh_dbg:-}" ]; then
20
+ set +$__lmod_sh_dbg;
21
+ echo "Shell debugging temporarily silenced: export LMOD_SH_DBG_ON=1 for Lmod's output" 1>&2;
22
+ fi;
23
+ eval "$($LMOD_CMD shell "$@")" && eval "$(${LMOD_SETTARG_CMD:-:} -s sh)";
24
+ __lmod_my_status=$?;
25
+ if [ -n "${__lmod_sh_dbg:-}" ]; then
26
+ echo "Shell debugging restarted" 1>&2;
27
+ set -$__lmod_sh_dbg;
28
+ fi;
29
+ unset __lmod_sh_dbg;
30
+ return $__lmod_my_status
31
+ }
32
+ BASH_FUNC_which%%=() { ( alias;
33
+ eval ${which_declare} ) | /usr/bin/which --tty-only --read-alias --read-functions --show-tilde --show-dot $@
34
+ }
35
+ BROWSER=/u/cmaduabuchi/.vscode-server/cli/servers/Stable-0f0d87fa9e96c856c5212fc86db137ac0d783365/server/bin/helpers/browser.sh
36
+ BUNDLED_DEBUGPY_PATH=/u/cmaduabuchi/.vscode-server/extensions/ms-python.debugpy-2025.10.0-linux-x64/bundled/libs/debugpy
37
+ CC=/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/bin/gcc
38
+ CMAKE_PREFIX_PATH=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc:/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74:/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku
39
+ COLORTERM=truecolor
40
+ CONDA_DEFAULT_ENV=sam2
41
+ CONDA_EXE=/sw/external/python/anaconda3/bin/conda
42
+ CONDA_PREFIX=/u/cmaduabuchi/.conda/envs/sam2
43
+ CONDA_PREFIX_1=/sw/external/python/anaconda3
44
+ CONDA_PREFIX_2=/u/cmaduabuchi/.conda/envs/sam2
45
+ CONDA_PREFIX_3=/sw/external/python/anaconda3
46
+ CONDA_PROMPT_MODIFIER=(sam2)
47
+ CONDA_PYTHON_EXE=/sw/external/python/anaconda3/bin/python
48
+ CONDA_SHLVL=4
49
+ CPLUS_INCLUDE_PATH=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc/include:/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/include:/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/include
50
+ CRAY_ENABLE_PE=/etc/cray-pe.d/enable-pe.sh
51
+ CUDA_HOME=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc
52
+ CUDA_MODULE_LOADING=LAZY
53
+ CUDA_VISIBLE_DEVICES=0
54
+ CUE_CLUSTER_HOME=/u/cmaduabuchi
55
+ CUE_DOCS=https://portal.xsede.org/ncsa-delta
56
+ CUE_HOME=/u/cmaduabuchi
57
+ CUE_HOME_TYPE=lustre-2.14
58
+ CUE_HOSTNAME=dt-login03.delta.ncsa.illinois.edu
59
+ CUE_PROMPT_HOST=dt-login03.delta
60
+ CUE_RESOURCE_ID=delta-cpu.ncsa.xsede.org
61
+ CXX=/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/bin/g++
62
+ C_INCLUDE_PATH=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc/include:/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/include:/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/include
63
+ DBUS_SESSION_BUS_ADDRESS=unix:path=/run/user/77886/bus
64
+ F77=/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/bin/gfortran
65
+ FC=/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/bin/gfortran
66
+ FPATH=/usr/share/lmod/lmod/init/ksh_funcs
67
+ GCC_HOME=/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku
68
+ GIT_ASKPASS=/u/cmaduabuchi/.vscode-server/cli/servers/Stable-0f0d87fa9e96c856c5212fc86db137ac0d783365/server/extensions/git/dist/askpass.sh
69
+ GPU_DEVICE_ORDINAL=0
70
+ HISTCONTROL=ignoredups
71
+ HISTFILE=/u/cmaduabuchi/.bash_commands.log
72
+ HISTSIZE=50000
73
+ HISTTIMEFORMAT=%h %d %H:%M:%S
74
+ HOME=/u/cmaduabuchi
75
+ HOSTNAME=dt-login03.delta.ncsa.illinois.edu
76
+ HYDRA_BOOTSTRAP=slurm
77
+ HYDRA_FULL_ERROR=1
78
+ HYDRA_LAUNCHER_EXTRA_ARGS=--external-launcher
79
+ INCLUDE=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc/include:/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/include:/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/include
80
+ I_MPI_HYDRA_BOOTSTRAP=slurm
81
+ I_MPI_HYDRA_BOOTSTRAP_EXEC_EXTRA_ARGS=--external-launcher
82
+ LANG=en_US.UTF-8
83
+ LD_LIBRARY_PATH=/sw/spack/delta-2022-03/apps/gcc/11.2.0-gcc-8.4.1-fxgnsyr/lib64:/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc/lib64:/opt/cray/libfabric/1.15.2.0/lib64:/opt/cray/libfabric/1.15.2.0/lib
84
+ LESSOPEN=||/usr/bin/lesspipe.sh %s
85
+ LIBRARY_PATH=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc/lib64:/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/lib:/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/lib64:/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/lib
86
+ LMOD_AVAIL_STYLE=system
87
+ LMOD_CMD=/usr/share/lmod/lmod/libexec/lmod
88
+ LMOD_COLORIZE=yes
89
+ LMOD_DIR=/usr/share/lmod/lmod/libexec
90
+ LMOD_FAMILY_COMPILER=gcc
91
+ LMOD_FAMILY_COMPILER_VERSION=11.4.0
92
+ LMOD_FAMILY_MPI=openmpi
93
+ LMOD_FAMILY_MPI_VERSION=4.1.6
94
+ LMOD_FULL_SETTARG_SUPPORT=no
95
+ LMOD_MPI_NAME=openmpi
96
+ LMOD_MPI_VERSION=4.1.6-lranp74
97
+ LMOD_PKG=/usr/share/lmod/lmod
98
+ LMOD_PREPEND_BLOCK=normal
99
+ LMOD_ROOT=/usr/share/lmod
100
+ LMOD_SETTARG_CMD=:
101
+ LMOD_SETTARG_FULL_SUPPORT=no
102
+ LMOD_SITE_NAME=NCSA
103
+ LMOD_SYSTEM_DEFAULT_MODULES=default-s11
104
+ LMOD_SYSTEM_NAME=Delta
105
+ LMOD_VERSION=8.7.55
106
+ LMOD_arch=x86_64
107
+ LMOD_sys=Linux
108
+ LOADEDMODULES=gcc/11.4.0:openmpi/4.1.6:cuda/11.8.0:cue-login-env/1.1:slurm-env/0.1:default-s11:anaconda3_cpu/23.7.4
109
+ LOCAL_RANK=0
110
+ LOGNAME=cmaduabuchi
111
+ MAIL=/var/spool/mail/cmaduabuchi
112
+ MANPATH=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/share/man:/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/share/man:/usr/share/lmod/lmod/share/man:/usr/local/share/man:/usr/share/man:/opt/ddn/ime/share/man:/opt/puppetlabs/puppet/share/man:/sw/external/python/anaconda3_cpu/man:/sw/external/python/anaconda3/man:/u/cmaduabuchi/.local/share/man:/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/share/man:/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/share/man:/usr/local/share/man:/usr/share/man:/opt/ddn/ime/share/man:/sw/external/python/anaconda3/man:/sw/external/python/anaconda3_cpu/man:/u/cmaduabuchi/.local/share/man:/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/share/man:/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/share/man:/usr/local/share/man:/usr/share/man:/opt/ddn/ime/share/man:/opt/ddn/ime/share/man:/opt/ddn/ime/share/man:/opt/ddn/ime/share/man:/opt/ddn/ime/share/man
113
+ MASTER_ADDR=localhost
114
+ MASTER_PORT=48488
115
+ MODULEPATH=/sw/spack/deltas11-2023-03/modules/lmod/openmpi/4.1.6-lo6xae6/gcc/11.4.0:/sw/spack/deltas11-2023-03/modules/lmod/openmpi/4.1.6-lranp74/gcc/11.4.0:/sw/spack/deltas11-2023-03/modules/lmod/gcc/11.4.0:/sw/user/modules:/sw/spack/deltas11-2023-03/modules/lmod/Core:/opt/cray/pe/lmod/modulefiles/craype-targets/default:/opt/cray/pe/lmod/modulefiles/core:/opt/cray/modulefiles:/sw/external/lmod/modulefiles/core:/usr/share/lmod/lmod/modulefiles/Core
116
+ MODULEPATH_ROOT=/
117
+ MODULESHOME=/usr/share/lmod/lmod
118
+ MPICC=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/bin/mpicc
119
+ MPICXX=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/bin/mpic++
120
+ MPIF77=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/bin/mpif77
121
+ MPIF90=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/bin/mpif90
122
+ NCSA_FAMILY_COMPILER=gcc
123
+ NCSA_FAMILY_COMPILER_VERSION=11.4.0
124
+ NCSA_FAMILY_MPI=openmpi
125
+ NCSA_FAMILY_MPI_VERSION=4.1.6
126
+ NVHPC_CUDA_HOME=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc
127
+ OLDPWD=/work/nvme/bfgd/cmaduabuchi/THRIVESEG/sam2
128
+ OMPI_MCA_btl_tcp_endpoint_cache=67108864
129
+ OMPI_MCA_btl_tcp_latency_hsn0=2
130
+ OMPI_MCA_btl_tcp_rdma_pipeline_send_length=1048576
131
+ OMPI_MCA_mtl_ofi_provider_include=cxi
132
+ OMPI_MCA_opal_common_ucx_opal_mem_hooks=1
133
+ OMPI_MCA_opal_warn_on_missing_libcuda=0
134
+ OMPI_MCA_plm_slurm_args=--external-launcher
135
+ OMPI_MCA_ras_base_verbose=10
136
+ OPENMPI_HOME=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74
137
+ PATH=/u/cmaduabuchi/.vscode-server/cli/servers/Stable-0f0d87fa9e96c856c5212fc86db137ac0d783365/server/bin/remote-cli:/u/cmaduabuchi/.conda/envs/sam2/bin:/sw/external/python/anaconda3/condabin:/sw/external/python/anaconda3_cpu/bin:/u/cmaduabuchi/.local/bin:/u/cmaduabuchi/bin:/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc/bin:/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/bin:/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/bin:/sw/user/scripts:/usr/local/bin:/usr/bin:/usr/local/sbin:/usr/sbin:/opt/ddn/ime/bin:/opt/puppetlabs/bin:/opt/ddn/ime/bin:/u/cmaduabuchi/.vscode-server/extensions/ms-python.debugpy-2025.10.0-linux-x64/bundled/scripts/noConfigScripts:/u/cmaduabuchi/.vscode-server/data/User/globalStorage/github.copilot-chat/debugCommand:/opt/ddn/ime/bin:/opt/ddn/ime/bin:/opt/ddn/ime/bin
138
+ PKG_CONFIG_PATH=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/lib/pkgconfig
139
+ PMI_FD=10
140
+ PMI_JOBID=12652122.0
141
+ PMI_RANK=0
142
+ PMI_SIZE=1
143
+ PRTE_MCA_plm_slurm_args=--external-launcher
144
+ PWD=/work/nvme/bfgd/cmaduabuchi/THRIVESEG/sam2
145
+ PYDEVD_DISABLE_FILE_VALIDATION=1
146
+ PYTHONSTARTUP=/u/cmaduabuchi/.vscode-server/data/User/workspaceStorage/e99aa778c8fbcf5603c74656a7713b05/ms-python.python/pythonrc.py
147
+ PYTHON_BASIC_REPL=1
148
+ RANK=0
149
+ ROCR_VISIBLE_DEVICES=0
150
+ SALLOC_KILL_CMD=1
151
+ SHELL=/bin/bash
152
+ SHLVL=8
153
+ SLURMD_DEBUG=2
154
+ SLURMD_NODENAME=gpub060
155
+ SLURM_CLUSTER_NAME=delta
156
+ SLURM_CONF=/var/spool/slurmd/conf-cache/slurm.conf
157
+ SLURM_CPUS_ON_NODE=16
158
+ SLURM_CPUS_PER_GPU=16
159
+ SLURM_CPU_BIND=quiet,mask_cpu:0x0000000000FFFF00
160
+ SLURM_CPU_BIND_LIST=0x0000000000FFFF00
161
+ SLURM_CPU_BIND_TYPE=mask_cpu:
162
+ SLURM_CPU_BIND_VERBOSE=quiet
163
+ SLURM_GPUS_ON_NODE=1
164
+ SLURM_GPUS_PER_NODE=1
165
+ SLURM_GTIDS=0
166
+ SLURM_JOBID=12652122
167
+ SLURM_JOB_ACCOUNT=becs-delta-gpu
168
+ SLURM_JOB_CPUS_PER_NODE=16
169
+ SLURM_JOB_END_TIME=1759922844
170
+ SLURM_JOB_GID=202
171
+ SLURM_JOB_GROUP=grp_202
172
+ SLURM_JOB_ID=12652122
173
+ SLURM_JOB_NAME=demo
174
+ SLURM_JOB_NODELIST=gpub060
175
+ SLURM_JOB_NUM_NODES=1
176
+ SLURM_JOB_PARTITION=gpuA40x4
177
+ SLURM_JOB_QOS=becs-delta-gpu
178
+ SLURM_JOB_START_TIME=1759750044
179
+ SLURM_JOB_UID=77886
180
+ SLURM_JOB_USER=cmaduabuchi
181
+ SLURM_LAUNCH_NODE_IPADDR=141.142.253.42
182
+ SLURM_LOCALID=0
183
+ SLURM_MEM_PER_GPU=81920
184
+ SLURM_MPI_TYPE=pmi2
185
+ SLURM_NNODES=1
186
+ SLURM_NODEID=0
187
+ SLURM_NODELIST=gpub060
188
+ SLURM_NPROCS=1
189
+ SLURM_NTASKS=1
190
+ SLURM_PRIO_PROCESS=0
191
+ SLURM_PROCID=0
192
+ SLURM_PTY_PORT=39771
193
+ SLURM_PTY_WIN_COL=91
194
+ SLURM_PTY_WIN_ROW=69
195
+ SLURM_SRUN_COMM_HOST=141.142.253.42
196
+ SLURM_SRUN_COMM_PORT=43569
197
+ SLURM_STEPID=0
198
+ SLURM_STEP_GPUS=1
199
+ SLURM_STEP_ID=0
200
+ SLURM_STEP_LAUNCHER_PORT=43569
201
+ SLURM_STEP_NODELIST=gpub060
202
+ SLURM_STEP_NUM_NODES=1
203
+ SLURM_STEP_NUM_TASKS=1
204
+ SLURM_STEP_TASKS_PER_NODE=1
205
+ SLURM_SUBMIT_DIR=/work/nvme/bfgd/cmaduabuchi
206
+ SLURM_SUBMIT_HOST=dt-login03.delta.ncsa.illinois.edu
207
+ SLURM_TASKS_PER_NODE=1
208
+ SLURM_TASK_PID=916888
209
+ SLURM_TOPOLOGY_ADDR=ss00.ss11.gpub060
210
+ SLURM_TOPOLOGY_ADDR_PATTERN=switch.switch.node
211
+ SLURM_UMASK=0077
212
+ SQUEUE_FORMAT=%.12i %.12P %.12j %.14u %.2t %.10M %.6D %.18R %f
213
+ SRUN_DEBUG=3
214
+ SSH_CLIENT=128.195.95.47 32161 22
215
+ SSH_CONNECTION=169.234.226.25 58665 141.142.140.196 22
216
+ SSL_CERT_DIR=/etc/pki/tls/certs
217
+ SSL_CERT_FILE=/etc/pki/ca-trust/extracted/pem/tls-ca-bundle.pem
218
+ TERM=screen
219
+ TERM_PROGRAM=vscode
220
+ TERM_PROGRAM_VERSION=1.104.1
221
+ TMOUT=86400
222
+ TMPDIR=/tmp
223
+ TMUX=/tmp/tmux-77886/default,3561957,1
224
+ TMUX_PANE=%1
225
+ TORCH_NCCL_ASYNC_ERROR_HANDLING=1
226
+ USER=cmaduabuchi
227
+ VSCODE_DEBUGPY_ADAPTER_ENDPOINTS=/u/cmaduabuchi/.vscode-server/extensions/ms-python.debugpy-2025.10.0-linux-x64/.noConfigDebugAdapterEndpoints/endpoint-ad8f8f00eace4009.txt
228
+ VSCODE_GIT_ASKPASS_EXTRA_ARGS=
229
+ VSCODE_GIT_ASKPASS_MAIN=/u/cmaduabuchi/.vscode-server/cli/servers/Stable-0f0d87fa9e96c856c5212fc86db137ac0d783365/server/extensions/git/dist/askpass-main.js
230
+ VSCODE_GIT_ASKPASS_NODE=/u/cmaduabuchi/.vscode-server/cli/servers/Stable-0f0d87fa9e96c856c5212fc86db137ac0d783365/server/node
231
+ VSCODE_GIT_IPC_HANDLE=/run/user/77886/vscode-git-922d1ac20a.sock
232
+ VSCODE_IPC_HOOK_CLI=/run/user/77886/vscode-ipc-4d775fc7-d69f-439f-a012-2b869d146d9e.sock
233
+ VSCODE_PYTHON_AUTOACTIVATE_GUARD=1
234
+ WORLD_SIZE=1
235
+ XDG_RUNTIME_DIR=/run/user/77886
236
+ XDG_SESSION_ID=114322
237
+ ZE_AFFINITY_MASK=0
238
+ _=/u/cmaduabuchi/.conda/envs/sam2/bin/python
239
+ _CE_CONDA=
240
+ _CE_M=
241
+ _LMFILES_=/sw/spack/deltas11-2023-03/modules/lmod/Core/gcc/11.4.0.lua:/sw/spack/deltas11-2023-03/modules/lmod/gcc/11.4.0/openmpi/4.1.6.lua:/sw/spack/deltas11-2023-03/modules/lmod/gcc/11.4.0/cuda/11.8.0.lua:/sw/user/modules/cue-login-env/1.1.lua:/sw/user/modules/slurm-env/0.1.lua:/sw/user/modules/default-s11.lua:/sw/user/modules/anaconda3_cpu/23.7.4.lua
242
+ _ModuleTable001_=X01vZHVsZVRhYmxlXyA9IHsKTVR2ZXJzaW9uID0gMywKY19yZWJ1aWxkVGltZSA9IGZhbHNlLApjX3Nob3J0VGltZSA9IGZhbHNlLApkZXB0aFQgPSB7fSwKZmFtaWx5ID0gewpjb21waWxlciA9ICJnY2MiLAptcGkgPSAib3Blbm1waSIsCn0sCm1UID0gewphbmFjb25kYTNfY3B1ID0gewpmbiA9ICIvc3cvdXNlci9tb2R1bGVzL2FuYWNvbmRhM19jcHUvMjMuNy40Lmx1YSIsCmZ1bGxOYW1lID0gImFuYWNvbmRhM19jcHUvMjMuNy40IiwKbG9hZE9yZGVyID0gNywKcHJvcFQgPSB7fSwKc3RhY2tEZXB0aCA9IDAsCnN0YXR1cyA9ICJhY3RpdmUiLAp1c2VyTmFtZSA9ICJhbmFjb25kYTNfY3B1LzIzLjcuNCIsCndWID0gIl4wMDAwMDAyMy4wMDAwMDAwMDcuMDAwMDAwMDA0Lip6
243
+ _ModuleTable002_=ZmluYWwiLAp9LApjdWRhID0gewpmbiA9ICIvc3cvc3BhY2svZGVsdGFzMTEtMjAyMy0wMy9tb2R1bGVzL2xtb2QvZ2NjLzExLjQuMC9jdWRhLzExLjguMC5sdWEiLApmdWxsTmFtZSA9ICJjdWRhLzExLjguMCIsCmxvYWRPcmRlciA9IDMsCnByb3BUID0ge30sCnN0YWNrRGVwdGggPSAxLApzdGF0dXMgPSAiYWN0aXZlIiwKdXNlck5hbWUgPSAiY3VkYSIsCndWID0gIl4wMDAwMDAxMS4wMDAwMDAwMDguKnpmaW5hbCIsCn0sClsiY3VlLWxvZ2luLWVudiJdID0gewpmbiA9ICIvc3cvdXNlci9tb2R1bGVzL2N1ZS1sb2dpbi1lbnYvMS4xLmx1YSIsCmZ1bGxOYW1lID0gImN1ZS1sb2dpbi1lbnYvMS4xIiwKbG9hZE9yZGVyID0gNCwKcHJvcFQgPSB7fSwKc3RhY2tEZXB0aCA9IDEs
244
+ _ModuleTable003_=CnN0YXR1cyA9ICJhY3RpdmUiLAp1c2VyTmFtZSA9ICJjdWUtbG9naW4tZW52IiwKd1YgPSAiMDAwMDAwMDAxLjAwMDAwMDAwMS4qemZpbmFsIiwKfSwKWyJkZWZhdWx0LXMxMSJdID0gewpmbiA9ICIvc3cvdXNlci9tb2R1bGVzL2RlZmF1bHQtczExLmx1YSIsCmZ1bGxOYW1lID0gImRlZmF1bHQtczExIiwKbG9hZE9yZGVyID0gNiwKcHJvcFQgPSB7fSwKc3RhY2tEZXB0aCA9IDAsCnN0YXR1cyA9ICJhY3RpdmUiLAp1c2VyTmFtZSA9ICJkZWZhdWx0LXMxMSIsCndWID0gIk0uKnpmaW5hbCIsCn0sCmdjYyA9IHsKYWN0aW9uQSA9IHsKInByZXBlbmRfcGF0aChcIk1PRFVMRVBBVEhcIixcIi9zdy9zcGFjay9kZWx0YXMxMS0yMDIzLTAzL21vZHVsZXMvbG1vZC9nY2MvMTEuNC4w
245
+ _ModuleTable004_=XCIpIiwKfSwKZm4gPSAiL3N3L3NwYWNrL2RlbHRhczExLTIwMjMtMDMvbW9kdWxlcy9sbW9kL0NvcmUvZ2NjLzExLjQuMC5sdWEiLApmdWxsTmFtZSA9ICJnY2MvMTEuNC4wIiwKbG9hZE9yZGVyID0gMSwKcHJvcFQgPSB7fSwKc3RhY2tEZXB0aCA9IDEsCnN0YXR1cyA9ICJhY3RpdmUiLAp1c2VyTmFtZSA9ICJnY2MiLAp3ViA9ICJeMDAwMDAwMTEuMDAwMDAwMDA0Lip6ZmluYWwiLAp9LApvcGVubXBpID0gewphY3Rpb25BID0gewoKInByZXBlbmRfcGF0aChcIk1PRFVMRVBBVEhcIixcIi9zdy9zcGFjay9kZWx0YXMxMS0yMDIzLTAzL21vZHVsZXMvbG1vZC9vcGVubXBpLzQuMS42LWxyYW5wNzQvZ2NjLzExLjQuMFwiKSIsICJwcmVwZW5kX3BhdGgoXCJNT0RVTEVQQVRIXCIs
246
+ _ModuleTable005_=XCIvc3cvc3BhY2svZGVsdGFzMTEtMjAyMy0wMy9tb2R1bGVzL2xtb2Qvb3Blbm1waS80LjEuNi1sbzZ4YWU2L2djYy8xMS40LjBcIikiLAp9LApmbiA9ICIvc3cvc3BhY2svZGVsdGFzMTEtMjAyMy0wMy9tb2R1bGVzL2xtb2QvZ2NjLzExLjQuMC9vcGVubXBpLzQuMS42Lmx1YSIsCmZ1bGxOYW1lID0gIm9wZW5tcGkvNC4xLjYiLApsb2FkT3JkZXIgPSAyLApwcm9wVCA9IHt9LApzdGFja0RlcHRoID0gMSwKc3RhdHVzID0gImFjdGl2ZSIsCnVzZXJOYW1lID0gIm9wZW5tcGkiLAp3ViA9ICJeMDAwMDAwMDQuMDAwMDAwMDAxLjAwMDAwMDAwNi4qemZpbmFsIiwKfSwKWyJzbHVybS1lbnYiXSA9IHsKZm4gPSAiL3N3L3VzZXIvbW9kdWxlcy9zbHVybS1lbnYvMC4xLmx1YSIsCmZ1
247
+ _ModuleTable006_=bGxOYW1lID0gInNsdXJtLWVudi8wLjEiLApsb2FkT3JkZXIgPSA1LApwcm9wVCA9IHt9LApzdGFja0RlcHRoID0gMSwKc3RhdHVzID0gImFjdGl2ZSIsCnVzZXJOYW1lID0gInNsdXJtLWVudiIsCndWID0gIjAwMDAwMDAwMC4wMDAwMDAwMDEuKnpmaW5hbCIsCn0sCn0sCm1wYXRoQSA9IHsKIi9zdy9zcGFjay9kZWx0YXMxMS0yMDIzLTAzL21vZHVsZXMvbG1vZC9vcGVubXBpLzQuMS42LWxvNnhhZTYvZ2NjLzExLjQuMCIKLCAiL3N3L3NwYWNrL2RlbHRhczExLTIwMjMtMDMvbW9kdWxlcy9sbW9kL29wZW5tcGkvNC4xLjYtbHJhbnA3NC9nY2MvMTEuNC4wIgosICIvc3cvc3BhY2svZGVsdGFzMTEtMjAyMy0wMy9tb2R1bGVzL2xtb2QvZ2NjLzExLjQuMCIsICIvc3cvdXNlci9t
248
+ _ModuleTable007_=b2R1bGVzIgosICIvc3cvc3BhY2svZGVsdGFzMTEtMjAyMy0wMy9tb2R1bGVzL2xtb2QvQ29yZSIKLCAiL29wdC9jcmF5L3BlL2xtb2QvbW9kdWxlZmlsZXMvY3JheXBlLXRhcmdldHMvZGVmYXVsdCIKLCAiL29wdC9jcmF5L3BlL2xtb2QvbW9kdWxlZmlsZXMvY29yZSIsICIvb3B0L2NyYXkvbW9kdWxlZmlsZXMiCiwgIi9zdy9leHRlcm5hbC9sbW9kL21vZHVsZWZpbGVzL2NvcmUiLCAiL3Vzci9zaGFyZS9sbW9kL2xtb2QvbW9kdWxlZmlsZXMvQ29yZSIsCn0sCnN5c3RlbUJhc2VNUEFUSCA9ICIvc3cvdXNlci9tb2R1bGVzOi9zdy9zcGFjay9kZWx0YXMxMS0yMDIzLTAzL21vZHVsZXMvbG1vZC9Db3JlOi9vcHQvY3JheS9wZS9sbW9kL21vZHVsZWZpbGVzL2NyYXlwZS10YXJn
249
+ _ModuleTable008_=ZXRzL2RlZmF1bHQ6L29wdC9jcmF5L3BlL2xtb2QvbW9kdWxlZmlsZXMvY29yZTovb3B0L2NyYXkvbW9kdWxlZmlsZXM6L3N3L2V4dGVybmFsL2xtb2QvbW9kdWxlZmlsZXMvY29yZTovdXNyL3NoYXJlL2xtb2QvbG1vZC9tb2R1bGVmaWxlcy9Db3JlIiwKfQo=
250
+ _ModuleTable_Sz_=8
251
+ __Init_Default_Modules=1
252
+ __LMOD_REF_COUNT_CMAKE_PREFIX_PATH=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc:2;/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74:2;/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku:2
253
+ __LMOD_REF_COUNT_CPLUS_INCLUDE_PATH=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc/include:1;/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/include:1;/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/include:1
254
+ __LMOD_REF_COUNT_C_INCLUDE_PATH=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc/include:1;/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/include:1;/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/include:1
255
+ __LMOD_REF_COUNT_INCLUDE=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc/include:1;/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/include:1;/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/include:1
256
+ __LMOD_REF_COUNT_LD_LIBRARY_PATH=/sw/spack/delta-2022-03/apps/gcc/11.2.0-gcc-8.4.1-fxgnsyr/lib64:1;/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc/lib64:1;/opt/cray/libfabric/1.15.2.0/lib64:1;/opt/cray/libfabric/1.15.2.0/lib:1
257
+ __LMOD_REF_COUNT_LIBRARY_PATH=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc/lib64:1;/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/lib:1;/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/lib64:1;/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/lib:1
258
+ __LMOD_REF_COUNT_MANPATH=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/share/man:2;/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/share/man:2;/usr/share/lmod/lmod/share/man:1;/usr/local/share/man:1;/usr/share/man:1;/opt/ddn/ime/share/man:1;/opt/puppetlabs/puppet/share/man:1;:2
259
+ __LMOD_REF_COUNT_MODULEPATH=/sw/spack/deltas11-2023-03/modules/lmod/openmpi/4.1.6-lo6xae6/gcc/11.4.0:1;/sw/spack/deltas11-2023-03/modules/lmod/openmpi/4.1.6-lranp74/gcc/11.4.0:1;/sw/spack/deltas11-2023-03/modules/lmod/gcc/11.4.0:1;/sw/user/modules:1;/sw/spack/deltas11-2023-03/modules/lmod/Core:1;/opt/cray/pe/lmod/modulefiles/craype-targets/default:1;/opt/cray/pe/lmod/modulefiles/core:1;/opt/cray/modulefiles:1;/sw/external/lmod/modulefiles/core:1;/usr/share/lmod/lmod/modulefiles/Core:1
260
+ __LMOD_REF_COUNT_PATH=/sw/external/python/anaconda3_cpu/bin:1;/u/cmaduabuchi/.vscode-server/cli/servers/Stable-0f0d87fa9e96c856c5212fc86db137ac0d783365/server/bin/remote-cli:1;/sw/external/python/anaconda3/bin:1;/sw/external/python/anaconda3/condabin:1;/u/cmaduabuchi/.local/bin:1;/u/cmaduabuchi/bin:1;/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/cuda-11.8.0-vfixfmc/bin:2;/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/bin:2;/sw/spack/deltas11-2023-03/apps/linux-rhel8-x86_64/gcc-8.5.0/gcc-11.4.0-yycklku/bin:2;/sw/user/scripts:1;/usr/local/bin:1;/usr/bin:1;/usr/local/sbin:1;/usr/sbin:1;/opt/ddn/ime/bin:3;/opt/puppetlabs/bin:1;/u/cmaduabuchi/.vscode-server/extensions/ms-python.debugpy-2025.10.0-linux-x64/bundled/scripts/noConfigScripts:1;/u/cmaduabuchi/.vscode-server/data/User/globalStorage/github.copilot-chat/debugCommand:1
261
+ __LMOD_REF_COUNT_PKG_CONFIG_PATH=/sw/spack/deltas11-2023-03/apps/linux-rhel8-zen3/gcc-11.4.0/openmpi-4.1.6-lranp74/lib/pkgconfig:2
262
+ which_declare=declare -f
263
+
264
+ INFO 2025-10-06 06:35:10,389 trainer.py: 989: Setting up components: Model, loss, optim, meters etc.
265
+ INFO 2025-10-06 06:35:10,398 logger.py: 66: TensorBoard SummaryWriter instantiated. Files will be stored in: /work/nvme/bfgd/cmaduabuchi/MODELS/THRIVESEG/experiment/thermal_run1/tensorboard
266
+ INFO 2025-10-06 06:35:11,529 sam2.py: 81: Training with points (sampled from masks) as inputs with p=0.5
267
+ INFO 2025-10-06 06:35:11,532 trainer.py:1059: ====================
268
+ INFO 2025-10-06 06:35:11,532 trainer.py:1060: Summary for model <class 'training.model.sam2.SAM2Train'>
269
+ INFO 2025-10-06 06:35:11,534 trainer.py:1061: Model is SAM2Train(
270
+ (image_encoder): ImageEncoder(
271
+ (trunk): Hiera(
272
+ (patch_embed): PatchEmbed(
273
+ (proj): Conv2d(3, 112, kernel_size=(7, 7), stride=(4, 4), padding=(3, 3))
274
+ )
275
+ (blocks): ModuleList(
276
+ (0): MultiScaleBlock(
277
+ (norm1): LayerNorm((112,), eps=1e-06, elementwise_affine=True)
278
+ (attn): MultiScaleAttention(
279
+ (qkv): Linear(in_features=112, out_features=336, bias=True)
280
+ (proj): Linear(in_features=112, out_features=112, bias=True)
281
+ )
282
+ (drop_path): Identity()
283
+ (norm2): LayerNorm((112,), eps=1e-06, elementwise_affine=True)
284
+ (mlp): MLP(
285
+ (layers): ModuleList(
286
+ (0): Linear(in_features=112, out_features=448, bias=True)
287
+ (1): Linear(in_features=448, out_features=112, bias=True)
288
+ )
289
+ (act): GELU(approximate='none')
290
+ )
291
+ )
292
+ (1): MultiScaleBlock(
293
+ (norm1): LayerNorm((112,), eps=1e-06, elementwise_affine=True)
294
+ (attn): MultiScaleAttention(
295
+ (qkv): Linear(in_features=112, out_features=336, bias=True)
296
+ (proj): Linear(in_features=112, out_features=112, bias=True)
297
+ )
298
+ (drop_path): DropPath()
299
+ (norm2): LayerNorm((112,), eps=1e-06, elementwise_affine=True)
300
+ (mlp): MLP(
301
+ (layers): ModuleList(
302
+ (0): Linear(in_features=112, out_features=448, bias=True)
303
+ (1): Linear(in_features=448, out_features=112, bias=True)
304
+ )
305
+ (act): GELU(approximate='none')
306
+ )
307
+ )
308
+ (2): MultiScaleBlock(
309
+ (norm1): LayerNorm((112,), eps=1e-06, elementwise_affine=True)
310
+ (pool): MaxPool2d(kernel_size=(2, 2), stride=(2, 2), padding=0, dilation=1, ceil_mode=False)
311
+ (attn): MultiScaleAttention(
312
+ (q_pool): MaxPool2d(kernel_size=(2, 2), stride=(2, 2), padding=0, dilation=1, ceil_mode=False)
313
+ (qkv): Linear(in_features=112, out_features=672, bias=True)
314
+ (proj): Linear(in_features=224, out_features=224, bias=True)
315
+ )
316
+ (drop_path): DropPath()
317
+ (norm2): LayerNorm((224,), eps=1e-06, elementwise_affine=True)
318
+ (mlp): MLP(
319
+ (layers): ModuleList(
320
+ (0): Linear(in_features=224, out_features=896, bias=True)
321
+ (1): Linear(in_features=896, out_features=224, bias=True)
322
+ )
323
+ (act): GELU(approximate='none')
324
+ )
325
+ (proj): Linear(in_features=112, out_features=224, bias=True)
326
+ )
327
+ (3-4): 2 x MultiScaleBlock(
328
+ (norm1): LayerNorm((224,), eps=1e-06, elementwise_affine=True)
329
+ (attn): MultiScaleAttention(
330
+ (qkv): Linear(in_features=224, out_features=672, bias=True)
331
+ (proj): Linear(in_features=224, out_features=224, bias=True)
332
+ )
333
+ (drop_path): DropPath()
334
+ (norm2): LayerNorm((224,), eps=1e-06, elementwise_affine=True)
335
+ (mlp): MLP(
336
+ (layers): ModuleList(
337
+ (0): Linear(in_features=224, out_features=896, bias=True)
338
+ (1): Linear(in_features=896, out_features=224, bias=True)
339
+ )
340
+ (act): GELU(approximate='none')
341
+ )
342
+ )
343
+ (5): MultiScaleBlock(
344
+ (norm1): LayerNorm((224,), eps=1e-06, elementwise_affine=True)
345
+ (pool): MaxPool2d(kernel_size=(2, 2), stride=(2, 2), padding=0, dilation=1, ceil_mode=False)
346
+ (attn): MultiScaleAttention(
347
+ (q_pool): MaxPool2d(kernel_size=(2, 2), stride=(2, 2), padding=0, dilation=1, ceil_mode=False)
348
+ (qkv): Linear(in_features=224, out_features=1344, bias=True)
349
+ (proj): Linear(in_features=448, out_features=448, bias=True)
350
+ )
351
+ (drop_path): DropPath()
352
+ (norm2): LayerNorm((448,), eps=1e-06, elementwise_affine=True)
353
+ (mlp): MLP(
354
+ (layers): ModuleList(
355
+ (0): Linear(in_features=448, out_features=1792, bias=True)
356
+ (1): Linear(in_features=1792, out_features=448, bias=True)
357
+ )
358
+ (act): GELU(approximate='none')
359
+ )
360
+ (proj): Linear(in_features=224, out_features=448, bias=True)
361
+ )
362
+ (6-20): 15 x MultiScaleBlock(
363
+ (norm1): LayerNorm((448,), eps=1e-06, elementwise_affine=True)
364
+ (attn): MultiScaleAttention(
365
+ (qkv): Linear(in_features=448, out_features=1344, bias=True)
366
+ (proj): Linear(in_features=448, out_features=448, bias=True)
367
+ )
368
+ (drop_path): DropPath()
369
+ (norm2): LayerNorm((448,), eps=1e-06, elementwise_affine=True)
370
+ (mlp): MLP(
371
+ (layers): ModuleList(
372
+ (0): Linear(in_features=448, out_features=1792, bias=True)
373
+ (1): Linear(in_features=1792, out_features=448, bias=True)
374
+ )
375
+ (act): GELU(approximate='none')
376
+ )
377
+ )
378
+ (21): MultiScaleBlock(
379
+ (norm1): LayerNorm((448,), eps=1e-06, elementwise_affine=True)
380
+ (pool): MaxPool2d(kernel_size=(2, 2), stride=(2, 2), padding=0, dilation=1, ceil_mode=False)
381
+ (attn): MultiScaleAttention(
382
+ (q_pool): MaxPool2d(kernel_size=(2, 2), stride=(2, 2), padding=0, dilation=1, ceil_mode=False)
383
+ (qkv): Linear(in_features=448, out_features=2688, bias=True)
384
+ (proj): Linear(in_features=896, out_features=896, bias=True)
385
+ )
386
+ (drop_path): DropPath()
387
+ (norm2): LayerNorm((896,), eps=1e-06, elementwise_affine=True)
388
+ (mlp): MLP(
389
+ (layers): ModuleList(
390
+ (0): Linear(in_features=896, out_features=3584, bias=True)
391
+ (1): Linear(in_features=3584, out_features=896, bias=True)
392
+ )
393
+ (act): GELU(approximate='none')
394
+ )
395
+ (proj): Linear(in_features=448, out_features=896, bias=True)
396
+ )
397
+ (22-23): 2 x MultiScaleBlock(
398
+ (norm1): LayerNorm((896,), eps=1e-06, elementwise_affine=True)
399
+ (attn): MultiScaleAttention(
400
+ (qkv): Linear(in_features=896, out_features=2688, bias=True)
401
+ (proj): Linear(in_features=896, out_features=896, bias=True)
402
+ )
403
+ (drop_path): DropPath()
404
+ (norm2): LayerNorm((896,), eps=1e-06, elementwise_affine=True)
405
+ (mlp): MLP(
406
+ (layers): ModuleList(
407
+ (0): Linear(in_features=896, out_features=3584, bias=True)
408
+ (1): Linear(in_features=3584, out_features=896, bias=True)
409
+ )
410
+ (act): GELU(approximate='none')
411
+ )
412
+ )
413
+ )
414
+ )
415
+ (neck): FpnNeck(
416
+ (position_encoding): PositionEmbeddingSine()
417
+ (convs): ModuleList(
418
+ (0): Sequential(
419
+ (conv): Conv2d(896, 256, kernel_size=(1, 1), stride=(1, 1))
420
+ )
421
+ (1): Sequential(
422
+ (conv): Conv2d(448, 256, kernel_size=(1, 1), stride=(1, 1))
423
+ )
424
+ (2): Sequential(
425
+ (conv): Conv2d(224, 256, kernel_size=(1, 1), stride=(1, 1))
426
+ )
427
+ (3): Sequential(
428
+ (conv): Conv2d(112, 256, kernel_size=(1, 1), stride=(1, 1))
429
+ )
430
+ )
431
+ )
432
+ )
433
+ (mask_downsample): Conv2d(1, 1, kernel_size=(4, 4), stride=(4, 4))
434
+ (memory_attention): MemoryAttention(
435
+ (layers): ModuleList(
436
+ (0-3): 4 x MemoryAttentionLayer(
437
+ (self_attn): RoPEAttention(
438
+ (q_proj): Linear(in_features=256, out_features=256, bias=True)
439
+ (k_proj): Linear(in_features=256, out_features=256, bias=True)
440
+ (v_proj): Linear(in_features=256, out_features=256, bias=True)
441
+ (out_proj): Linear(in_features=256, out_features=256, bias=True)
442
+ )
443
+ (cross_attn_image): RoPEAttention(
444
+ (q_proj): Linear(in_features=256, out_features=256, bias=True)
445
+ (k_proj): Linear(in_features=64, out_features=256, bias=True)
446
+ (v_proj): Linear(in_features=64, out_features=256, bias=True)
447
+ (out_proj): Linear(in_features=256, out_features=256, bias=True)
448
+ )
449
+ (linear1): Linear(in_features=256, out_features=2048, bias=True)
450
+ (dropout): Dropout(p=0.1, inplace=False)
451
+ (linear2): Linear(in_features=2048, out_features=256, bias=True)
452
+ (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
453
+ (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
454
+ (norm3): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
455
+ (dropout1): Dropout(p=0.1, inplace=False)
456
+ (dropout2): Dropout(p=0.1, inplace=False)
457
+ (dropout3): Dropout(p=0.1, inplace=False)
458
+ )
459
+ )
460
+ (norm): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
461
+ )
462
+ (memory_encoder): MemoryEncoder(
463
+ (mask_downsampler): MaskDownSampler(
464
+ (encoder): Sequential(
465
+ (0): Conv2d(1, 4, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1))
466
+ (1): LayerNorm2d()
467
+ (2): GELU(approximate='none')
468
+ (3): Conv2d(4, 16, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1))
469
+ (4): LayerNorm2d()
470
+ (5): GELU(approximate='none')
471
+ (6): Conv2d(16, 64, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1))
472
+ (7): LayerNorm2d()
473
+ (8): GELU(approximate='none')
474
+ (9): Conv2d(64, 256, kernel_size=(3, 3), stride=(2, 2), padding=(1, 1))
475
+ (10): LayerNorm2d()
476
+ (11): GELU(approximate='none')
477
+ (12): Conv2d(256, 256, kernel_size=(1, 1), stride=(1, 1))
478
+ )
479
+ )
480
+ (pix_feat_proj): Conv2d(256, 256, kernel_size=(1, 1), stride=(1, 1))
481
+ (fuser): Fuser(
482
+ (proj): Identity()
483
+ (layers): ModuleList(
484
+ (0-1): 2 x CXBlock(
485
+ (dwconv): Conv2d(256, 256, kernel_size=(7, 7), stride=(1, 1), padding=(3, 3), groups=256)
486
+ (norm): LayerNorm2d()
487
+ (pwconv1): Linear(in_features=256, out_features=1024, bias=True)
488
+ (act): GELU(approximate='none')
489
+ (pwconv2): Linear(in_features=1024, out_features=256, bias=True)
490
+ (drop_path): Identity()
491
+ )
492
+ )
493
+ )
494
+ (position_encoding): PositionEmbeddingSine()
495
+ (out_proj): Conv2d(256, 64, kernel_size=(1, 1), stride=(1, 1))
496
+ )
497
+ (sam_prompt_encoder): PromptEncoder(
498
+ (pe_layer): PositionEmbeddingRandom()
499
+ (point_embeddings): ModuleList(
500
+ (0-3): 4 x Embedding(1, 256)
501
+ )
502
+ (not_a_point_embed): Embedding(1, 256)
503
+ (mask_downscaling): Sequential(
504
+ (0): Conv2d(1, 4, kernel_size=(2, 2), stride=(2, 2))
505
+ (1): LayerNorm2d()
506
+ (2): GELU(approximate='none')
507
+ (3): Conv2d(4, 16, kernel_size=(2, 2), stride=(2, 2))
508
+ (4): LayerNorm2d()
509
+ (5): GELU(approximate='none')
510
+ (6): Conv2d(16, 256, kernel_size=(1, 1), stride=(1, 1))
511
+ )
512
+ (no_mask_embed): Embedding(1, 256)
513
+ )
514
+ (sam_mask_decoder): MaskDecoder(
515
+ (transformer): TwoWayTransformer(
516
+ (layers): ModuleList(
517
+ (0-1): 2 x TwoWayAttentionBlock(
518
+ (self_attn): Attention(
519
+ (q_proj): Linear(in_features=256, out_features=256, bias=True)
520
+ (k_proj): Linear(in_features=256, out_features=256, bias=True)
521
+ (v_proj): Linear(in_features=256, out_features=256, bias=True)
522
+ (out_proj): Linear(in_features=256, out_features=256, bias=True)
523
+ )
524
+ (norm1): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
525
+ (cross_attn_token_to_image): Attention(
526
+ (q_proj): Linear(in_features=256, out_features=128, bias=True)
527
+ (k_proj): Linear(in_features=256, out_features=128, bias=True)
528
+ (v_proj): Linear(in_features=256, out_features=128, bias=True)
529
+ (out_proj): Linear(in_features=128, out_features=256, bias=True)
530
+ )
531
+ (norm2): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
532
+ (mlp): MLP(
533
+ (layers): ModuleList(
534
+ (0): Linear(in_features=256, out_features=2048, bias=True)
535
+ (1): Linear(in_features=2048, out_features=256, bias=True)
536
+ )
537
+ (act): ReLU()
538
+ )
539
+ (norm3): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
540
+ (norm4): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
541
+ (cross_attn_image_to_token): Attention(
542
+ (q_proj): Linear(in_features=256, out_features=128, bias=True)
543
+ (k_proj): Linear(in_features=256, out_features=128, bias=True)
544
+ (v_proj): Linear(in_features=256, out_features=128, bias=True)
545
+ (out_proj): Linear(in_features=128, out_features=256, bias=True)
546
+ )
547
+ )
548
+ )
549
+ (final_attn_token_to_image): Attention(
550
+ (q_proj): Linear(in_features=256, out_features=128, bias=True)
551
+ (k_proj): Linear(in_features=256, out_features=128, bias=True)
552
+ (v_proj): Linear(in_features=256, out_features=128, bias=True)
553
+ (out_proj): Linear(in_features=128, out_features=256, bias=True)
554
+ )
555
+ (norm_final_attn): LayerNorm((256,), eps=1e-05, elementwise_affine=True)
556
+ )
557
+ (iou_token): Embedding(1, 256)
558
+ (mask_tokens): Embedding(4, 256)
559
+ (obj_score_token): Embedding(1, 256)
560
+ (output_upscaling): Sequential(
561
+ (0): ConvTranspose2d(256, 64, kernel_size=(2, 2), stride=(2, 2))
562
+ (1): LayerNorm2d()
563
+ (2): GELU(approximate='none')
564
+ (3): ConvTranspose2d(64, 32, kernel_size=(2, 2), stride=(2, 2))
565
+ (4): GELU(approximate='none')
566
+ )
567
+ (conv_s0): Conv2d(256, 32, kernel_size=(1, 1), stride=(1, 1))
568
+ (conv_s1): Conv2d(256, 64, kernel_size=(1, 1), stride=(1, 1))
569
+ (output_hypernetworks_mlps): ModuleList(
570
+ (0-3): 4 x MLP(
571
+ (layers): ModuleList(
572
+ (0-1): 2 x Linear(in_features=256, out_features=256, bias=True)
573
+ (2): Linear(in_features=256, out_features=32, bias=True)
574
+ )
575
+ (act): ReLU()
576
+ )
577
+ )
578
+ (iou_prediction_head): MLP(
579
+ (layers): ModuleList(
580
+ (0-1): 2 x Linear(in_features=256, out_features=256, bias=True)
581
+ (2): Linear(in_features=256, out_features=4, bias=True)
582
+ )
583
+ (act): ReLU()
584
+ )
585
+ (pred_obj_score_head): MLP(
586
+ (layers): ModuleList(
587
+ (0-1): 2 x Linear(in_features=256, out_features=256, bias=True)
588
+ (2): Linear(in_features=256, out_features=1, bias=True)
589
+ )
590
+ (act): ReLU()
591
+ )
592
+ )
593
+ (obj_ptr_proj): MLP(
594
+ (layers): ModuleList(
595
+ (0-2): 3 x Linear(in_features=256, out_features=256, bias=True)
596
+ )
597
+ (act): ReLU()
598
+ )
599
+ (obj_ptr_tpos_proj): Linear(in_features=256, out_features=64, bias=True)
600
+ )
601
+ INFO 2025-10-06 06:35:11,535 trainer.py:1062: Total parameters 80.9 M
602
+ INFO 2025-10-06 06:35:11,535 trainer.py:1063: Trainable parameters 80.9 M
603
+ INFO 2025-10-06 06:35:11,535 trainer.py:1066: Non-Trainable parameters 0
604
+ INFO 2025-10-06 06:35:11,535 trainer.py:1069: ====================
605
+ INFO 2025-10-06 06:35:11,540 trainer.py:1023: Finished setting up components: Model, loss, optim, meters etc.
606
+ INFO 2025-10-06 06:35:11,540 trainer.py: 314: Moving components to device cuda:0 and local rank 0.
607
+ INFO 2025-10-06 06:35:11,614 trainer.py: 320: Done moving components to device cuda:0 and local rank 0.
608
+ INFO 2025-10-06 06:35:11,631 optimizer.py: 248: Matches for param_name [image_encoder.*]: {'image_encoder.trunk.blocks.3.mlp.layers.0.bias', 'image_encoder.neck.convs.0.conv.weight', 'image_encoder.trunk.blocks.19.mlp.layers.1.bias', 'image_encoder.trunk.blocks.18.mlp.layers.0.weight', 'image_encoder.trunk.blocks.21.attn.proj.weight', 'image_encoder.trunk.blocks.15.attn.qkv.bias', 'image_encoder.trunk.blocks.21.mlp.layers.0.bias', 'image_encoder.trunk.blocks.9.norm1.bias', 'image_encoder.neck.convs.2.conv.weight', 'image_encoder.trunk.blocks.2.norm1.bias', 'image_encoder.trunk.blocks.5.attn.proj.weight', 'image_encoder.trunk.blocks.16.norm2.weight', 'image_encoder.trunk.blocks.0.mlp.layers.1.weight', 'image_encoder.trunk.blocks.4.norm1.weight', 'image_encoder.trunk.blocks.13.mlp.layers.1.weight', 'image_encoder.trunk.blocks.8.norm1.bias', 'image_encoder.trunk.blocks.19.attn.proj.bias', 'image_encoder.trunk.blocks.2.norm2.bias', 'image_encoder.trunk.blocks.19.norm1.weight', 'image_encoder.trunk.blocks.5.attn.qkv.bias', 'image_encoder.trunk.blocks.22.attn.qkv.bias', 'image_encoder.trunk.blocks.13.attn.proj.weight', 'image_encoder.trunk.blocks.19.mlp.layers.1.weight', 'image_encoder.trunk.blocks.1.norm1.weight', 'image_encoder.trunk.blocks.10.mlp.layers.0.bias', 'image_encoder.trunk.blocks.8.mlp.layers.1.bias', 'image_encoder.trunk.blocks.21.proj.bias', 'image_encoder.trunk.blocks.2.norm2.weight', 'image_encoder.trunk.blocks.5.norm2.weight', 'image_encoder.trunk.blocks.2.attn.proj.weight', 'image_encoder.trunk.blocks.11.mlp.layers.0.weight', 'image_encoder.trunk.blocks.1.attn.qkv.bias', 'image_encoder.trunk.blocks.12.mlp.layers.0.weight', 'image_encoder.trunk.blocks.16.norm1.bias', 'image_encoder.trunk.blocks.0.norm2.bias', 'image_encoder.trunk.blocks.10.norm1.bias', 'image_encoder.trunk.blocks.1.mlp.layers.0.weight', 'image_encoder.trunk.blocks.14.mlp.layers.1.bias', 'image_encoder.trunk.blocks.19.norm2.bias', 'image_encoder.trunk.blocks.14.norm1.bias', 
'image_encoder.trunk.blocks.20.attn.qkv.bias', 'image_encoder.trunk.blocks.6.attn.qkv.weight', 'image_encoder.trunk.blocks.12.norm2.weight', 'image_encoder.trunk.blocks.21.mlp.layers.0.weight', 'image_encoder.trunk.blocks.18.mlp.layers.0.bias', 'image_encoder.trunk.blocks.1.mlp.layers.0.bias', 'image_encoder.trunk.blocks.23.norm2.bias', 'image_encoder.trunk.blocks.4.norm2.weight', 'image_encoder.trunk.blocks.9.attn.proj.weight', 'image_encoder.trunk.blocks.23.attn.qkv.weight', 'image_encoder.trunk.blocks.17.norm1.weight', 'image_encoder.trunk.blocks.17.mlp.layers.0.bias', 'image_encoder.trunk.blocks.6.mlp.layers.0.bias', 'image_encoder.trunk.blocks.1.attn.proj.weight', 'image_encoder.neck.convs.0.conv.bias', 'image_encoder.trunk.blocks.3.attn.proj.bias', 'image_encoder.trunk.blocks.15.norm1.bias', 'image_encoder.trunk.blocks.7.attn.proj.weight', 'image_encoder.trunk.blocks.14.attn.proj.weight', 'image_encoder.trunk.blocks.23.norm1.bias', 'image_encoder.trunk.blocks.3.attn.qkv.bias', 'image_encoder.trunk.blocks.0.attn.proj.weight', 'image_encoder.trunk.blocks.22.norm2.weight', 'image_encoder.trunk.blocks.7.norm1.bias', 'image_encoder.trunk.blocks.12.mlp.layers.0.bias', 'image_encoder.trunk.blocks.22.norm1.weight', 'image_encoder.trunk.blocks.15.mlp.layers.0.bias', 'image_encoder.trunk.blocks.6.mlp.layers.1.bias', 'image_encoder.trunk.blocks.11.mlp.layers.0.bias', 'image_encoder.trunk.blocks.12.mlp.layers.1.weight', 'image_encoder.trunk.blocks.6.attn.qkv.bias', 'image_encoder.trunk.blocks.6.norm2.weight', 'image_encoder.trunk.blocks.14.norm2.weight', 'image_encoder.trunk.blocks.0.norm2.weight', 'image_encoder.trunk.blocks.3.norm1.bias', 'image_encoder.trunk.blocks.18.attn.proj.weight', 'image_encoder.trunk.blocks.23.norm2.weight', 'image_encoder.trunk.blocks.16.attn.proj.weight', 'image_encoder.trunk.blocks.22.attn.proj.weight', 'image_encoder.trunk.blocks.10.mlp.layers.1.bias', 'image_encoder.trunk.blocks.2.norm1.weight', 
'image_encoder.trunk.blocks.13.attn.proj.bias', 'image_encoder.trunk.blocks.22.mlp.layers.0.weight', 'image_encoder.trunk.blocks.4.mlp.layers.1.weight', 'image_encoder.trunk.blocks.14.norm1.weight', 'image_encoder.trunk.blocks.1.attn.qkv.weight', 'image_encoder.trunk.blocks.1.attn.proj.bias', 'image_encoder.trunk.blocks.0.attn.proj.bias', 'image_encoder.trunk.blocks.13.norm1.bias', 'image_encoder.trunk.blocks.12.norm2.bias', 'image_encoder.neck.convs.1.conv.weight', 'image_encoder.neck.convs.2.conv.bias', 'image_encoder.trunk.blocks.4.norm2.bias', 'image_encoder.trunk.blocks.22.attn.qkv.weight', 'image_encoder.trunk.blocks.21.proj.weight', 'image_encoder.trunk.blocks.18.mlp.layers.1.bias', 'image_encoder.trunk.blocks.10.norm2.weight', 'image_encoder.trunk.blocks.19.attn.qkv.weight', 'image_encoder.trunk.blocks.9.norm2.weight', 'image_encoder.trunk.blocks.10.norm2.bias', 'image_encoder.trunk.blocks.5.proj.weight', 'image_encoder.trunk.blocks.17.norm2.bias', 'image_encoder.trunk.blocks.17.attn.proj.bias', 'image_encoder.trunk.blocks.5.mlp.layers.0.bias', 'image_encoder.trunk.blocks.15.norm2.bias', 'image_encoder.trunk.blocks.21.norm2.bias', 'image_encoder.trunk.blocks.6.norm1.bias', 'image_encoder.trunk.blocks.20.mlp.layers.0.weight', 'image_encoder.trunk.blocks.0.mlp.layers.0.bias', 'image_encoder.trunk.blocks.20.mlp.layers.1.bias', 'image_encoder.trunk.blocks.4.attn.proj.bias', 'image_encoder.trunk.blocks.18.attn.qkv.weight', 'image_encoder.trunk.blocks.21.mlp.layers.1.weight', 'image_encoder.trunk.blocks.11.attn.proj.weight', 'image_encoder.trunk.blocks.8.attn.qkv.bias', 'image_encoder.trunk.blocks.21.norm1.bias', 'image_encoder.trunk.blocks.16.mlp.layers.0.weight', 'image_encoder.trunk.blocks.2.mlp.layers.1.weight', 'image_encoder.neck.convs.3.conv.bias', 'image_encoder.trunk.blocks.1.mlp.layers.1.bias', 'image_encoder.trunk.blocks.5.norm2.bias', 'image_encoder.trunk.blocks.11.norm1.weight', 'image_encoder.trunk.blocks.3.mlp.layers.1.weight', 
'image_encoder.trunk.blocks.18.norm1.bias', 'image_encoder.trunk.blocks.8.norm1.weight', 'image_encoder.trunk.blocks.15.attn.proj.weight', 'image_encoder.trunk.blocks.3.attn.proj.weight', 'image_encoder.trunk.blocks.23.attn.qkv.bias', 'image_encoder.trunk.blocks.2.mlp.layers.1.bias', 'image_encoder.trunk.blocks.23.mlp.layers.0.weight', 'image_encoder.trunk.blocks.0.attn.qkv.weight', 'image_encoder.trunk.blocks.23.attn.proj.bias', 'image_encoder.trunk.blocks.4.norm1.bias', 'image_encoder.trunk.blocks.22.norm1.bias', 'image_encoder.trunk.blocks.14.norm2.bias', 'image_encoder.trunk.blocks.9.mlp.layers.1.weight', 'image_encoder.trunk.blocks.9.norm2.bias', 'image_encoder.trunk.blocks.12.norm1.bias', 'image_encoder.trunk.blocks.10.norm1.weight', 'image_encoder.trunk.blocks.18.mlp.layers.1.weight', 'image_encoder.trunk.blocks.6.mlp.layers.1.weight', 'image_encoder.trunk.blocks.2.attn.qkv.bias', 'image_encoder.trunk.blocks.21.attn.qkv.bias', 'image_encoder.trunk.blocks.2.proj.weight', 'image_encoder.trunk.blocks.12.attn.qkv.bias', 'image_encoder.trunk.blocks.7.attn.qkv.bias', 'image_encoder.trunk.blocks.10.attn.qkv.bias', 'image_encoder.trunk.blocks.9.mlp.layers.0.bias', 'image_encoder.trunk.blocks.9.norm1.weight', 'image_encoder.trunk.blocks.17.attn.qkv.bias', 'image_encoder.trunk.blocks.14.mlp.layers.0.weight', 'image_encoder.trunk.blocks.16.mlp.layers.1.weight', 'image_encoder.trunk.blocks.3.attn.qkv.weight', 'image_encoder.trunk.blocks.15.norm1.weight', 'image_encoder.trunk.blocks.16.attn.proj.bias', 'image_encoder.trunk.blocks.22.attn.proj.bias', 'image_encoder.trunk.blocks.0.norm1.bias', 'image_encoder.trunk.blocks.8.attn.qkv.weight', 'image_encoder.trunk.blocks.7.mlp.layers.1.weight', 'image_encoder.trunk.blocks.20.norm2.bias', 'image_encoder.trunk.blocks.5.attn.qkv.weight', 'image_encoder.trunk.blocks.20.mlp.layers.1.weight', 'image_encoder.trunk.blocks.5.mlp.layers.1.bias', 'image_encoder.trunk.blocks.17.norm1.bias', 
'image_encoder.trunk.blocks.15.mlp.layers.0.weight', 'image_encoder.trunk.blocks.8.mlp.layers.0.bias', 'image_encoder.trunk.blocks.8.mlp.layers.0.weight', 'image_encoder.trunk.blocks.21.attn.qkv.weight', 'image_encoder.trunk.blocks.15.attn.proj.bias', 'image_encoder.trunk.blocks.19.norm1.bias', 'image_encoder.trunk.blocks.17.mlp.layers.1.weight', 'image_encoder.trunk.blocks.9.attn.qkv.bias', 'image_encoder.trunk.blocks.13.attn.qkv.weight', 'image_encoder.trunk.blocks.6.norm1.weight', 'image_encoder.trunk.blocks.16.attn.qkv.weight', 'image_encoder.trunk.blocks.11.mlp.layers.1.weight', 'image_encoder.trunk.pos_embed_window', 'image_encoder.trunk.blocks.7.mlp.layers.1.bias', 'image_encoder.trunk.blocks.13.mlp.layers.0.bias', 'image_encoder.trunk.blocks.23.attn.proj.weight', 'image_encoder.trunk.blocks.14.attn.proj.bias', 'image_encoder.trunk.blocks.20.attn.proj.weight', 'image_encoder.trunk.blocks.2.mlp.layers.0.bias', 'image_encoder.trunk.blocks.23.mlp.layers.0.bias', 'image_encoder.trunk.blocks.5.mlp.layers.1.weight', 'image_encoder.trunk.blocks.0.norm1.weight', 'image_encoder.trunk.blocks.16.norm2.bias', 'image_encoder.trunk.blocks.10.attn.proj.bias', 'image_encoder.trunk.blocks.3.norm1.weight', 'image_encoder.neck.convs.1.conv.bias', 'image_encoder.trunk.blocks.18.norm2.bias', 'image_encoder.trunk.blocks.19.attn.qkv.bias', 'image_encoder.trunk.blocks.13.norm1.weight', 'image_encoder.trunk.blocks.8.attn.proj.weight', 'image_encoder.trunk.blocks.21.norm2.weight', 'image_encoder.trunk.blocks.12.norm1.weight', 'image_encoder.trunk.blocks.7.norm1.weight', 'image_encoder.trunk.blocks.17.attn.proj.weight', 'image_encoder.trunk.blocks.6.norm2.bias', 'image_encoder.trunk.blocks.18.norm1.weight', 'image_encoder.trunk.blocks.4.mlp.layers.0.bias', 'image_encoder.trunk.blocks.5.proj.bias', 'image_encoder.trunk.blocks.19.mlp.layers.0.bias', 'image_encoder.trunk.blocks.2.attn.qkv.weight', 'image_encoder.trunk.blocks.8.attn.proj.bias', 'image_encoder.trunk.blocks.1.norm2.weight', 
'image_encoder.trunk.patch_embed.proj.weight', 'image_encoder.trunk.blocks.23.mlp.layers.1.weight', 'image_encoder.trunk.blocks.11.attn.qkv.weight', 'image_encoder.trunk.blocks.14.attn.qkv.bias', 'image_encoder.trunk.blocks.9.mlp.layers.1.bias', 'image_encoder.trunk.blocks.13.norm2.bias', 'image_encoder.trunk.blocks.4.attn.qkv.weight', 'image_encoder.trunk.blocks.6.attn.proj.weight', 'image_encoder.trunk.blocks.9.attn.proj.bias', 'image_encoder.trunk.blocks.11.attn.qkv.bias', 'image_encoder.trunk.blocks.22.mlp.layers.1.bias', 'image_encoder.trunk.blocks.15.mlp.layers.1.bias', 'image_encoder.trunk.blocks.17.mlp.layers.1.bias', 'image_encoder.trunk.blocks.20.norm2.weight', 'image_encoder.trunk.blocks.12.attn.proj.bias', 'image_encoder.trunk.blocks.1.norm1.bias', 'image_encoder.trunk.blocks.23.norm1.weight', 'image_encoder.trunk.blocks.16.mlp.layers.1.bias', 'image_encoder.trunk.blocks.16.norm1.weight', 'image_encoder.trunk.blocks.18.attn.qkv.bias', 'image_encoder.trunk.blocks.11.norm1.bias', 'image_encoder.trunk.blocks.7.mlp.layers.0.bias', 'image_encoder.trunk.blocks.21.mlp.layers.1.bias', 'image_encoder.trunk.blocks.14.attn.qkv.weight', 'image_encoder.trunk.blocks.5.mlp.layers.0.weight', 'image_encoder.trunk.blocks.21.attn.proj.bias', 'image_encoder.trunk.blocks.11.norm2.weight', 'image_encoder.trunk.blocks.13.mlp.layers.0.weight', 'image_encoder.trunk.blocks.17.mlp.layers.0.weight', 'image_encoder.trunk.blocks.3.mlp.layers.1.bias', 'image_encoder.trunk.blocks.22.mlp.layers.1.weight', 'image_encoder.trunk.blocks.7.attn.proj.bias', 'image_encoder.trunk.blocks.16.attn.qkv.bias', 'image_encoder.trunk.blocks.2.proj.bias', 'image_encoder.trunk.blocks.5.norm1.weight', 'image_encoder.trunk.blocks.4.mlp.layers.1.bias', 'image_encoder.trunk.blocks.23.mlp.layers.1.bias', 'image_encoder.trunk.blocks.0.attn.qkv.bias', 'image_encoder.trunk.blocks.10.attn.proj.weight', 'image_encoder.trunk.blocks.1.norm2.bias', 'image_encoder.trunk.blocks.14.mlp.layers.0.bias', 
'image_encoder.trunk.blocks.8.norm2.weight', 'image_encoder.trunk.blocks.8.mlp.layers.1.weight', 'image_encoder.trunk.blocks.11.norm2.bias', 'image_encoder.trunk.blocks.18.attn.proj.bias', 'image_encoder.trunk.blocks.13.mlp.layers.1.bias', 'image_encoder.trunk.blocks.2.mlp.layers.0.weight', 'image_encoder.trunk.blocks.15.mlp.layers.1.weight', 'image_encoder.trunk.blocks.20.norm1.bias', 'image_encoder.trunk.blocks.20.mlp.layers.0.bias', 'image_encoder.trunk.blocks.2.attn.proj.bias', 'image_encoder.trunk.blocks.20.attn.proj.bias', 'image_encoder.trunk.blocks.13.norm2.weight', 'image_encoder.trunk.blocks.19.mlp.layers.0.weight', 'image_encoder.trunk.blocks.7.attn.qkv.weight', 'image_encoder.trunk.blocks.3.norm2.bias', 'image_encoder.trunk.blocks.12.mlp.layers.1.bias', 'image_encoder.trunk.blocks.22.norm2.bias', 'image_encoder.trunk.blocks.17.attn.qkv.weight', 'image_encoder.trunk.blocks.7.norm2.weight', 'image_encoder.trunk.blocks.1.mlp.layers.1.weight', 'image_encoder.trunk.blocks.7.norm2.bias', 'image_encoder.trunk.blocks.15.norm2.weight', 'image_encoder.trunk.blocks.9.mlp.layers.0.weight', 'image_encoder.trunk.patch_embed.proj.bias', 'image_encoder.trunk.blocks.5.attn.proj.bias', 'image_encoder.trunk.blocks.20.attn.qkv.weight', 'image_encoder.trunk.blocks.6.attn.proj.bias', 'image_encoder.trunk.blocks.4.attn.qkv.bias', 'image_encoder.trunk.pos_embed', 'image_encoder.neck.convs.3.conv.weight', 'image_encoder.trunk.blocks.0.mlp.layers.0.weight', 'image_encoder.trunk.blocks.7.mlp.layers.0.weight', 'image_encoder.trunk.blocks.12.attn.qkv.weight', 'image_encoder.trunk.blocks.17.norm2.weight', 'image_encoder.trunk.blocks.3.mlp.layers.0.weight', 'image_encoder.trunk.blocks.4.attn.proj.weight', 'image_encoder.trunk.blocks.6.mlp.layers.0.weight', 'image_encoder.trunk.blocks.22.mlp.layers.0.bias', 'image_encoder.trunk.blocks.13.attn.qkv.bias', 'image_encoder.trunk.blocks.14.mlp.layers.1.weight', 'image_encoder.trunk.blocks.4.mlp.layers.0.weight', 
'image_encoder.trunk.blocks.11.mlp.layers.1.bias', 'image_encoder.trunk.blocks.16.mlp.layers.0.bias', 'image_encoder.trunk.blocks.3.norm2.weight', 'image_encoder.trunk.blocks.19.norm2.weight', 'image_encoder.trunk.blocks.5.norm1.bias', 'image_encoder.trunk.blocks.20.norm1.weight', 'image_encoder.trunk.blocks.8.norm2.bias', 'image_encoder.trunk.blocks.19.attn.proj.weight', 'image_encoder.trunk.blocks.9.attn.qkv.weight', 'image_encoder.trunk.blocks.11.attn.proj.bias', 'image_encoder.trunk.blocks.0.mlp.layers.1.bias', 'image_encoder.trunk.blocks.21.norm1.weight', 'image_encoder.trunk.blocks.10.mlp.layers.1.weight', 'image_encoder.trunk.blocks.15.attn.qkv.weight', 'image_encoder.trunk.blocks.18.norm2.weight', 'image_encoder.trunk.blocks.10.attn.qkv.weight', 'image_encoder.trunk.blocks.10.mlp.layers.0.weight', 'image_encoder.trunk.blocks.12.attn.proj.weight'}
609
+ INFO 2025-10-06 06:35:11,632 optimizer.py: 248: Matches for param_name [*bias*]: {'image_encoder.trunk.blocks.3.mlp.layers.0.bias', 'memory_attention.layers.1.linear1.bias', 'image_encoder.trunk.blocks.19.mlp.layers.1.bias', 'memory_attention.layers.3.self_attn.out_proj.bias', 'memory_attention.layers.0.cross_attn_image.out_proj.bias', 'obj_ptr_proj.layers.0.bias', 'sam_mask_decoder.transformer.final_attn_token_to_image.out_proj.bias', 'sam_mask_decoder.pred_obj_score_head.layers.1.bias', 'image_encoder.trunk.blocks.15.attn.qkv.bias', 'image_encoder.trunk.blocks.21.mlp.layers.0.bias', 'sam_mask_decoder.transformer.layers.1.cross_attn_image_to_token.out_proj.bias', 'memory_attention.layers.3.norm3.bias', 'image_encoder.trunk.blocks.9.norm1.bias', 'image_encoder.trunk.blocks.2.norm1.bias', 'image_encoder.trunk.blocks.19.attn.proj.bias', 'image_encoder.trunk.blocks.2.norm2.bias', 'sam_mask_decoder.transformer.layers.0.mlp.layers.0.bias', 'image_encoder.trunk.blocks.8.norm1.bias', 'memory_attention.layers.2.linear1.bias', 'image_encoder.trunk.blocks.5.attn.qkv.bias', 'image_encoder.trunk.blocks.22.attn.qkv.bias', 'sam_mask_decoder.iou_prediction_head.layers.2.bias', 'sam_mask_decoder.transformer.layers.0.self_attn.k_proj.bias', 'image_encoder.trunk.blocks.10.mlp.layers.0.bias', 'memory_attention.layers.3.cross_attn_image.q_proj.bias', 'image_encoder.trunk.blocks.8.mlp.layers.1.bias', 'image_encoder.trunk.blocks.21.proj.bias', 'memory_attention.layers.0.linear2.bias', 'sam_mask_decoder.transformer.layers.1.norm3.bias', 'sam_mask_decoder.transformer.layers.0.mlp.layers.1.bias', 'image_encoder.trunk.blocks.1.attn.qkv.bias', 'sam_mask_decoder.transformer.final_attn_token_to_image.q_proj.bias', 'sam_mask_decoder.transformer.layers.1.mlp.layers.1.bias', 'image_encoder.trunk.blocks.10.norm1.bias', 'image_encoder.trunk.blocks.16.norm1.bias', 'image_encoder.trunk.blocks.0.norm2.bias', 'image_encoder.trunk.blocks.14.mlp.layers.1.bias', 
'memory_attention.layers.3.self_attn.q_proj.bias', 'image_encoder.trunk.blocks.19.norm2.bias', 'sam_mask_decoder.transformer.layers.0.norm3.bias', 'image_encoder.trunk.blocks.14.norm1.bias', 'image_encoder.trunk.blocks.20.attn.qkv.bias', 'sam_mask_decoder.transformer.norm_final_attn.bias', 'image_encoder.trunk.blocks.18.mlp.layers.0.bias', 'memory_attention.layers.1.cross_attn_image.q_proj.bias', 'image_encoder.trunk.blocks.1.mlp.layers.0.bias', 'image_encoder.trunk.blocks.23.norm2.bias', 'memory_attention.layers.1.self_attn.q_proj.bias', 'memory_attention.layers.0.self_attn.k_proj.bias', 'memory_encoder.mask_downsampler.encoder.10.bias', 'memory_attention.layers.2.cross_attn_image.q_proj.bias', 'image_encoder.trunk.blocks.17.mlp.layers.0.bias', 'memory_attention.layers.1.self_attn.k_proj.bias', 'image_encoder.trunk.blocks.6.mlp.layers.0.bias', 'memory_attention.layers.3.cross_attn_image.out_proj.bias', 'image_encoder.neck.convs.0.conv.bias', 'sam_mask_decoder.output_upscaling.0.bias', 'image_encoder.trunk.blocks.3.attn.proj.bias', 'image_encoder.trunk.blocks.15.norm1.bias', 'image_encoder.trunk.blocks.23.norm1.bias', 'image_encoder.trunk.blocks.3.attn.qkv.bias', 'image_encoder.trunk.blocks.7.norm1.bias', 'memory_attention.layers.3.self_attn.v_proj.bias', 'sam_mask_decoder.transformer.layers.1.self_attn.q_proj.bias', 'sam_mask_decoder.transformer.layers.1.self_attn.k_proj.bias', 'image_encoder.trunk.blocks.12.mlp.layers.0.bias', 'image_encoder.trunk.blocks.15.mlp.layers.0.bias', 'image_encoder.trunk.blocks.6.mlp.layers.1.bias', 'memory_attention.layers.1.norm3.bias', 'memory_attention.layers.0.linear1.bias', 'memory_attention.layers.1.cross_attn_image.out_proj.bias', 'image_encoder.trunk.blocks.6.attn.qkv.bias', 'sam_mask_decoder.transformer.layers.0.norm2.bias', 'image_encoder.trunk.blocks.11.mlp.layers.0.bias', 'memory_attention.norm.bias', 'memory_attention.layers.0.self_attn.q_proj.bias', 'memory_encoder.mask_downsampler.encoder.7.bias', 
'image_encoder.trunk.blocks.3.norm1.bias', 'memory_attention.layers.1.norm2.bias', 'memory_attention.layers.1.norm1.bias', 'image_encoder.trunk.blocks.10.mlp.layers.1.bias', 'sam_mask_decoder.transformer.layers.1.cross_attn_token_to_image.q_proj.bias', 'obj_ptr_proj.layers.1.bias', 'sam_mask_decoder.output_hypernetworks_mlps.1.layers.2.bias', 'sam_prompt_encoder.mask_downscaling.6.bias', 'image_encoder.trunk.blocks.13.attn.proj.bias', 'image_encoder.trunk.blocks.1.attn.proj.bias', 'image_encoder.trunk.blocks.13.norm1.bias', 'image_encoder.trunk.blocks.12.norm2.bias', 'image_encoder.trunk.blocks.0.attn.proj.bias', 'sam_prompt_encoder.mask_downscaling.3.bias', 'sam_mask_decoder.transformer.layers.0.cross_attn_token_to_image.out_proj.bias', 'sam_mask_decoder.transformer.layers.0.cross_attn_token_to_image.k_proj.bias', 'image_encoder.neck.convs.2.conv.bias', 'image_encoder.trunk.blocks.4.norm2.bias', 'image_encoder.trunk.blocks.18.mlp.layers.1.bias', 'sam_mask_decoder.output_hypernetworks_mlps.0.layers.1.bias', 'sam_prompt_encoder.mask_downscaling.1.bias', 'image_encoder.trunk.blocks.10.norm2.bias', 'sam_prompt_encoder.mask_downscaling.0.bias', 'sam_mask_decoder.transformer.final_attn_token_to_image.v_proj.bias', 'image_encoder.trunk.blocks.17.norm2.bias', 'sam_mask_decoder.transformer.layers.0.cross_attn_token_to_image.v_proj.bias', 'image_encoder.trunk.blocks.17.attn.proj.bias', 'sam_mask_decoder.transformer.layers.0.cross_attn_image_to_token.out_proj.bias', 'image_encoder.trunk.blocks.15.norm2.bias', 'image_encoder.trunk.blocks.21.norm2.bias', 'memory_attention.layers.1.self_attn.out_proj.bias', 'image_encoder.trunk.blocks.6.norm1.bias', 'image_encoder.trunk.blocks.5.mlp.layers.0.bias', 'memory_encoder.mask_downsampler.encoder.6.bias', 'image_encoder.trunk.blocks.0.mlp.layers.0.bias', 'memory_encoder.fuser.layers.1.norm.bias', 'image_encoder.trunk.blocks.20.mlp.layers.1.bias', 'image_encoder.trunk.blocks.4.attn.proj.bias', 'memory_encoder.fuser.layers.0.norm.bias', 
'sam_mask_decoder.transformer.layers.1.self_attn.v_proj.bias', 'sam_mask_decoder.transformer.layers.1.cross_attn_image_to_token.q_proj.bias', 'memory_attention.layers.0.self_attn.v_proj.bias', 'image_encoder.trunk.blocks.8.attn.qkv.bias', 'sam_mask_decoder.transformer.layers.0.norm1.bias', 'image_encoder.trunk.blocks.21.norm1.bias', 'sam_mask_decoder.output_hypernetworks_mlps.3.layers.0.bias', 'memory_attention.layers.2.norm3.bias', 'image_encoder.trunk.blocks.1.mlp.layers.1.bias', 'image_encoder.neck.convs.3.conv.bias', 'image_encoder.trunk.blocks.5.norm2.bias', 'sam_mask_decoder.output_hypernetworks_mlps.1.layers.0.bias', 'image_encoder.trunk.blocks.18.norm1.bias', 'memory_attention.layers.3.cross_attn_image.k_proj.bias', 'sam_mask_decoder.transformer.layers.1.mlp.layers.0.bias', 'sam_mask_decoder.transformer.layers.1.cross_attn_token_to_image.out_proj.bias', 'sam_mask_decoder.transformer.layers.1.cross_attn_image_to_token.k_proj.bias', 'memory_attention.layers.3.linear1.bias', 'image_encoder.trunk.blocks.2.mlp.layers.1.bias', 'image_encoder.trunk.blocks.23.attn.qkv.bias', 'sam_mask_decoder.output_hypernetworks_mlps.2.layers.2.bias', 'image_encoder.trunk.blocks.23.attn.proj.bias', 'image_encoder.trunk.blocks.4.norm1.bias', 'image_encoder.trunk.blocks.22.norm1.bias', 'image_encoder.trunk.blocks.14.norm2.bias', 'image_encoder.trunk.blocks.9.norm2.bias', 'memory_attention.layers.1.cross_attn_image.k_proj.bias', 'image_encoder.trunk.blocks.12.norm1.bias', 'memory_attention.layers.0.norm2.bias', 'image_encoder.trunk.blocks.2.attn.qkv.bias', 'image_encoder.trunk.blocks.21.attn.qkv.bias', 'sam_mask_decoder.conv_s0.bias', 'image_encoder.trunk.blocks.12.attn.qkv.bias', 'sam_mask_decoder.transformer.layers.1.self_attn.out_proj.bias', 'image_encoder.trunk.blocks.7.attn.qkv.bias', 'image_encoder.trunk.blocks.10.attn.qkv.bias', 'image_encoder.trunk.blocks.9.mlp.layers.0.bias', 'image_encoder.trunk.blocks.17.attn.qkv.bias', 'image_encoder.trunk.blocks.16.attn.proj.bias', 
'image_encoder.trunk.blocks.22.attn.proj.bias', 'image_encoder.trunk.blocks.0.norm1.bias', 'sam_mask_decoder.pred_obj_score_head.layers.2.bias', 'memory_attention.layers.1.linear2.bias', 'image_encoder.trunk.blocks.20.norm2.bias', 'sam_mask_decoder.transformer.layers.1.cross_attn_token_to_image.v_proj.bias', 'sam_mask_decoder.output_hypernetworks_mlps.0.layers.2.bias', 'memory_attention.layers.2.cross_attn_image.out_proj.bias', 'image_encoder.trunk.blocks.5.mlp.layers.1.bias', 'image_encoder.trunk.blocks.17.norm1.bias', 'sam_mask_decoder.transformer.layers.1.norm1.bias', 'sam_mask_decoder.conv_s1.bias', 'image_encoder.trunk.blocks.8.mlp.layers.0.bias', 'memory_attention.layers.2.self_attn.k_proj.bias', 'memory_encoder.fuser.layers.0.pwconv2.bias', 'image_encoder.trunk.blocks.15.attn.proj.bias', 'image_encoder.trunk.blocks.19.norm1.bias', 'memory_attention.layers.0.cross_attn_image.k_proj.bias', 'memory_encoder.mask_downsampler.encoder.12.bias', 'image_encoder.trunk.blocks.9.attn.qkv.bias', 'memory_attention.layers.3.norm2.bias', 'memory_encoder.fuser.layers.1.dwconv.bias', 'image_encoder.trunk.blocks.13.mlp.layers.0.bias', 'image_encoder.trunk.blocks.7.mlp.layers.1.bias', 'image_encoder.trunk.blocks.14.attn.proj.bias', 'image_encoder.trunk.blocks.2.mlp.layers.0.bias', 'image_encoder.trunk.blocks.23.mlp.layers.0.bias', 'memory_attention.layers.2.norm1.bias', 'image_encoder.trunk.blocks.16.norm2.bias', 'image_encoder.trunk.blocks.10.attn.proj.bias', 'image_encoder.neck.convs.1.conv.bias', 'image_encoder.trunk.blocks.18.norm2.bias', 'memory_attention.layers.1.cross_attn_image.v_proj.bias', 'sam_mask_decoder.transformer.layers.1.cross_attn_image_to_token.v_proj.bias', 'image_encoder.trunk.blocks.19.attn.qkv.bias', 'sam_mask_decoder.output_hypernetworks_mlps.2.layers.0.bias', 'memory_attention.layers.0.cross_attn_image.v_proj.bias', 'image_encoder.trunk.blocks.6.norm2.bias', 'image_encoder.trunk.blocks.4.mlp.layers.0.bias', 'image_encoder.trunk.blocks.5.proj.bias', 
'obj_ptr_tpos_proj.bias', 'image_encoder.trunk.blocks.19.mlp.layers.0.bias', 'image_encoder.trunk.blocks.8.attn.proj.bias', 'image_encoder.trunk.blocks.14.attn.qkv.bias', 'image_encoder.trunk.blocks.9.mlp.layers.1.bias', 'memory_attention.layers.2.self_attn.out_proj.bias', 'memory_encoder.pix_feat_proj.bias', 'image_encoder.trunk.blocks.13.norm2.bias', 'memory_attention.layers.2.linear2.bias', 'sam_mask_decoder.transformer.layers.0.cross_attn_token_to_image.q_proj.bias', 'sam_mask_decoder.transformer.layers.0.self_attn.out_proj.bias', 'image_encoder.trunk.blocks.9.attn.proj.bias', 'image_encoder.trunk.blocks.11.attn.qkv.bias', 'image_encoder.trunk.blocks.22.mlp.layers.1.bias', 'image_encoder.trunk.blocks.15.mlp.layers.1.bias', 'sam_mask_decoder.transformer.layers.0.norm4.bias', 'image_encoder.trunk.blocks.17.mlp.layers.1.bias', 'sam_mask_decoder.transformer.layers.1.cross_attn_token_to_image.k_proj.bias', 'memory_encoder.fuser.layers.0.dwconv.bias', 'image_encoder.trunk.blocks.12.attn.proj.bias', 'image_encoder.trunk.blocks.1.norm1.bias', 'image_encoder.trunk.blocks.16.mlp.layers.1.bias', 'sam_mask_decoder.transformer.layers.1.norm2.bias', 'image_encoder.trunk.blocks.18.attn.qkv.bias', 'image_encoder.trunk.blocks.11.norm1.bias', 'memory_encoder.fuser.layers.1.pwconv2.bias', 'memory_encoder.mask_downsampler.encoder.0.bias', 'image_encoder.trunk.blocks.7.mlp.layers.0.bias', 'image_encoder.trunk.blocks.21.mlp.layers.1.bias', 'image_encoder.trunk.blocks.21.attn.proj.bias', 'mask_downsample.bias', 'image_encoder.trunk.blocks.3.mlp.layers.1.bias', 'image_encoder.trunk.blocks.7.attn.proj.bias', 'image_encoder.trunk.blocks.16.attn.qkv.bias', 'image_encoder.trunk.blocks.2.proj.bias', 'sam_prompt_encoder.mask_downscaling.4.bias', 'memory_attention.layers.2.cross_attn_image.v_proj.bias', 'image_encoder.trunk.blocks.4.mlp.layers.1.bias', 'image_encoder.trunk.blocks.23.mlp.layers.1.bias', 'image_encoder.trunk.blocks.0.attn.qkv.bias', 'image_encoder.trunk.blocks.1.norm2.bias', 
'image_encoder.trunk.blocks.14.mlp.layers.0.bias', 'memory_encoder.mask_downsampler.encoder.3.bias', 'memory_encoder.mask_downsampler.encoder.4.bias', 'sam_mask_decoder.output_hypernetworks_mlps.2.layers.1.bias', 'image_encoder.trunk.blocks.11.norm2.bias', 'image_encoder.trunk.blocks.18.attn.proj.bias', 'memory_attention.layers.0.self_attn.out_proj.bias', 'image_encoder.trunk.blocks.13.mlp.layers.1.bias', 'sam_mask_decoder.transformer.layers.0.self_attn.q_proj.bias', 'sam_mask_decoder.transformer.layers.1.norm4.bias', 'sam_mask_decoder.output_hypernetworks_mlps.3.layers.1.bias', 'image_encoder.trunk.blocks.20.norm1.bias', 'image_encoder.trunk.blocks.20.mlp.layers.0.bias', 'memory_attention.layers.2.cross_attn_image.k_proj.bias', 'image_encoder.trunk.blocks.2.attn.proj.bias', 'sam_mask_decoder.output_hypernetworks_mlps.0.layers.0.bias', 'image_encoder.trunk.blocks.20.attn.proj.bias', 'image_encoder.trunk.blocks.3.norm2.bias', 'image_encoder.trunk.blocks.12.mlp.layers.1.bias', 'image_encoder.trunk.blocks.22.norm2.bias', 'memory_attention.layers.0.norm3.bias', 'memory_attention.layers.2.self_attn.q_proj.bias', 'memory_attention.layers.3.norm1.bias', 'image_encoder.trunk.blocks.7.norm2.bias', 'memory_encoder.mask_downsampler.encoder.1.bias', 'image_encoder.trunk.patch_embed.proj.bias', 'image_encoder.trunk.blocks.5.attn.proj.bias', 'image_encoder.trunk.blocks.6.attn.proj.bias', 'sam_mask_decoder.output_hypernetworks_mlps.1.layers.1.bias', 'image_encoder.trunk.blocks.4.attn.qkv.bias', 'memory_attention.layers.3.cross_attn_image.v_proj.bias', 'sam_mask_decoder.transformer.layers.0.cross_attn_image_to_token.q_proj.bias', 'memory_encoder.fuser.layers.0.pwconv1.bias', 'image_encoder.trunk.blocks.22.mlp.layers.0.bias', 'sam_mask_decoder.transformer.final_attn_token_to_image.k_proj.bias', 'sam_mask_decoder.output_upscaling.3.bias', 'image_encoder.trunk.blocks.13.attn.qkv.bias', 'memory_attention.layers.3.linear2.bias', 'memory_attention.layers.0.cross_attn_image.q_proj.bias', 
'memory_attention.layers.0.norm1.bias', 'memory_encoder.out_proj.bias', 'sam_mask_decoder.pred_obj_score_head.layers.0.bias', 'image_encoder.trunk.blocks.11.mlp.layers.1.bias', 'memory_attention.layers.2.self_attn.v_proj.bias', 'sam_mask_decoder.transformer.layers.0.self_attn.v_proj.bias', 'obj_ptr_proj.layers.2.bias', 'image_encoder.trunk.blocks.5.norm1.bias', 'memory_attention.layers.2.norm2.bias', 'image_encoder.trunk.blocks.16.mlp.layers.0.bias', 'memory_encoder.fuser.layers.1.pwconv1.bias', 'memory_attention.layers.1.self_attn.v_proj.bias', 'sam_mask_decoder.iou_prediction_head.layers.1.bias', 'sam_mask_decoder.transformer.layers.0.cross_attn_image_to_token.v_proj.bias', 'sam_mask_decoder.output_hypernetworks_mlps.3.layers.2.bias', 'image_encoder.trunk.blocks.8.norm2.bias', 'image_encoder.trunk.blocks.11.attn.proj.bias', 'image_encoder.trunk.blocks.0.mlp.layers.1.bias', 'sam_mask_decoder.transformer.layers.0.cross_attn_image_to_token.k_proj.bias', 'memory_encoder.mask_downsampler.encoder.9.bias', 'sam_mask_decoder.iou_prediction_head.layers.0.bias', 'sam_mask_decoder.output_upscaling.1.bias', 'memory_attention.layers.3.self_attn.k_proj.bias'}
610
+ INFO 2025-10-06 06:35:11,633 optimizer.py: 220: Matches for module_cls_name [torch.nn.LayerNorm]: {'memory_attention.layers.3.norm3.bias', 'image_encoder.trunk.blocks.9.norm1.bias', 'image_encoder.trunk.blocks.2.norm1.bias', 'image_encoder.trunk.blocks.4.norm1.weight', 'image_encoder.trunk.blocks.2.norm2.bias', 'image_encoder.trunk.blocks.16.norm2.weight', 'sam_mask_decoder.transformer.layers.1.norm3.weight', 'image_encoder.trunk.blocks.8.norm1.bias', 'image_encoder.trunk.blocks.19.norm1.weight', 'image_encoder.trunk.blocks.1.norm1.weight', 'image_encoder.trunk.blocks.2.norm2.weight', 'image_encoder.trunk.blocks.5.norm2.weight', 'sam_mask_decoder.transformer.layers.1.norm3.bias', 'image_encoder.trunk.blocks.16.norm1.bias', 'image_encoder.trunk.blocks.0.norm2.bias', 'image_encoder.trunk.blocks.10.norm1.bias', 'memory_attention.layers.2.norm3.weight', 'image_encoder.trunk.blocks.19.norm2.bias', 'image_encoder.trunk.blocks.14.norm1.bias', 'sam_mask_decoder.transformer.layers.0.norm3.bias', 'image_encoder.trunk.blocks.12.norm2.weight', 'memory_attention.layers.1.norm1.weight', 'sam_mask_decoder.transformer.norm_final_attn.bias', 'image_encoder.trunk.blocks.4.norm2.weight', 'image_encoder.trunk.blocks.23.norm2.bias', 'image_encoder.trunk.blocks.17.norm1.weight', 'sam_mask_decoder.transformer.layers.0.norm4.weight', 'memory_attention.layers.2.norm2.weight', 'memory_attention.layers.3.norm2.weight', 'image_encoder.trunk.blocks.15.norm1.bias', 'image_encoder.trunk.blocks.23.norm1.bias', 'image_encoder.trunk.blocks.7.norm1.bias', 'image_encoder.trunk.blocks.22.norm2.weight', 'image_encoder.trunk.blocks.22.norm1.weight', 'memory_attention.layers.1.norm3.bias', 'sam_mask_decoder.transformer.layers.0.norm2.bias', 'memory_attention.norm.bias', 'image_encoder.trunk.blocks.0.norm2.weight', 'image_encoder.trunk.blocks.6.norm2.weight', 'image_encoder.trunk.blocks.14.norm2.weight', 'image_encoder.trunk.blocks.3.norm1.bias', 'image_encoder.trunk.blocks.23.norm2.weight', 
'memory_attention.layers.1.norm2.bias', 'memory_attention.layers.0.norm2.weight', 'image_encoder.trunk.blocks.2.norm1.weight', 'memory_attention.layers.1.norm1.bias', 'image_encoder.trunk.blocks.14.norm1.weight', 'image_encoder.trunk.blocks.13.norm1.bias', 'image_encoder.trunk.blocks.12.norm2.bias', 'sam_mask_decoder.transformer.layers.0.norm2.weight', 'image_encoder.trunk.blocks.4.norm2.bias', 'image_encoder.trunk.blocks.10.norm2.weight', 'image_encoder.trunk.blocks.9.norm2.weight', 'image_encoder.trunk.blocks.10.norm2.bias', 'image_encoder.trunk.blocks.17.norm2.bias', 'image_encoder.trunk.blocks.15.norm2.bias', 'image_encoder.trunk.blocks.21.norm2.bias', 'image_encoder.trunk.blocks.6.norm1.bias', 'sam_mask_decoder.transformer.layers.1.norm2.weight', 'image_encoder.trunk.blocks.21.norm1.bias', 'sam_mask_decoder.transformer.layers.0.norm1.bias', 'memory_attention.layers.3.norm3.weight', 'memory_attention.layers.3.norm1.weight', 'memory_attention.layers.2.norm3.bias', 'image_encoder.trunk.blocks.5.norm2.bias', 'image_encoder.trunk.blocks.11.norm1.weight', 'image_encoder.trunk.blocks.18.norm1.bias', 'image_encoder.trunk.blocks.8.norm1.weight', 'image_encoder.trunk.blocks.14.norm2.bias', 'image_encoder.trunk.blocks.22.norm1.bias', 'image_encoder.trunk.blocks.9.norm2.bias', 'image_encoder.trunk.blocks.4.norm1.bias', 'image_encoder.trunk.blocks.12.norm1.bias', 'memory_attention.layers.0.norm2.bias', 'image_encoder.trunk.blocks.10.norm1.weight', 'sam_mask_decoder.transformer.norm_final_attn.weight', 'image_encoder.trunk.blocks.9.norm1.weight', 'memory_attention.layers.0.norm1.weight', 'image_encoder.trunk.blocks.15.norm1.weight', 'image_encoder.trunk.blocks.0.norm1.bias', 'memory_attention.norm.weight', 'image_encoder.trunk.blocks.20.norm2.bias', 'sam_mask_decoder.transformer.layers.1.norm4.weight', 'sam_mask_decoder.transformer.layers.1.norm1.bias', 'image_encoder.trunk.blocks.17.norm1.bias', 'image_encoder.trunk.blocks.19.norm1.bias', 
'sam_mask_decoder.transformer.layers.0.norm1.weight', 'image_encoder.trunk.blocks.6.norm1.weight', 'memory_attention.layers.3.norm2.bias', 'image_encoder.trunk.blocks.0.norm1.weight', 'memory_attention.layers.2.norm1.bias', 'image_encoder.trunk.blocks.16.norm2.bias', 'image_encoder.trunk.blocks.3.norm1.weight', 'image_encoder.trunk.blocks.18.norm2.bias', 'image_encoder.trunk.blocks.13.norm1.weight', 'image_encoder.trunk.blocks.21.norm2.weight', 'image_encoder.trunk.blocks.7.norm1.weight', 'image_encoder.trunk.blocks.12.norm1.weight', 'image_encoder.trunk.blocks.6.norm2.bias', 'image_encoder.trunk.blocks.18.norm1.weight', 'image_encoder.trunk.blocks.1.norm2.weight', 'memory_attention.layers.0.norm3.weight', 'image_encoder.trunk.blocks.13.norm2.bias', 'sam_mask_decoder.transformer.layers.0.norm4.bias', 'memory_attention.layers.1.norm2.weight', 'image_encoder.trunk.blocks.20.norm2.weight', 'image_encoder.trunk.blocks.1.norm1.bias', 'image_encoder.trunk.blocks.23.norm1.weight', 'image_encoder.trunk.blocks.16.norm1.weight', 'sam_mask_decoder.transformer.layers.1.norm2.bias', 'image_encoder.trunk.blocks.11.norm1.bias', 'sam_mask_decoder.transformer.layers.1.norm1.weight', 'image_encoder.trunk.blocks.11.norm2.weight', 'image_encoder.trunk.blocks.5.norm1.weight', 'image_encoder.trunk.blocks.1.norm2.bias', 'image_encoder.trunk.blocks.8.norm2.weight', 'image_encoder.trunk.blocks.11.norm2.bias', 'memory_attention.layers.1.norm3.weight', 'sam_mask_decoder.transformer.layers.0.norm3.weight', 'sam_mask_decoder.transformer.layers.1.norm4.bias', 'image_encoder.trunk.blocks.20.norm1.bias', 'image_encoder.trunk.blocks.13.norm2.weight', 'image_encoder.trunk.blocks.3.norm2.bias', 'memory_attention.layers.2.norm1.weight', 'image_encoder.trunk.blocks.22.norm2.bias', 'memory_attention.layers.0.norm3.bias', 'image_encoder.trunk.blocks.7.norm2.weight', 'image_encoder.trunk.blocks.7.norm2.bias', 'memory_attention.layers.3.norm1.bias', 'image_encoder.trunk.blocks.15.norm2.weight', 
'image_encoder.trunk.blocks.17.norm2.weight', 'memory_attention.layers.0.norm1.bias', 'image_encoder.trunk.blocks.3.norm2.weight', 'image_encoder.trunk.blocks.19.norm2.weight', 'image_encoder.trunk.blocks.5.norm1.bias', 'memory_attention.layers.2.norm2.bias', 'image_encoder.trunk.blocks.20.norm1.weight', 'image_encoder.trunk.blocks.8.norm2.bias', 'image_encoder.trunk.blocks.18.norm2.weight', 'image_encoder.trunk.blocks.21.norm1.weight'}
611
+ INFO 2025-10-06 06:35:12,861 sam2_datasets.py: 125: Dataset mixing probabilities: [1.0]
612
+ INFO 2025-10-06 06:35:13,341 trainer.py: 417: Loading pretrained checkpoint from {'_partial_': True, '_target_': 'training.utils.checkpoint_utils.load_state_dict_into_model', 'strict': True, 'ignore_unexpected_keys': None, 'ignore_missing_keys': None, 'state_dict': {'_target_': 'training.utils.checkpoint_utils.load_checkpoint_and_apply_kernels', 'checkpoint_path': '/work/nvme/bfgd/cmaduabuchi/MODELS/THRIVESEG/sam2.1_hiera_base_plus.pt', 'ckpt_state_dict_keys': ['model']}}
613
+ INFO 2025-10-06 06:53:51,461 trainer.py: 950: Estimated time remaining: 00d 12h 05m
614
+ INFO 2025-10-06 06:53:51,482 trainer.py: 892: Synchronizing meters
615
+ INFO 2025-10-06 06:53:51,482 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.6424086557137584, 'Losses/train_all_loss_mask': 0.016180070180966514, 'Losses/train_all_loss_dice': 0.2685501508280366, 'Losses/train_all_loss_iou': 0.05025709560852524, 'Losses/train_all_loss_class': 1.2424740680067156e-08, 'Losses/train_all_core_loss': 0.6424086557137584, 'Trainer/where': 0.0249937374749499, 'Trainer/epoch': 0, 'Trainer/steps_train': 3992}
616
+ INFO 2025-10-06 07:12:22,839 trainer.py: 950: Estimated time remaining: 00d 11h 41m
617
+ INFO 2025-10-06 07:12:22,861 trainer.py: 892: Synchronizing meters
618
+ INFO 2025-10-06 07:12:22,861 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.5279103564334108, 'Losses/train_all_loss_mask': 0.012948783188376493, 'Losses/train_all_loss_dice': 0.23409812990016116, 'Losses/train_all_loss_iou': 0.034836555814920164, 'Losses/train_all_loss_class': 1.1137212414612728e-08, 'Losses/train_all_core_loss': 0.5279103564334108, 'Trainer/where': 0.0499937374749499, 'Trainer/epoch': 1, 'Trainer/steps_train': 7984}
619
+ INFO 2025-10-06 07:30:58,749 trainer.py: 950: Estimated time remaining: 00d 11h 25m
620
+ INFO 2025-10-06 07:30:58,771 trainer.py: 892: Synchronizing meters
621
+ INFO 2025-10-06 07:30:58,771 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.46176709332815996, 'Losses/train_all_loss_mask': 0.010168827943158898, 'Losses/train_all_loss_dice': 0.22589266421142704, 'Losses/train_all_loss_iou': 0.03249785962655957, 'Losses/train_all_loss_class': 1.3400916166038667e-08, 'Losses/train_all_core_loss': 0.46176709332815996, 'Trainer/where': 0.0749937374749499, 'Trainer/epoch': 2, 'Trainer/steps_train': 11976}
622
+ INFO 2025-10-06 07:49:42,950 trainer.py: 950: Estimated time remaining: 00d 11h 12m
623
+ INFO 2025-10-06 07:49:42,972 trainer.py: 892: Synchronizing meters
624
+ INFO 2025-10-06 07:49:42,972 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.434850245800041, 'Losses/train_all_loss_mask': 0.008949943296251449, 'Losses/train_all_loss_dice': 0.22050112636688954, 'Losses/train_all_loss_iou': 0.03535024233930884, 'Losses/train_all_loss_class': 1.4512113502645153e-08, 'Losses/train_all_core_loss': 0.434850245800041, 'Trainer/where': 0.09999373747494991, 'Trainer/epoch': 3, 'Trainer/steps_train': 15968}
625
+ INFO 2025-10-06 08:08:34,804 trainer.py: 950: Estimated time remaining: 00d 10h 57m
626
+ INFO 2025-10-06 08:08:34,826 trainer.py: 892: Synchronizing meters
627
+ INFO 2025-10-06 08:08:34,826 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.4899576190065402, 'Losses/train_all_loss_mask': 0.012139334249143563, 'Losses/train_all_loss_dice': 0.2170970643271425, 'Losses/train_all_loss_iou': 0.030073830085804915, 'Losses/train_all_loss_class': 3.6043506326426754e-08, 'Losses/train_all_core_loss': 0.4899576190065402, 'Trainer/where': 0.1249937374749499, 'Trainer/epoch': 4, 'Trainer/steps_train': 19960}
628
+ INFO 2025-10-06 08:27:35,126 trainer.py: 950: Estimated time remaining: 00d 10h 43m
629
+ INFO 2025-10-06 08:27:35,148 trainer.py: 892: Synchronizing meters
630
+ INFO 2025-10-06 08:27:35,148 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.410329947133319, 'Losses/train_all_loss_mask': 0.008565576918526002, 'Losses/train_all_loss_dice': 0.21291188210368395, 'Losses/train_all_loss_iou': 0.026106498928851203, 'Losses/train_all_loss_class': 2.8962244711128784e-08, 'Losses/train_all_core_loss': 0.410329947133319, 'Trainer/where': 0.1499937374749499, 'Trainer/epoch': 5, 'Trainer/steps_train': 23952}
631
+ INFO 2025-10-06 08:46:35,674 trainer.py: 950: Estimated time remaining: 00d 10h 24m
632
+ INFO 2025-10-06 08:46:35,695 trainer.py: 892: Synchronizing meters
633
+ INFO 2025-10-06 08:46:35,695 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.40882908666967405, 'Losses/train_all_loss_mask': 0.008480613211250676, 'Losses/train_all_loss_dice': 0.21131395521706234, 'Losses/train_all_loss_iou': 0.027902849250237918, 'Losses/train_all_loss_class': 2.056003091207329e-08, 'Losses/train_all_core_loss': 0.40882908666967405, 'Trainer/where': 0.1749937374749499, 'Trainer/epoch': 6, 'Trainer/steps_train': 27944}
634
+ INFO 2025-10-06 09:05:27,802 trainer.py: 950: Estimated time remaining: 00d 10h 01m
635
+ INFO 2025-10-06 09:05:27,823 trainer.py: 892: Synchronizing meters
636
+ INFO 2025-10-06 09:05:27,823 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.4277842160713726, 'Losses/train_all_loss_mask': 0.009505709921017888, 'Losses/train_all_loss_dice': 0.2092911386209165, 'Losses/train_all_loss_iou': 0.02837886042178577, 'Losses/train_all_loss_class': 1.8972794202037397e-08, 'Losses/train_all_core_loss': 0.4277842160713726, 'Trainer/where': 0.19999373747494992, 'Trainer/epoch': 7, 'Trainer/steps_train': 31936}
637
+ INFO 2025-10-06 09:24:23,726 trainer.py: 950: Estimated time remaining: 00d 09h 44m
638
+ INFO 2025-10-06 09:24:23,748 trainer.py: 892: Synchronizing meters
639
+ INFO 2025-10-06 09:24:23,749 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3915867800609711, 'Losses/train_all_loss_mask': 0.007933716841337687, 'Losses/train_all_loss_dice': 0.20667340398909811, 'Losses/train_all_loss_iou': 0.02623902521838522, 'Losses/train_all_loss_class': 1.5299105419432164e-08, 'Losses/train_all_core_loss': 0.3915867800609711, 'Trainer/where': 0.2249937374749499, 'Trainer/epoch': 8, 'Trainer/steps_train': 35928}
640
+ INFO 2025-10-06 09:43:05,171 trainer.py: 950: Estimated time remaining: 00d 09h 18m
641
+ INFO 2025-10-06 09:43:05,193 trainer.py: 892: Synchronizing meters
642
+ INFO 2025-10-06 09:43:05,193 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3884903532788829, 'Losses/train_all_loss_mask': 0.00786731781312654, 'Losses/train_all_loss_dice': 0.2054668479936873, 'Losses/train_all_loss_iou': 0.025677137474684822, 'Losses/train_all_loss_class': 1.3447321963829661e-08, 'Losses/train_all_core_loss': 0.3884903532788829, 'Trainer/where': 0.2499937374749499, 'Trainer/epoch': 9, 'Trainer/steps_train': 39920}
643
+ INFO 2025-10-06 10:01:40,978 trainer.py: 950: Estimated time remaining: 00d 08h 57m
644
+ INFO 2025-10-06 10:01:40,999 trainer.py: 892: Synchronizing meters
645
+ INFO 2025-10-06 10:01:41,000 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3757703946919679, 'Losses/train_all_loss_mask': 0.007310912669020113, 'Losses/train_all_loss_dice': 0.20403454606542606, 'Losses/train_all_loss_iou': 0.025517578823297127, 'Losses/train_all_loss_class': 1.685980004621154e-08, 'Losses/train_all_core_loss': 0.3757703946919679, 'Trainer/where': 0.27499373747494993, 'Trainer/epoch': 10, 'Trainer/steps_train': 43912}
646
+ INFO 2025-10-06 10:20:27,893 trainer.py: 950: Estimated time remaining: 00d 08h 43m
647
+ INFO 2025-10-06 10:20:27,913 trainer.py: 892: Synchronizing meters
648
+ INFO 2025-10-06 10:20:27,913 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3717774872969974, 'Losses/train_all_loss_mask': 0.0072885528313850366, 'Losses/train_all_loss_dice': 0.20273731466763484, 'Losses/train_all_loss_iou': 0.023269104299064116, 'Losses/train_all_loss_class': 1.295583962462502e-08, 'Losses/train_all_core_loss': 0.3717774872969974, 'Trainer/where': 0.2999937374749499, 'Trainer/epoch': 11, 'Trainer/steps_train': 47904}
649
+ INFO 2025-10-06 10:39:13,604 trainer.py: 950: Estimated time remaining: 00d 08h 24m
650
+ INFO 2025-10-06 10:39:13,625 trainer.py: 892: Synchronizing meters
651
+ INFO 2025-10-06 10:39:13,625 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3672938159928715, 'Losses/train_all_loss_mask': 0.0071393110150955305, 'Losses/train_all_loss_dice': 0.20154863357066152, 'Losses/train_all_loss_iou': 0.022958954503873592, 'Losses/train_all_loss_class': 9.158463877552852e-09, 'Losses/train_all_core_loss': 0.3672938159928715, 'Trainer/where': 0.3249937374749499, 'Trainer/epoch': 12, 'Trainer/steps_train': 51896}
652
+ INFO 2025-10-06 10:58:10,614 trainer.py: 950: Estimated time remaining: 00d 08h 10m
653
+ INFO 2025-10-06 10:58:10,636 trainer.py: 892: Synchronizing meters
654
+ INFO 2025-10-06 10:58:10,636 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.39827264390161676, 'Losses/train_all_loss_mask': 0.00852792210578642, 'Losses/train_all_loss_dice': 0.2016383660042692, 'Losses/train_all_loss_iou': 0.026075829454423077, 'Losses/train_all_loss_class': 6.9018100357850494e-09, 'Losses/train_all_core_loss': 0.39827264390161676, 'Trainer/where': 0.3499937374749499, 'Trainer/epoch': 13, 'Trainer/steps_train': 55888}
655
+ INFO 2025-10-06 11:17:07,125 trainer.py: 950: Estimated time remaining: 00d 07h 51m
656
+ INFO 2025-10-06 11:17:07,147 trainer.py: 892: Synchronizing meters
657
+ INFO 2025-10-06 11:17:07,147 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3666049185414744, 'Losses/train_all_loss_mask': 0.007134012589840914, 'Losses/train_all_loss_dice': 0.2001152827081556, 'Losses/train_all_loss_iou': 0.023809378810292475, 'Losses/train_all_loss_class': 7.340426579333355e-09, 'Losses/train_all_core_loss': 0.3666049185414744, 'Trainer/where': 0.3749937374749499, 'Trainer/epoch': 14, 'Trainer/steps_train': 59880}
658
+ INFO 2025-10-06 11:36:09,314 trainer.py: 950: Estimated time remaining: 00d 07h 35m
659
+ INFO 2025-10-06 11:36:09,335 trainer.py: 892: Synchronizing meters
660
+ INFO 2025-10-06 11:36:09,335 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.36204657752245556, 'Losses/train_all_loss_mask': 0.0069741076941301034, 'Losses/train_all_loss_dice': 0.1988546567444572, 'Losses/train_all_loss_iou': 0.02370976204282832, 'Losses/train_all_loss_class': 6.914729194342508e-09, 'Losses/train_all_core_loss': 0.36204657752245556, 'Trainer/where': 0.39999373747494993, 'Trainer/epoch': 15, 'Trainer/steps_train': 63872}
661
+ INFO 2025-10-06 11:55:05,493 trainer.py: 950: Estimated time remaining: 00d 07h 13m
662
+ INFO 2025-10-06 11:55:05,515 trainer.py: 892: Synchronizing meters
663
+ INFO 2025-10-06 11:55:05,515 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.36432591524420266, 'Losses/train_all_loss_mask': 0.00711237450751671, 'Losses/train_all_loss_dice': 0.19882314240108273, 'Losses/train_all_loss_iou': 0.023255279706872696, 'Losses/train_all_loss_class': 5.094582148262241e-09, 'Losses/train_all_core_loss': 0.36432591524420266, 'Trainer/where': 0.4249937374749499, 'Trainer/epoch': 16, 'Trainer/steps_train': 67864}
664
+ INFO 2025-10-06 12:14:08,255 trainer.py: 950: Estimated time remaining: 00d 06h 57m
665
+ INFO 2025-10-06 12:14:08,277 trainer.py: 892: Synchronizing meters
666
+ INFO 2025-10-06 12:14:08,277 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3739850448014286, 'Losses/train_all_loss_mask': 0.007661915094332017, 'Losses/train_all_loss_dice': 0.19808480110698806, 'Losses/train_all_loss_iou': 0.02266193838917906, 'Losses/train_all_loss_class': 5.422859437734412e-09, 'Losses/train_all_core_loss': 0.3739850448014286, 'Trainer/where': 0.4499937374749499, 'Trainer/epoch': 17, 'Trainer/steps_train': 71856}
667
+ INFO 2025-10-06 12:33:11,519 trainer.py: 950: Estimated time remaining: 00d 06h 38m
668
+ INFO 2025-10-06 12:33:11,541 trainer.py: 892: Synchronizing meters
669
+ INFO 2025-10-06 12:33:11,541 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3802372602399911, 'Losses/train_all_loss_mask': 0.008000960067011056, 'Losses/train_all_loss_dice': 0.19741905017761524, 'Losses/train_all_loss_iou': 0.02279900476346511, 'Losses/train_all_loss_class': 5.678085751427958e-09, 'Losses/train_all_core_loss': 0.3802372602399911, 'Trainer/where': 0.4749937374749499, 'Trainer/epoch': 18, 'Trainer/steps_train': 75848}
670
+ INFO 2025-10-06 12:52:16,750 trainer.py: 950: Estimated time remaining: 00d 06h 20m
671
+ INFO 2025-10-06 12:52:16,771 trainer.py: 892: Synchronizing meters
672
+ INFO 2025-10-06 12:52:16,772 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.376298183201997, 'Losses/train_all_loss_mask': 0.007830308981010056, 'Losses/train_all_loss_dice': 0.1965342678711983, 'Losses/train_all_loss_iou': 0.023157731618651492, 'Losses/train_all_loss_class': 5.28514186526349e-09, 'Losses/train_all_core_loss': 0.376298183201997, 'Trainer/where': 0.4999937374749499, 'Trainer/epoch': 19, 'Trainer/steps_train': 79840}
673
+ INFO 2025-10-06 13:11:24,458 trainer.py: 950: Estimated time remaining: 00d 06h 02m
674
+ INFO 2025-10-06 13:11:24,479 trainer.py: 892: Synchronizing meters
675
+ INFO 2025-10-06 13:11:24,480 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3772340752292874, 'Losses/train_all_loss_mask': 0.007914954837213077, 'Losses/train_all_loss_dice': 0.19617746839064634, 'Losses/train_all_loss_iou': 0.022757507024552415, 'Losses/train_all_loss_class': 5.4267739055031245e-09, 'Losses/train_all_core_loss': 0.3772340752292874, 'Trainer/where': 0.5249937374749499, 'Trainer/epoch': 20, 'Trainer/steps_train': 83832}
676
+ INFO 2025-10-06 13:30:31,353 trainer.py: 950: Estimated time remaining: 00d 05h 42m
677
+ INFO 2025-10-06 13:30:31,379 trainer.py: 892: Synchronizing meters
678
+ INFO 2025-10-06 13:30:31,379 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.37047547260336655, 'Losses/train_all_loss_mask': 0.007639010061916952, 'Losses/train_all_loss_dice': 0.1958161407786763, 'Losses/train_all_loss_iou': 0.02187912743158927, 'Losses/train_all_loss_class': 5.4363083103324426e-09, 'Losses/train_all_core_loss': 0.37047547260336655, 'Trainer/where': 0.54999373747495, 'Trainer/epoch': 21, 'Trainer/steps_train': 87824}
679
+ INFO 2025-10-06 13:49:40,277 trainer.py: 950: Estimated time remaining: 00d 05h 24m
680
+ INFO 2025-10-06 13:49:40,299 trainer.py: 892: Synchronizing meters
681
+ INFO 2025-10-06 13:49:40,299 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.35376920676995477, 'Losses/train_all_loss_mask': 0.006838303287161567, 'Losses/train_all_loss_dice': 0.19547302056410032, 'Losses/train_all_loss_iou': 0.021530116622054854, 'Losses/train_all_loss_class': 6.322159236068461e-09, 'Losses/train_all_core_loss': 0.35376920676995477, 'Trainer/where': 0.5749937374749499, 'Trainer/epoch': 22, 'Trainer/steps_train': 91816}
682
+ INFO 2025-10-06 14:08:52,182 trainer.py: 950: Estimated time remaining: 00d 05h 06m
683
+ INFO 2025-10-06 14:08:52,203 trainer.py: 892: Synchronizing meters
684
+ INFO 2025-10-06 14:08:52,203 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3551223263956834, 'Losses/train_all_loss_mask': 0.006957760564867117, 'Losses/train_all_loss_dice': 0.1945757962957413, 'Losses/train_all_loss_iou': 0.02139131658811324, 'Losses/train_all_loss_class': 4.68340592482518e-09, 'Losses/train_all_core_loss': 0.3551223263956834, 'Trainer/where': 0.5999937374749499, 'Trainer/epoch': 23, 'Trainer/steps_train': 95808}
685
+ INFO 2025-10-06 14:28:02,935 trainer.py: 950: Estimated time remaining: 00d 04h 46m
686
+ INFO 2025-10-06 14:28:02,956 trainer.py: 892: Synchronizing meters
687
+ INFO 2025-10-06 14:28:02,956 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.35436655999975974, 'Losses/train_all_loss_mask': 0.006915995280616119, 'Losses/train_all_loss_dice': 0.19451504708351736, 'Losses/train_all_loss_iou': 0.0215316050213107, 'Losses/train_all_loss_class': 4.694827900397807e-09, 'Losses/train_all_core_loss': 0.35436655999975974, 'Trainer/where': 0.6249937374749499, 'Trainer/epoch': 24, 'Trainer/steps_train': 99800}
688
+ INFO 2025-10-06 14:47:14,335 trainer.py: 950: Estimated time remaining: 00d 04h 27m
689
+ INFO 2025-10-06 14:47:14,363 trainer.py: 892: Synchronizing meters
690
+ INFO 2025-10-06 14:47:14,363 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3539243154792313, 'Losses/train_all_loss_mask': 0.0069243552351725595, 'Losses/train_all_loss_dice': 0.19411168701364426, 'Losses/train_all_loss_iou': 0.021325522290423973, 'Losses/train_all_loss_class': 4.124210543847477e-09, 'Losses/train_all_core_loss': 0.3539243154792313, 'Trainer/where': 0.6499937374749499, 'Trainer/epoch': 25, 'Trainer/steps_train': 103792}
691
+ INFO 2025-10-06 15:06:27,350 trainer.py: 950: Estimated time remaining: 00d 04h 08m
692
+ INFO 2025-10-06 15:06:27,371 trainer.py: 892: Synchronizing meters
693
+ INFO 2025-10-06 15:06:27,371 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3885851017036615, 'Losses/train_all_loss_mask': 0.008587317138184215, 'Losses/train_all_loss_dice': 0.1942436489498687, 'Losses/train_all_loss_iou': 0.02259510975809444, 'Losses/train_all_loss_class': 3.7102346460758284e-09, 'Losses/train_all_core_loss': 0.3885851017036615, 'Trainer/where': 0.67499373747495, 'Trainer/epoch': 26, 'Trainer/steps_train': 107784}
694
+ INFO 2025-10-06 15:25:39,425 trainer.py: 950: Estimated time remaining: 00d 03h 49m
695
+ INFO 2025-10-06 15:25:39,447 trainer.py: 892: Synchronizing meters
696
+ INFO 2025-10-06 15:25:39,447 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.7125891149229509, 'Losses/train_all_loss_mask': 0.024751994295421284, 'Losses/train_all_loss_dice': 0.194532726758826, 'Losses/train_all_loss_iou': 0.023016485271324848, 'Losses/train_all_loss_class': 3.9748640794428046e-09, 'Losses/train_all_core_loss': 0.7125891149229509, 'Trainer/where': 0.6999937374749499, 'Trainer/epoch': 27, 'Trainer/steps_train': 111776}
697
+ INFO 2025-10-06 15:44:53,252 trainer.py: 950: Estimated time remaining: 00d 03h 30m
698
+ INFO 2025-10-06 15:44:53,273 trainer.py: 892: Synchronizing meters
699
+ INFO 2025-10-06 15:44:53,273 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.8676063124507335, 'Losses/train_all_loss_mask': 0.032492553048528834, 'Losses/train_all_loss_dice': 0.1948043356587987, 'Losses/train_all_loss_iou': 0.022950956187875175, 'Losses/train_all_loss_class': 4.138141090095644e-09, 'Losses/train_all_core_loss': 0.8676063124507335, 'Trainer/where': 0.7249937374749499, 'Trainer/epoch': 28, 'Trainer/steps_train': 115768}
700
+ INFO 2025-10-06 16:04:06,937 trainer.py: 950: Estimated time remaining: 00d 03h 11m
701
+ INFO 2025-10-06 16:04:06,959 trainer.py: 892: Synchronizing meters
702
+ INFO 2025-10-06 16:04:06,959 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3487479994164496, 'Losses/train_all_loss_mask': 0.0067503434569706235, 'Losses/train_all_loss_dice': 0.19311891421526373, 'Losses/train_all_loss_iou': 0.020622213926316305, 'Losses/train_all_loss_class': 4.467678567490371e-09, 'Losses/train_all_core_loss': 0.3487479994164496, 'Trainer/where': 0.7499937374749499, 'Trainer/epoch': 29, 'Trainer/steps_train': 119760}
703
+ INFO 2025-10-06 16:23:19,709 trainer.py: 950: Estimated time remaining: 00d 02h 52m
704
+ INFO 2025-10-06 16:23:19,730 trainer.py: 892: Synchronizing meters
705
+ INFO 2025-10-06 16:23:19,730 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.36419604813683787, 'Losses/train_all_loss_mask': 0.00751875088206941, 'Losses/train_all_loss_dice': 0.19322081335740005, 'Losses/train_all_loss_iou': 0.0206002136427904, 'Losses/train_all_loss_class': 5.008077296045301e-09, 'Losses/train_all_core_loss': 0.36419604813683787, 'Trainer/where': 0.7749937374749499, 'Trainer/epoch': 30, 'Trainer/steps_train': 123752}
706
+ INFO 2025-10-06 16:42:36,647 trainer.py: 950: Estimated time remaining: 00d 02h 33m
707
+ INFO 2025-10-06 16:42:36,669 trainer.py: 892: Synchronizing meters
708
+ INFO 2025-10-06 16:42:36,669 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.34595307377449336, 'Losses/train_all_loss_mask': 0.006689208541691566, 'Losses/train_all_loss_dice': 0.19237655501267714, 'Losses/train_all_loss_iou': 0.01979234506802322, 'Losses/train_all_loss_class': 5.1453944205931e-09, 'Losses/train_all_core_loss': 0.34595307377449336, 'Trainer/where': 0.79999373747495, 'Trainer/epoch': 31, 'Trainer/steps_train': 127744}
709
+ INFO 2025-10-06 17:01:54,652 trainer.py: 950: Estimated time remaining: 00d 02h 14m
710
+ INFO 2025-10-06 17:01:54,674 trainer.py: 892: Synchronizing meters
711
+ INFO 2025-10-06 17:01:54,674 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.34565046294508334, 'Losses/train_all_loss_mask': 0.006636826759476352, 'Losses/train_all_loss_dice': 0.19229123223281813, 'Losses/train_all_loss_iou': 0.020622693491710736, 'Losses/train_all_loss_class': 4.764466950168121e-09, 'Losses/train_all_core_loss': 0.34565046294508334, 'Trainer/where': 0.8249937374749499, 'Trainer/epoch': 32, 'Trainer/steps_train': 131736}
712
+ INFO 2025-10-06 17:21:09,500 trainer.py: 950: Estimated time remaining: 00d 01h 55m
713
+ INFO 2025-10-06 17:21:09,521 trainer.py: 892: Synchronizing meters
714
+ INFO 2025-10-06 17:21:09,521 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.9008659057842683, 'Losses/train_all_loss_mask': 0.03423682985725872, 'Losses/train_all_loss_dice': 0.1938983456405227, 'Losses/train_all_loss_iou': 0.02223101315849819, 'Losses/train_all_loss_class': 4.9622400122766974e-09, 'Losses/train_all_core_loss': 0.9008659057842683, 'Trainer/where': 0.8499937374749498, 'Trainer/epoch': 33, 'Trainer/steps_train': 135728}
715
+ INFO 2025-10-06 17:40:24,086 trainer.py: 950: Estimated time remaining: 00d 01h 35m
716
+ INFO 2025-10-06 17:40:24,108 trainer.py: 892: Synchronizing meters
717
+ INFO 2025-10-06 17:40:24,108 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3465600523536368, 'Losses/train_all_loss_mask': 0.0067609497240599245, 'Losses/train_all_loss_dice': 0.19183460045195294, 'Losses/train_all_loss_iou': 0.019506455022350135, 'Losses/train_all_loss_class': 4.679632632014728e-09, 'Losses/train_all_core_loss': 0.3465600523536368, 'Trainer/where': 0.8749937374749498, 'Trainer/epoch': 34, 'Trainer/steps_train': 139720}
718
+ INFO 2025-10-06 17:59:43,886 trainer.py: 950: Estimated time remaining: 00d 01h 17m
719
+ INFO 2025-10-06 17:59:43,908 trainer.py: 892: Synchronizing meters
720
+ INFO 2025-10-06 17:59:43,908 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.34736052319718447, 'Losses/train_all_loss_mask': 0.0067391459940458545, 'Losses/train_all_loss_dice': 0.1922520945270458, 'Losses/train_all_loss_iou': 0.020325507099748605, 'Losses/train_all_loss_class': 4.45559715646195e-09, 'Losses/train_all_core_loss': 0.34736052319718447, 'Trainer/where': 0.8999937374749498, 'Trainer/epoch': 35, 'Trainer/steps_train': 143712}
721
+ INFO 2025-10-06 18:18:47,675 trainer.py: 950: Estimated time remaining: 00d 00h 56m
722
+ INFO 2025-10-06 18:18:47,697 trainer.py: 892: Synchronizing meters
723
+ INFO 2025-10-06 18:18:47,697 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3672967086860374, 'Losses/train_all_loss_mask': 0.00773209927745972, 'Losses/train_all_loss_dice': 0.19209734350442886, 'Losses/train_all_loss_iou': 0.02055737860401078, 'Losses/train_all_loss_class': 4.592152288894342e-09, 'Losses/train_all_core_loss': 0.3672967086860374, 'Trainer/where': 0.9249937374749498, 'Trainer/epoch': 36, 'Trainer/steps_train': 147704}
724
+ INFO 2025-10-06 18:37:46,625 trainer.py: 950: Estimated time remaining: 00d 00h 37m
725
+ INFO 2025-10-06 18:37:46,646 trainer.py: 892: Synchronizing meters
726
+ INFO 2025-10-06 18:37:46,646 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.8421824378987265, 'Losses/train_all_loss_mask': 0.03133104354486921, 'Losses/train_all_loss_dice': 0.19316817402003522, 'Losses/train_all_loss_iou': 0.02239339469971622, 'Losses/train_all_loss_class': 4.4197077939473966e-09, 'Losses/train_all_core_loss': 0.8421824378987265, 'Trainer/where': 0.9499937374749499, 'Trainer/epoch': 37, 'Trainer/steps_train': 151696}
727
+ INFO 2025-10-06 18:56:48,973 trainer.py: 950: Estimated time remaining: 00d 00h 18m
728
+ INFO 2025-10-06 18:56:48,995 trainer.py: 892: Synchronizing meters
729
+ INFO 2025-10-06 18:56:48,995 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.3468215012218792, 'Losses/train_all_loss_mask': 0.006743870759146193, 'Losses/train_all_loss_dice': 0.19145133795742997, 'Losses/train_all_loss_iou': 0.020492745865770254, 'Losses/train_all_loss_class': 4.498966078856853e-09, 'Losses/train_all_core_loss': 0.3468215012218792, 'Trainer/where': 0.9749937374749498, 'Trainer/epoch': 38, 'Trainer/steps_train': 155688}
730
+ INFO 2025-10-06 19:15:48,999 trainer.py: 950: Estimated time remaining: 00d 00h 00m
731
+ INFO 2025-10-06 19:15:49,026 trainer.py: 892: Synchronizing meters
732
+ INFO 2025-10-06 19:15:49,026 trainer.py: 830: Losses and meters: {'Losses/train_all_loss': 0.361319512792094, 'Losses/train_all_loss_mask': 0.007438624991261454, 'Losses/train_all_loss_dice': 0.19195612370669243, 'Losses/train_all_loss_iou': 0.0205908868190231, 'Losses/train_all_loss_class': 4.3955577136424175e-09, 'Losses/train_all_core_loss': 0.361319512792094, 'Trainer/where': 0.9999937374749498, 'Trainer/epoch': 39, 'Trainer/steps_train': 159680}
experiment/thermal_run1/logs/train_stats.json ADDED
@@ -0,0 +1,40 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"Losses/train_all_loss": 0.6424086557137584, "Losses/train_all_loss_mask": 0.016180070180966514, "Losses/train_all_loss_dice": 0.2685501508280366, "Losses/train_all_loss_iou": 0.05025709560852524, "Losses/train_all_loss_class": 1.2424740680067156e-08, "Losses/train_all_core_loss": 0.6424086557137584, "Trainer/where": 0.0249937374749499, "Trainer/epoch": 0, "Trainer/steps_train": 3992}
2
+ {"Losses/train_all_loss": 0.5279103564334108, "Losses/train_all_loss_mask": 0.012948783188376493, "Losses/train_all_loss_dice": 0.23409812990016116, "Losses/train_all_loss_iou": 0.034836555814920164, "Losses/train_all_loss_class": 1.1137212414612728e-08, "Losses/train_all_core_loss": 0.5279103564334108, "Trainer/where": 0.0499937374749499, "Trainer/epoch": 1, "Trainer/steps_train": 7984}
3
+ {"Losses/train_all_loss": 0.46176709332815996, "Losses/train_all_loss_mask": 0.010168827943158898, "Losses/train_all_loss_dice": 0.22589266421142704, "Losses/train_all_loss_iou": 0.03249785962655957, "Losses/train_all_loss_class": 1.3400916166038667e-08, "Losses/train_all_core_loss": 0.46176709332815996, "Trainer/where": 0.0749937374749499, "Trainer/epoch": 2, "Trainer/steps_train": 11976}
4
+ {"Losses/train_all_loss": 0.434850245800041, "Losses/train_all_loss_mask": 0.008949943296251449, "Losses/train_all_loss_dice": 0.22050112636688954, "Losses/train_all_loss_iou": 0.03535024233930884, "Losses/train_all_loss_class": 1.4512113502645153e-08, "Losses/train_all_core_loss": 0.434850245800041, "Trainer/where": 0.09999373747494991, "Trainer/epoch": 3, "Trainer/steps_train": 15968}
5
+ {"Losses/train_all_loss": 0.4899576190065402, "Losses/train_all_loss_mask": 0.012139334249143563, "Losses/train_all_loss_dice": 0.2170970643271425, "Losses/train_all_loss_iou": 0.030073830085804915, "Losses/train_all_loss_class": 3.6043506326426754e-08, "Losses/train_all_core_loss": 0.4899576190065402, "Trainer/where": 0.1249937374749499, "Trainer/epoch": 4, "Trainer/steps_train": 19960}
6
+ {"Losses/train_all_loss": 0.410329947133319, "Losses/train_all_loss_mask": 0.008565576918526002, "Losses/train_all_loss_dice": 0.21291188210368395, "Losses/train_all_loss_iou": 0.026106498928851203, "Losses/train_all_loss_class": 2.8962244711128784e-08, "Losses/train_all_core_loss": 0.410329947133319, "Trainer/where": 0.1499937374749499, "Trainer/epoch": 5, "Trainer/steps_train": 23952}
7
+ {"Losses/train_all_loss": 0.40882908666967405, "Losses/train_all_loss_mask": 0.008480613211250676, "Losses/train_all_loss_dice": 0.21131395521706234, "Losses/train_all_loss_iou": 0.027902849250237918, "Losses/train_all_loss_class": 2.056003091207329e-08, "Losses/train_all_core_loss": 0.40882908666967405, "Trainer/where": 0.1749937374749499, "Trainer/epoch": 6, "Trainer/steps_train": 27944}
8
+ {"Losses/train_all_loss": 0.4277842160713726, "Losses/train_all_loss_mask": 0.009505709921017888, "Losses/train_all_loss_dice": 0.2092911386209165, "Losses/train_all_loss_iou": 0.02837886042178577, "Losses/train_all_loss_class": 1.8972794202037397e-08, "Losses/train_all_core_loss": 0.4277842160713726, "Trainer/where": 0.19999373747494992, "Trainer/epoch": 7, "Trainer/steps_train": 31936}
9
+ {"Losses/train_all_loss": 0.3915867800609711, "Losses/train_all_loss_mask": 0.007933716841337687, "Losses/train_all_loss_dice": 0.20667340398909811, "Losses/train_all_loss_iou": 0.02623902521838522, "Losses/train_all_loss_class": 1.5299105419432164e-08, "Losses/train_all_core_loss": 0.3915867800609711, "Trainer/where": 0.2249937374749499, "Trainer/epoch": 8, "Trainer/steps_train": 35928}
10
+ {"Losses/train_all_loss": 0.3884903532788829, "Losses/train_all_loss_mask": 0.00786731781312654, "Losses/train_all_loss_dice": 0.2054668479936873, "Losses/train_all_loss_iou": 0.025677137474684822, "Losses/train_all_loss_class": 1.3447321963829661e-08, "Losses/train_all_core_loss": 0.3884903532788829, "Trainer/where": 0.2499937374749499, "Trainer/epoch": 9, "Trainer/steps_train": 39920}
11
+ {"Losses/train_all_loss": 0.3757703946919679, "Losses/train_all_loss_mask": 0.007310912669020113, "Losses/train_all_loss_dice": 0.20403454606542606, "Losses/train_all_loss_iou": 0.025517578823297127, "Losses/train_all_loss_class": 1.685980004621154e-08, "Losses/train_all_core_loss": 0.3757703946919679, "Trainer/where": 0.27499373747494993, "Trainer/epoch": 10, "Trainer/steps_train": 43912}
12
+ {"Losses/train_all_loss": 0.3717774872969974, "Losses/train_all_loss_mask": 0.0072885528313850366, "Losses/train_all_loss_dice": 0.20273731466763484, "Losses/train_all_loss_iou": 0.023269104299064116, "Losses/train_all_loss_class": 1.295583962462502e-08, "Losses/train_all_core_loss": 0.3717774872969974, "Trainer/where": 0.2999937374749499, "Trainer/epoch": 11, "Trainer/steps_train": 47904}
13
+ {"Losses/train_all_loss": 0.3672938159928715, "Losses/train_all_loss_mask": 0.0071393110150955305, "Losses/train_all_loss_dice": 0.20154863357066152, "Losses/train_all_loss_iou": 0.022958954503873592, "Losses/train_all_loss_class": 9.158463877552852e-09, "Losses/train_all_core_loss": 0.3672938159928715, "Trainer/where": 0.3249937374749499, "Trainer/epoch": 12, "Trainer/steps_train": 51896}
14
+ {"Losses/train_all_loss": 0.39827264390161676, "Losses/train_all_loss_mask": 0.00852792210578642, "Losses/train_all_loss_dice": 0.2016383660042692, "Losses/train_all_loss_iou": 0.026075829454423077, "Losses/train_all_loss_class": 6.9018100357850494e-09, "Losses/train_all_core_loss": 0.39827264390161676, "Trainer/where": 0.3499937374749499, "Trainer/epoch": 13, "Trainer/steps_train": 55888}
15
+ {"Losses/train_all_loss": 0.3666049185414744, "Losses/train_all_loss_mask": 0.007134012589840914, "Losses/train_all_loss_dice": 0.2001152827081556, "Losses/train_all_loss_iou": 0.023809378810292475, "Losses/train_all_loss_class": 7.340426579333355e-09, "Losses/train_all_core_loss": 0.3666049185414744, "Trainer/where": 0.3749937374749499, "Trainer/epoch": 14, "Trainer/steps_train": 59880}
16
+ {"Losses/train_all_loss": 0.36204657752245556, "Losses/train_all_loss_mask": 0.0069741076941301034, "Losses/train_all_loss_dice": 0.1988546567444572, "Losses/train_all_loss_iou": 0.02370976204282832, "Losses/train_all_loss_class": 6.914729194342508e-09, "Losses/train_all_core_loss": 0.36204657752245556, "Trainer/where": 0.39999373747494993, "Trainer/epoch": 15, "Trainer/steps_train": 63872}
17
+ {"Losses/train_all_loss": 0.36432591524420266, "Losses/train_all_loss_mask": 0.00711237450751671, "Losses/train_all_loss_dice": 0.19882314240108273, "Losses/train_all_loss_iou": 0.023255279706872696, "Losses/train_all_loss_class": 5.094582148262241e-09, "Losses/train_all_core_loss": 0.36432591524420266, "Trainer/where": 0.4249937374749499, "Trainer/epoch": 16, "Trainer/steps_train": 67864}
18
+ {"Losses/train_all_loss": 0.3739850448014286, "Losses/train_all_loss_mask": 0.007661915094332017, "Losses/train_all_loss_dice": 0.19808480110698806, "Losses/train_all_loss_iou": 0.02266193838917906, "Losses/train_all_loss_class": 5.422859437734412e-09, "Losses/train_all_core_loss": 0.3739850448014286, "Trainer/where": 0.4499937374749499, "Trainer/epoch": 17, "Trainer/steps_train": 71856}
19
+ {"Losses/train_all_loss": 0.3802372602399911, "Losses/train_all_loss_mask": 0.008000960067011056, "Losses/train_all_loss_dice": 0.19741905017761524, "Losses/train_all_loss_iou": 0.02279900476346511, "Losses/train_all_loss_class": 5.678085751427958e-09, "Losses/train_all_core_loss": 0.3802372602399911, "Trainer/where": 0.4749937374749499, "Trainer/epoch": 18, "Trainer/steps_train": 75848}
20
+ {"Losses/train_all_loss": 0.376298183201997, "Losses/train_all_loss_mask": 0.007830308981010056, "Losses/train_all_loss_dice": 0.1965342678711983, "Losses/train_all_loss_iou": 0.023157731618651492, "Losses/train_all_loss_class": 5.28514186526349e-09, "Losses/train_all_core_loss": 0.376298183201997, "Trainer/where": 0.4999937374749499, "Trainer/epoch": 19, "Trainer/steps_train": 79840}
21
+ {"Losses/train_all_loss": 0.3772340752292874, "Losses/train_all_loss_mask": 0.007914954837213077, "Losses/train_all_loss_dice": 0.19617746839064634, "Losses/train_all_loss_iou": 0.022757507024552415, "Losses/train_all_loss_class": 5.4267739055031245e-09, "Losses/train_all_core_loss": 0.3772340752292874, "Trainer/where": 0.5249937374749499, "Trainer/epoch": 20, "Trainer/steps_train": 83832}
22
+ {"Losses/train_all_loss": 0.37047547260336655, "Losses/train_all_loss_mask": 0.007639010061916952, "Losses/train_all_loss_dice": 0.1958161407786763, "Losses/train_all_loss_iou": 0.02187912743158927, "Losses/train_all_loss_class": 5.4363083103324426e-09, "Losses/train_all_core_loss": 0.37047547260336655, "Trainer/where": 0.54999373747495, "Trainer/epoch": 21, "Trainer/steps_train": 87824}
23
+ {"Losses/train_all_loss": 0.35376920676995477, "Losses/train_all_loss_mask": 0.006838303287161567, "Losses/train_all_loss_dice": 0.19547302056410032, "Losses/train_all_loss_iou": 0.021530116622054854, "Losses/train_all_loss_class": 6.322159236068461e-09, "Losses/train_all_core_loss": 0.35376920676995477, "Trainer/where": 0.5749937374749499, "Trainer/epoch": 22, "Trainer/steps_train": 91816}
24
+ {"Losses/train_all_loss": 0.3551223263956834, "Losses/train_all_loss_mask": 0.006957760564867117, "Losses/train_all_loss_dice": 0.1945757962957413, "Losses/train_all_loss_iou": 0.02139131658811324, "Losses/train_all_loss_class": 4.68340592482518e-09, "Losses/train_all_core_loss": 0.3551223263956834, "Trainer/where": 0.5999937374749499, "Trainer/epoch": 23, "Trainer/steps_train": 95808}
25
+ {"Losses/train_all_loss": 0.35436655999975974, "Losses/train_all_loss_mask": 0.006915995280616119, "Losses/train_all_loss_dice": 0.19451504708351736, "Losses/train_all_loss_iou": 0.0215316050213107, "Losses/train_all_loss_class": 4.694827900397807e-09, "Losses/train_all_core_loss": 0.35436655999975974, "Trainer/where": 0.6249937374749499, "Trainer/epoch": 24, "Trainer/steps_train": 99800}
26
+ {"Losses/train_all_loss": 0.3539243154792313, "Losses/train_all_loss_mask": 0.0069243552351725595, "Losses/train_all_loss_dice": 0.19411168701364426, "Losses/train_all_loss_iou": 0.021325522290423973, "Losses/train_all_loss_class": 4.124210543847477e-09, "Losses/train_all_core_loss": 0.3539243154792313, "Trainer/where": 0.6499937374749499, "Trainer/epoch": 25, "Trainer/steps_train": 103792}
27
+ {"Losses/train_all_loss": 0.3885851017036615, "Losses/train_all_loss_mask": 0.008587317138184215, "Losses/train_all_loss_dice": 0.1942436489498687, "Losses/train_all_loss_iou": 0.02259510975809444, "Losses/train_all_loss_class": 3.7102346460758284e-09, "Losses/train_all_core_loss": 0.3885851017036615, "Trainer/where": 0.67499373747495, "Trainer/epoch": 26, "Trainer/steps_train": 107784}
28
+ {"Losses/train_all_loss": 0.7125891149229509, "Losses/train_all_loss_mask": 0.024751994295421284, "Losses/train_all_loss_dice": 0.194532726758826, "Losses/train_all_loss_iou": 0.023016485271324848, "Losses/train_all_loss_class": 3.9748640794428046e-09, "Losses/train_all_core_loss": 0.7125891149229509, "Trainer/where": 0.6999937374749499, "Trainer/epoch": 27, "Trainer/steps_train": 111776}
29
+ {"Losses/train_all_loss": 0.8676063124507335, "Losses/train_all_loss_mask": 0.032492553048528834, "Losses/train_all_loss_dice": 0.1948043356587987, "Losses/train_all_loss_iou": 0.022950956187875175, "Losses/train_all_loss_class": 4.138141090095644e-09, "Losses/train_all_core_loss": 0.8676063124507335, "Trainer/where": 0.7249937374749499, "Trainer/epoch": 28, "Trainer/steps_train": 115768}
30
+ {"Losses/train_all_loss": 0.3487479994164496, "Losses/train_all_loss_mask": 0.0067503434569706235, "Losses/train_all_loss_dice": 0.19311891421526373, "Losses/train_all_loss_iou": 0.020622213926316305, "Losses/train_all_loss_class": 4.467678567490371e-09, "Losses/train_all_core_loss": 0.3487479994164496, "Trainer/where": 0.7499937374749499, "Trainer/epoch": 29, "Trainer/steps_train": 119760}
31
+ {"Losses/train_all_loss": 0.36419604813683787, "Losses/train_all_loss_mask": 0.00751875088206941, "Losses/train_all_loss_dice": 0.19322081335740005, "Losses/train_all_loss_iou": 0.0206002136427904, "Losses/train_all_loss_class": 5.008077296045301e-09, "Losses/train_all_core_loss": 0.36419604813683787, "Trainer/where": 0.7749937374749499, "Trainer/epoch": 30, "Trainer/steps_train": 123752}
32
+ {"Losses/train_all_loss": 0.34595307377449336, "Losses/train_all_loss_mask": 0.006689208541691566, "Losses/train_all_loss_dice": 0.19237655501267714, "Losses/train_all_loss_iou": 0.01979234506802322, "Losses/train_all_loss_class": 5.1453944205931e-09, "Losses/train_all_core_loss": 0.34595307377449336, "Trainer/where": 0.79999373747495, "Trainer/epoch": 31, "Trainer/steps_train": 127744}
33
+ {"Losses/train_all_loss": 0.34565046294508334, "Losses/train_all_loss_mask": 0.006636826759476352, "Losses/train_all_loss_dice": 0.19229123223281813, "Losses/train_all_loss_iou": 0.020622693491710736, "Losses/train_all_loss_class": 4.764466950168121e-09, "Losses/train_all_core_loss": 0.34565046294508334, "Trainer/where": 0.8249937374749499, "Trainer/epoch": 32, "Trainer/steps_train": 131736}
34
+ {"Losses/train_all_loss": 0.9008659057842683, "Losses/train_all_loss_mask": 0.03423682985725872, "Losses/train_all_loss_dice": 0.1938983456405227, "Losses/train_all_loss_iou": 0.02223101315849819, "Losses/train_all_loss_class": 4.9622400122766974e-09, "Losses/train_all_core_loss": 0.9008659057842683, "Trainer/where": 0.8499937374749498, "Trainer/epoch": 33, "Trainer/steps_train": 135728}
35
+ {"Losses/train_all_loss": 0.3465600523536368, "Losses/train_all_loss_mask": 0.0067609497240599245, "Losses/train_all_loss_dice": 0.19183460045195294, "Losses/train_all_loss_iou": 0.019506455022350135, "Losses/train_all_loss_class": 4.679632632014728e-09, "Losses/train_all_core_loss": 0.3465600523536368, "Trainer/where": 0.8749937374749498, "Trainer/epoch": 34, "Trainer/steps_train": 139720}
36
+ {"Losses/train_all_loss": 0.34736052319718447, "Losses/train_all_loss_mask": 0.0067391459940458545, "Losses/train_all_loss_dice": 0.1922520945270458, "Losses/train_all_loss_iou": 0.020325507099748605, "Losses/train_all_loss_class": 4.45559715646195e-09, "Losses/train_all_core_loss": 0.34736052319718447, "Trainer/where": 0.8999937374749498, "Trainer/epoch": 35, "Trainer/steps_train": 143712}
37
+ {"Losses/train_all_loss": 0.3672967086860374, "Losses/train_all_loss_mask": 0.00773209927745972, "Losses/train_all_loss_dice": 0.19209734350442886, "Losses/train_all_loss_iou": 0.02055737860401078, "Losses/train_all_loss_class": 4.592152288894342e-09, "Losses/train_all_core_loss": 0.3672967086860374, "Trainer/where": 0.9249937374749498, "Trainer/epoch": 36, "Trainer/steps_train": 147704}
38
+ {"Losses/train_all_loss": 0.8421824378987265, "Losses/train_all_loss_mask": 0.03133104354486921, "Losses/train_all_loss_dice": 0.19316817402003522, "Losses/train_all_loss_iou": 0.02239339469971622, "Losses/train_all_loss_class": 4.4197077939473966e-09, "Losses/train_all_core_loss": 0.8421824378987265, "Trainer/where": 0.9499937374749499, "Trainer/epoch": 37, "Trainer/steps_train": 151696}
39
+ {"Losses/train_all_loss": 0.3468215012218792, "Losses/train_all_loss_mask": 0.006743870759146193, "Losses/train_all_loss_dice": 0.19145133795742997, "Losses/train_all_loss_iou": 0.020492745865770254, "Losses/train_all_loss_class": 4.498966078856853e-09, "Losses/train_all_core_loss": 0.3468215012218792, "Trainer/where": 0.9749937374749498, "Trainer/epoch": 38, "Trainer/steps_train": 155688}
40
+ {"Losses/train_all_loss": 0.361319512792094, "Losses/train_all_loss_mask": 0.007438624991261454, "Losses/train_all_loss_dice": 0.19195612370669243, "Losses/train_all_loss_iou": 0.0205908868190231, "Losses/train_all_loss_class": 4.3955577136424175e-09, "Losses/train_all_core_loss": 0.361319512792094, "Trainer/where": 0.9999937374749498, "Trainer/epoch": 39, "Trainer/steps_train": 159680}
experiment/thermal_run1/tensorboard/events.out.tfevents.1759750510.gpub060.delta.ncsa.illinois.edu.921762.0c94822e4-1523-4465-a797-8a6fd58b2af0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:872d92f23e17cdc70e7c071350d5ac8cd50f1b9f4fb30f6477f5c6def1e2256d
3
+ size 14811175
sam2.1_hiera_base_plus.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a2345aede8715ab1d5d31b4a509fb160c5a4af1970f199d9054ccfb746c004c5
3
+ size 323606802
sam2.1_hiera_large.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2647878d5dfa5098f2f8649825738a9345572bae2d4350a2468587ece47dd318
3
+ size 898083611
sam2.1_hiera_small.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d1aa6f30de5c92224f8172114de081d104bbd23dd9dc5c58996f0cad5dc4d38
3
+ size 184416285