fhaosss commited on
Commit
6b69a9d
·
verified ·
1 Parent(s): 040a4e6

Upload config/uwsam_teacher_paper.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. config/uwsam_teacher_paper.py +342 -0
config/uwsam_teacher_paper.py ADDED
@@ -0,0 +1,342 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ custom_imports = dict(
2
+ allow_failed_imports=False, imports=[
3
+ 'uwsam_teacher',
4
+ ])
5
+ data_root = '/home/cuongvt/My-works/code/UWSAM/UIIS10K/UIIS10K/'
6
+ default_hooks = dict(
7
+ checkpoint=dict(interval=1, max_keep_ckpts=3, type='CheckpointHook'),
8
+ logger=dict(interval=50, type='LoggerHook'),
9
+ param_scheduler=dict(type='ParamSchedulerHook'),
10
+ sampler_seed=dict(type='DistSamplerSeedHook'),
11
+ timer=dict(type='IterTimerHook'),
12
+ visualization=dict(type='DetVisualizationHook'))
13
+ default_scope = 'mmdet'
14
+ env_cfg = dict(
15
+ cuda_check_device=True,
16
+ cudnn_benchmark=False,
17
+ dist_cfg=dict(backend='nccl'),
18
+ mp_cfg=dict(mp_start_method='fork', opencv_num_threads=0))
19
+ launcher = 'none'
20
+ load_from = None
21
+ log_level = 'INFO'
22
+ log_processor = dict(by_epoch=True, type='LogProcessor', window_size=50)
23
+ metainfo = dict(
24
+ classes=(
25
+ 'fish',
26
+ 'reptiles',
27
+ 'arthropoda',
28
+ 'corals',
29
+ 'mollusk',
30
+ 'plants',
31
+ 'ruins',
32
+ 'garbage',
33
+ 'human',
34
+ 'robots',
35
+ ))
36
+ model = dict(
37
+ backbone=dict(
38
+ freeze_base=True,
39
+ img_size=1024,
40
+ lora_alpha=16,
41
+ lora_dropout=0.0,
42
+ lora_r=8,
43
+ sam_checkpoint='/home/cuongvt/My-works/code/UWSAM/sam_vit_h_4b8939.pth',
44
+ sam_type='vit_h',
45
+ type='SAMImageEncoderLoRABackbone'),
46
+ data_preprocessor=dict(
47
+ bgr_to_rgb=True,
48
+ mean=[
49
+ 123.675,
50
+ 116.28,
51
+ 103.53,
52
+ ],
53
+ pad_mask=True,
54
+ pad_size_divisor=32,
55
+ std=[
56
+ 58.395,
57
+ 57.12,
58
+ 57.375,
59
+ ],
60
+ type='DetDataPreprocessor'),
61
+ mask_head=dict(
62
+ freeze_mask_decoder=False,
63
+ in_channels=256,
64
+ loss_iou=dict(loss_weight=0.5, type='MSELoss'),
65
+ loss_mask=dict(
66
+ loss_weight=1.0, type='CrossEntropyLoss', use_sigmoid=True),
67
+ num_classes=10,
68
+ sam_checkpoint='/home/cuongvt/My-works/code/UWSAM/sam_vit_h_4b8939.pth',
69
+ sam_dim=256,
70
+ sam_type='vit_h',
71
+ type='SAMHeadV2'),
72
+ neck=dict(
73
+ in_channels=256,
74
+ rpn_head=dict(
75
+ anchor_generator=dict(
76
+ ratios=[
77
+ 0.5,
78
+ 1.0,
79
+ 2.0,
80
+ ],
81
+ scales=[
82
+ 8,
83
+ ],
84
+ strides=[
85
+ 16,
86
+ ],
87
+ type='AnchorGenerator'),
88
+ bbox_coder=dict(
89
+ target_means=[
90
+ 0.0,
91
+ 0.0,
92
+ 0.0,
93
+ 0.0,
94
+ ],
95
+ target_stds=[
96
+ 1.0,
97
+ 1.0,
98
+ 1.0,
99
+ 1.0,
100
+ ],
101
+ type='DeltaXYWHBBoxCoder'),
102
+ feat_channels=256,
103
+ in_channels=256,
104
+ loss_bbox=dict(loss_weight=1.0, type='L1Loss'),
105
+ loss_cls=dict(
106
+ loss_weight=1.0, type='CrossEntropyLoss', use_sigmoid=True),
107
+ num_convs=1,
108
+ test_cfg=dict(
109
+ max_per_img=100,
110
+ min_bbox_size=0,
111
+ nms=dict(iou_threshold=0.7, type='nms'),
112
+ nms_pre=300),
113
+ train_cfg=dict(
114
+ allowed_border=-1,
115
+ assigner=dict(
116
+ ignore_iof_thr=-1,
117
+ match_low_quality=True,
118
+ min_pos_iou=0.3,
119
+ neg_iou_thr=0.3,
120
+ pos_iou_thr=0.7,
121
+ type='MaxIoUAssigner'),
122
+ debug=False,
123
+ pos_weight=-1,
124
+ sampler=dict(
125
+ add_gt_as_proposals=False,
126
+ neg_pos_ub=-1,
127
+ num=256,
128
+ pos_fraction=0.5,
129
+ type='RandomSampler')),
130
+ type='RPNHead'),
131
+ type='EUPGHead'),
132
+ test_cfg=None,
133
+ train_cfg=None,
134
+ type='UWSAM')
135
+ optim_wrapper = dict(
136
+ accumulative_counts=4,
137
+ clip_grad=dict(max_norm=1.0, norm_type=2),
138
+ loss_scale=dict(
139
+ backoff_factor=0.5,
140
+ growth_factor=2.0,
141
+ growth_interval=2000,
142
+ init_scale=512.0),
143
+ optimizer=dict(eps=1e-08, lr=0.0001, type='AdamW', weight_decay=0.05),
144
+ type='AmpOptimWrapper')
145
+ param_scheduler = [
146
+ dict(
147
+ begin=0, by_epoch=False, end=500, start_factor=0.001, type='LinearLR'),
148
+ dict(
149
+ begin=0,
150
+ by_epoch=True,
151
+ end=24,
152
+ gamma=0.1,
153
+ milestones=[
154
+ 16,
155
+ 22,
156
+ ],
157
+ type='MultiStepLR'),
158
+ ]
159
+ resume = False
160
+ sam_checkpoint = '/home/cuongvt/My-works/code/UWSAM/sam_vit_h_4b8939.pth'
161
+ test_cfg = dict(type='TestLoop')
162
+ test_dataloader = dict(
163
+ batch_size=1,
164
+ dataset=dict(
165
+ ann_file='annotations/multiclass_test.json',
166
+ data_prefix=dict(img='img/'),
167
+ data_root='/home/cuongvt/My-works/code/UWSAM/UIIS10K/UIIS10K/',
168
+ metainfo=dict(
169
+ classes=(
170
+ 'fish',
171
+ 'reptiles',
172
+ 'arthropoda',
173
+ 'corals',
174
+ 'mollusk',
175
+ 'plants',
176
+ 'ruins',
177
+ 'garbage',
178
+ 'human',
179
+ 'robots',
180
+ )),
181
+ pipeline=[
182
+ dict(type='LoadImageFromFile'),
183
+ dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
184
+ dict(keep_ratio=False, scale=(
185
+ 1024,
186
+ 1024,
187
+ ), type='Resize'),
188
+ dict(type='PackDetInputs'),
189
+ ],
190
+ type='CocoDataset'),
191
+ num_workers=0,
192
+ persistent_workers=False,
193
+ sampler=dict(shuffle=False, type='DefaultSampler'))
194
+ test_evaluator = dict(
195
+ ann_file=
196
+ '/home/cuongvt/My-works/code/UWSAM/UIIS10K/UIIS10K/annotations/multiclass_test.json',
197
+ format_only=False,
198
+ metric=[
199
+ 'bbox',
200
+ 'segm',
201
+ ],
202
+ type='CocoMetric')
203
+ test_pipeline = [
204
+ dict(type='LoadImageFromFile'),
205
+ dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
206
+ dict(keep_ratio=False, scale=(
207
+ 1024,
208
+ 1024,
209
+ ), type='Resize'),
210
+ dict(type='PackDetInputs'),
211
+ ]
212
+ train_cfg = dict(max_epochs=24, type='EpochBasedTrainLoop', val_interval=24)
213
+ train_dataloader = dict(
214
+ batch_size=1,
215
+ dataset=dict(
216
+ ann_file='annotations/multiclass_train.json',
217
+ data_prefix=dict(img='img/'),
218
+ data_root='/home/cuongvt/My-works/code/UWSAM/UIIS10K/UIIS10K/',
219
+ filter_cfg=dict(filter_empty_gt=True, min_size=32),
220
+ metainfo=dict(
221
+ classes=(
222
+ 'fish',
223
+ 'reptiles',
224
+ 'arthropoda',
225
+ 'corals',
226
+ 'mollusk',
227
+ 'plants',
228
+ 'ruins',
229
+ 'garbage',
230
+ 'human',
231
+ 'robots',
232
+ )),
233
+ pipeline=[
234
+ dict(type='LoadImageFromFile'),
235
+ dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
236
+ dict(
237
+ keep_ratio=True,
238
+ ratio_range=(
239
+ 0.8,
240
+ 1.2,
241
+ ),
242
+ scale=(
243
+ 1024,
244
+ 1024,
245
+ ),
246
+ type='RandomResize'),
247
+ dict(
248
+ allow_negative_crop=False,
249
+ crop_size=(
250
+ 1024,
251
+ 1024,
252
+ ),
253
+ type='RandomCrop'),
254
+ dict(keep_ratio=False, scale=(
255
+ 1024,
256
+ 1024,
257
+ ), type='Resize'),
258
+ dict(prob=0.5, type='RandomFlip'),
259
+ dict(type='PackDetInputs'),
260
+ ],
261
+ type='CocoDataset'),
262
+ num_workers=0,
263
+ persistent_workers=False,
264
+ sampler=dict(shuffle=True, type='DefaultSampler'))
265
+ train_pipeline = [
266
+ dict(type='LoadImageFromFile'),
267
+ dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
268
+ dict(
269
+ keep_ratio=True,
270
+ ratio_range=(
271
+ 0.8,
272
+ 1.2,
273
+ ),
274
+ scale=(
275
+ 1024,
276
+ 1024,
277
+ ),
278
+ type='RandomResize'),
279
+ dict(
280
+ allow_negative_crop=False, crop_size=(
281
+ 1024,
282
+ 1024,
283
+ ), type='RandomCrop'),
284
+ dict(keep_ratio=False, scale=(
285
+ 1024,
286
+ 1024,
287
+ ), type='Resize'),
288
+ dict(prob=0.5, type='RandomFlip'),
289
+ dict(type='PackDetInputs'),
290
+ ]
291
+ val_cfg = dict(type='ValLoop')
292
+ val_dataloader = dict(
293
+ batch_size=1,
294
+ dataset=dict(
295
+ ann_file='annotations/multiclass_test.json',
296
+ data_prefix=dict(img='img/'),
297
+ data_root='/home/cuongvt/My-works/code/UWSAM/UIIS10K/UIIS10K/',
298
+ metainfo=dict(
299
+ classes=(
300
+ 'fish',
301
+ 'reptiles',
302
+ 'arthropoda',
303
+ 'corals',
304
+ 'mollusk',
305
+ 'plants',
306
+ 'ruins',
307
+ 'garbage',
308
+ 'human',
309
+ 'robots',
310
+ )),
311
+ pipeline=[
312
+ dict(type='LoadImageFromFile'),
313
+ dict(type='LoadAnnotations', with_bbox=True, with_mask=True),
314
+ dict(keep_ratio=False, scale=(
315
+ 1024,
316
+ 1024,
317
+ ), type='Resize'),
318
+ dict(type='PackDetInputs'),
319
+ ],
320
+ type='CocoDataset'),
321
+ num_workers=0,
322
+ persistent_workers=False,
323
+ sampler=dict(shuffle=False, type='DefaultSampler'))
324
+ val_evaluator = dict(
325
+ ann_file=
326
+ '/home/cuongvt/My-works/code/UWSAM/UIIS10K/UIIS10K/annotations/multiclass_test.json',
327
+ format_only=False,
328
+ metric=[
329
+ 'bbox',
330
+ 'segm',
331
+ ],
332
+ type='CocoMetric')
333
+ vis_backends = [
334
+ dict(type='LocalVisBackend'),
335
+ ]
336
+ visualizer = dict(
337
+ name='visualizer',
338
+ type='DetLocalVisualizer',
339
+ vis_backends=[
340
+ dict(type='LocalVisBackend'),
341
+ ])
342
+ work_dir = './work_dirs/uwsam_teacher_paper'