CVRPDataset commited on
Commit
527792c
·
verified ·
1 Parent(s): 8413c5a

Delete model_configs/CVRP_mask2former.py

Browse files
Files changed (1) hide show
  1. model_configs/CVRP_mask2former.py +0 -572
model_configs/CVRP_mask2former.py DELETED
@@ -1,572 +0,0 @@
1
- auto_scale_lr = dict(base_batch_size=16, enable=False)
2
- backbone_embed_multi = dict(decay_mult=0.0, lr_mult=0.1)
3
- backbone_norm_multi = dict(decay_mult=0.0, lr_mult=0.1)
4
- crop_size = (
5
- 512,
6
- 512,
7
- )
8
- custom_keys = dict({
9
- 'absolute_pos_embed':
10
- dict(decay_mult=0.0, lr_mult=0.1),
11
- 'backbone':
12
- dict(decay_mult=1.0, lr_mult=0.1),
13
- 'backbone.norm':
14
- dict(decay_mult=0.0, lr_mult=0.1),
15
- 'backbone.patch_embed.norm':
16
- dict(decay_mult=0.0, lr_mult=0.1),
17
- 'backbone.stages.0.blocks.0.norm':
18
- dict(decay_mult=0.0, lr_mult=0.1),
19
- 'backbone.stages.0.blocks.1.norm':
20
- dict(decay_mult=0.0, lr_mult=0.1),
21
- 'backbone.stages.0.downsample.norm':
22
- dict(decay_mult=0.0, lr_mult=0.1),
23
- 'backbone.stages.1.blocks.0.norm':
24
- dict(decay_mult=0.0, lr_mult=0.1),
25
- 'backbone.stages.1.blocks.1.norm':
26
- dict(decay_mult=0.0, lr_mult=0.1),
27
- 'backbone.stages.1.downsample.norm':
28
- dict(decay_mult=0.0, lr_mult=0.1),
29
- 'backbone.stages.2.blocks.0.norm':
30
- dict(decay_mult=0.0, lr_mult=0.1),
31
- 'backbone.stages.2.blocks.1.norm':
32
- dict(decay_mult=0.0, lr_mult=0.1),
33
- 'backbone.stages.2.blocks.10.norm':
34
- dict(decay_mult=0.0, lr_mult=0.1),
35
- 'backbone.stages.2.blocks.11.norm':
36
- dict(decay_mult=0.0, lr_mult=0.1),
37
- 'backbone.stages.2.blocks.12.norm':
38
- dict(decay_mult=0.0, lr_mult=0.1),
39
- 'backbone.stages.2.blocks.13.norm':
40
- dict(decay_mult=0.0, lr_mult=0.1),
41
- 'backbone.stages.2.blocks.14.norm':
42
- dict(decay_mult=0.0, lr_mult=0.1),
43
- 'backbone.stages.2.blocks.15.norm':
44
- dict(decay_mult=0.0, lr_mult=0.1),
45
- 'backbone.stages.2.blocks.16.norm':
46
- dict(decay_mult=0.0, lr_mult=0.1),
47
- 'backbone.stages.2.blocks.17.norm':
48
- dict(decay_mult=0.0, lr_mult=0.1),
49
- 'backbone.stages.2.blocks.2.norm':
50
- dict(decay_mult=0.0, lr_mult=0.1),
51
- 'backbone.stages.2.blocks.3.norm':
52
- dict(decay_mult=0.0, lr_mult=0.1),
53
- 'backbone.stages.2.blocks.4.norm':
54
- dict(decay_mult=0.0, lr_mult=0.1),
55
- 'backbone.stages.2.blocks.5.norm':
56
- dict(decay_mult=0.0, lr_mult=0.1),
57
- 'backbone.stages.2.blocks.6.norm':
58
- dict(decay_mult=0.0, lr_mult=0.1),
59
- 'backbone.stages.2.blocks.7.norm':
60
- dict(decay_mult=0.0, lr_mult=0.1),
61
- 'backbone.stages.2.blocks.8.norm':
62
- dict(decay_mult=0.0, lr_mult=0.1),
63
- 'backbone.stages.2.blocks.9.norm':
64
- dict(decay_mult=0.0, lr_mult=0.1),
65
- 'backbone.stages.2.downsample.norm':
66
- dict(decay_mult=0.0, lr_mult=0.1),
67
- 'backbone.stages.3.blocks.0.norm':
68
- dict(decay_mult=0.0, lr_mult=0.1),
69
- 'backbone.stages.3.blocks.1.norm':
70
- dict(decay_mult=0.0, lr_mult=0.1),
71
- 'level_embed':
72
- dict(decay_mult=0.0, lr_mult=1.0),
73
- 'query_embed':
74
- dict(decay_mult=0.0, lr_mult=1.0),
75
- 'query_feat':
76
- dict(decay_mult=0.0, lr_mult=1.0),
77
- 'relative_position_bias_table':
78
- dict(decay_mult=0.0, lr_mult=0.1)
79
- })
80
- data_preprocessor = dict(
81
- bgr_to_rgb=True,
82
- mean=[
83
- 123.675,
84
- 116.28,
85
- 103.53,
86
- ],
87
- pad_val=0,
88
- seg_pad_val=255,
89
- size=(
90
- 640,
91
- 640,
92
- ),
93
- std=[
94
- 58.395,
95
- 57.12,
96
- 57.375,
97
- ],
98
- type='SegDataPreProcessor')
99
- data_root = 'CVRPDataset/'
100
- dataset_type = 'CVRPDataset'
101
- default_hooks = dict(
102
- checkpoint=dict(
103
- by_epoch=False,
104
- interval=2500,
105
- max_keep_ckpts=1,
106
- save_best='mIoU',
107
- type='CheckpointHook'),
108
- logger=dict(interval=100, log_metric_by_epoch=False, type='LoggerHook'),
109
- param_scheduler=dict(type='ParamSchedulerHook'),
110
- sampler_seed=dict(type='DistSamplerSeedHook'),
111
- timer=dict(type='IterTimerHook'),
112
- visualization=dict(type='SegVisualizationHook'))
113
- default_scope = 'mmseg'
114
- depths = [
115
- 2,
116
- 2,
117
- 18,
118
- 2,
119
- ]
120
- embed_multi = dict(decay_mult=0.0, lr_mult=1.0)
121
- env_cfg = dict(
122
- cudnn_benchmark=True,
123
- dist_cfg=dict(backend='nccl'),
124
- mp_cfg=dict(mp_start_method='fork', opencv_num_threads=0))
125
- img_ratios = [
126
- 0.5,
127
- 0.75,
128
- 1.0,
129
- 1.25,
130
- 1.5,
131
- 1.75,
132
- ]
133
- load_from = None
134
- log_level = 'INFO'
135
- log_processor = dict(by_epoch=False)
136
- model = dict(
137
- backbone=dict(
138
- attn_drop_rate=0.0,
139
- depths=[
140
- 2,
141
- 2,
142
- 18,
143
- 2,
144
- ],
145
- drop_path_rate=0.3,
146
- drop_rate=0.0,
147
- embed_dims=192,
148
- frozen_stages=-1,
149
- init_cfg=dict(
150
- checkpoint=
151
- 'https://download.openmmlab.com/mmsegmentation/v0.5/pretrain/swin/swin_large_patch4_window12_384_22k_20220412-6580f57d.pth',
152
- type='Pretrained'),
153
- mlp_ratio=4,
154
- num_heads=[
155
- 6,
156
- 12,
157
- 24,
158
- 48,
159
- ],
160
- out_indices=(
161
- 0,
162
- 1,
163
- 2,
164
- 3,
165
- ),
166
- patch_norm=True,
167
- pretrain_img_size=384,
168
- qk_scale=None,
169
- qkv_bias=True,
170
- type='SwinTransformer',
171
- window_size=12,
172
- with_cp=False),
173
- data_preprocessor=dict(
174
- bgr_to_rgb=True,
175
- mean=[
176
- 123.675,
177
- 116.28,
178
- 103.53,
179
- ],
180
- pad_val=0,
181
- seg_pad_val=255,
182
- size=(
183
- 512,
184
- 512,
185
- ),
186
- std=[
187
- 58.395,
188
- 57.12,
189
- 57.375,
190
- ],
191
- type='SegDataPreProcessor'),
192
- decode_head=dict(
193
- align_corners=False,
194
- enforce_decoder_input_project=False,
195
- feat_channels=256,
196
- in_channels=[
197
- 192,
198
- 384,
199
- 768,
200
- 1536,
201
- ],
202
- loss_cls=dict(
203
- class_weight=[
204
- 1.0,
205
- 1.0,
206
- 0.1,
207
- ],
208
- loss_weight=2.0,
209
- reduction='mean',
210
- type='mmdet.CrossEntropyLoss',
211
- use_sigmoid=False),
212
- loss_dice=dict(
213
- activate=True,
214
- eps=1.0,
215
- loss_weight=5.0,
216
- naive_dice=True,
217
- reduction='mean',
218
- type='mmdet.DiceLoss',
219
- use_sigmoid=True),
220
- loss_mask=dict(
221
- loss_weight=5.0,
222
- reduction='mean',
223
- type='mmdet.CrossEntropyLoss',
224
- use_sigmoid=True),
225
- num_classes=2,
226
- num_queries=100,
227
- num_transformer_feat_level=3,
228
- out_channels=256,
229
- pixel_decoder=dict(
230
- act_cfg=dict(type='ReLU'),
231
- encoder=dict(
232
- init_cfg=None,
233
- layer_cfg=dict(
234
- ffn_cfg=dict(
235
- act_cfg=dict(inplace=True, type='ReLU'),
236
- embed_dims=256,
237
- feedforward_channels=1024,
238
- ffn_drop=0.0,
239
- num_fcs=2),
240
- self_attn_cfg=dict(
241
- batch_first=True,
242
- dropout=0.0,
243
- embed_dims=256,
244
- im2col_step=64,
245
- init_cfg=None,
246
- norm_cfg=None,
247
- num_heads=8,
248
- num_levels=3,
249
- num_points=4)),
250
- num_layers=6),
251
- init_cfg=None,
252
- norm_cfg=dict(num_groups=32, type='GN'),
253
- num_outs=3,
254
- positional_encoding=dict(normalize=True, num_feats=128),
255
- type='mmdet.MSDeformAttnPixelDecoder'),
256
- positional_encoding=dict(normalize=True, num_feats=128),
257
- strides=[
258
- 4,
259
- 8,
260
- 16,
261
- 32,
262
- ],
263
- train_cfg=dict(
264
- assigner=dict(
265
- match_costs=[
266
- dict(type='mmdet.ClassificationCost', weight=2.0),
267
- dict(
268
- type='mmdet.CrossEntropyLossCost',
269
- use_sigmoid=True,
270
- weight=5.0),
271
- dict(
272
- eps=1.0,
273
- pred_act=True,
274
- type='mmdet.DiceCost',
275
- weight=5.0),
276
- ],
277
- type='mmdet.HungarianAssigner'),
278
- importance_sample_ratio=0.75,
279
- num_points=12544,
280
- oversample_ratio=3.0,
281
- sampler=dict(type='mmdet.MaskPseudoSampler')),
282
- transformer_decoder=dict(
283
- init_cfg=None,
284
- layer_cfg=dict(
285
- cross_attn_cfg=dict(
286
- attn_drop=0.0,
287
- batch_first=True,
288
- dropout_layer=None,
289
- embed_dims=256,
290
- num_heads=8,
291
- proj_drop=0.0),
292
- ffn_cfg=dict(
293
- act_cfg=dict(inplace=True, type='ReLU'),
294
- add_identity=True,
295
- dropout_layer=None,
296
- embed_dims=256,
297
- feedforward_channels=2048,
298
- ffn_drop=0.0,
299
- num_fcs=2),
300
- self_attn_cfg=dict(
301
- attn_drop=0.0,
302
- batch_first=True,
303
- dropout_layer=None,
304
- embed_dims=256,
305
- num_heads=8,
306
- proj_drop=0.0)),
307
- num_layers=9,
308
- return_intermediate=True),
309
- type='Mask2FormerHead'),
310
- test_cfg=dict(mode='whole'),
311
- train_cfg=dict(),
312
- type='EncoderDecoder')
313
- norm_cfg = dict(requires_grad=True, type='BN')
314
- num_classes = 150
315
- optim_wrapper = dict(
316
- clip_grad=dict(max_norm=0.01, norm_type=2),
317
- optimizer=dict(
318
- betas=(
319
- 0.9,
320
- 0.999,
321
- ),
322
- eps=1e-08,
323
- lr=0.0001,
324
- type='AdamW',
325
- weight_decay=0.05),
326
- paramwise_cfg=dict(
327
- custom_keys=dict({
328
- 'absolute_pos_embed':
329
- dict(decay_mult=0.0, lr_mult=0.1),
330
- 'backbone':
331
- dict(decay_mult=1.0, lr_mult=0.1),
332
- 'backbone.norm':
333
- dict(decay_mult=0.0, lr_mult=0.1),
334
- 'backbone.patch_embed.norm':
335
- dict(decay_mult=0.0, lr_mult=0.1),
336
- 'backbone.stages.0.blocks.0.norm':
337
- dict(decay_mult=0.0, lr_mult=0.1),
338
- 'backbone.stages.0.blocks.1.norm':
339
- dict(decay_mult=0.0, lr_mult=0.1),
340
- 'backbone.stages.0.downsample.norm':
341
- dict(decay_mult=0.0, lr_mult=0.1),
342
- 'backbone.stages.1.blocks.0.norm':
343
- dict(decay_mult=0.0, lr_mult=0.1),
344
- 'backbone.stages.1.blocks.1.norm':
345
- dict(decay_mult=0.0, lr_mult=0.1),
346
- 'backbone.stages.1.downsample.norm':
347
- dict(decay_mult=0.0, lr_mult=0.1),
348
- 'backbone.stages.2.blocks.0.norm':
349
- dict(decay_mult=0.0, lr_mult=0.1),
350
- 'backbone.stages.2.blocks.1.norm':
351
- dict(decay_mult=0.0, lr_mult=0.1),
352
- 'backbone.stages.2.blocks.10.norm':
353
- dict(decay_mult=0.0, lr_mult=0.1),
354
- 'backbone.stages.2.blocks.11.norm':
355
- dict(decay_mult=0.0, lr_mult=0.1),
356
- 'backbone.stages.2.blocks.12.norm':
357
- dict(decay_mult=0.0, lr_mult=0.1),
358
- 'backbone.stages.2.blocks.13.norm':
359
- dict(decay_mult=0.0, lr_mult=0.1),
360
- 'backbone.stages.2.blocks.14.norm':
361
- dict(decay_mult=0.0, lr_mult=0.1),
362
- 'backbone.stages.2.blocks.15.norm':
363
- dict(decay_mult=0.0, lr_mult=0.1),
364
- 'backbone.stages.2.blocks.16.norm':
365
- dict(decay_mult=0.0, lr_mult=0.1),
366
- 'backbone.stages.2.blocks.17.norm':
367
- dict(decay_mult=0.0, lr_mult=0.1),
368
- 'backbone.stages.2.blocks.2.norm':
369
- dict(decay_mult=0.0, lr_mult=0.1),
370
- 'backbone.stages.2.blocks.3.norm':
371
- dict(decay_mult=0.0, lr_mult=0.1),
372
- 'backbone.stages.2.blocks.4.norm':
373
- dict(decay_mult=0.0, lr_mult=0.1),
374
- 'backbone.stages.2.blocks.5.norm':
375
- dict(decay_mult=0.0, lr_mult=0.1),
376
- 'backbone.stages.2.blocks.6.norm':
377
- dict(decay_mult=0.0, lr_mult=0.1),
378
- 'backbone.stages.2.blocks.7.norm':
379
- dict(decay_mult=0.0, lr_mult=0.1),
380
- 'backbone.stages.2.blocks.8.norm':
381
- dict(decay_mult=0.0, lr_mult=0.1),
382
- 'backbone.stages.2.blocks.9.norm':
383
- dict(decay_mult=0.0, lr_mult=0.1),
384
- 'backbone.stages.2.downsample.norm':
385
- dict(decay_mult=0.0, lr_mult=0.1),
386
- 'backbone.stages.3.blocks.0.norm':
387
- dict(decay_mult=0.0, lr_mult=0.1),
388
- 'backbone.stages.3.blocks.1.norm':
389
- dict(decay_mult=0.0, lr_mult=0.1),
390
- 'level_embed':
391
- dict(decay_mult=0.0, lr_mult=1.0),
392
- 'query_embed':
393
- dict(decay_mult=0.0, lr_mult=1.0),
394
- 'query_feat':
395
- dict(decay_mult=0.0, lr_mult=1.0),
396
- 'relative_position_bias_table':
397
- dict(decay_mult=0.0, lr_mult=0.1)
398
- }),
399
- norm_decay_mult=0.0),
400
- type='OptimWrapper')
401
- optimizer = dict(
402
- betas=(
403
- 0.9,
404
- 0.999,
405
- ),
406
- eps=1e-08,
407
- lr=0.0001,
408
- type='AdamW',
409
- weight_decay=0.05)
410
- param_scheduler = [
411
- dict(
412
- begin=0,
413
- by_epoch=False,
414
- end=160000,
415
- eta_min=0,
416
- power=0.9,
417
- type='PolyLR'),
418
- ]
419
- pretrained = 'https://download.openmmlab.com/mmsegmentation/v0.5/pretrain/swin/swin_large_patch4_window12_384_22k_20220412-6580f57d.pth'
420
- randomness = dict(seed=0)
421
- resume = False
422
- test_cfg = dict(type='TestLoop')
423
- test_dataloader = dict(
424
- batch_size=1,
425
- dataset=dict(
426
- data_prefix=dict(img_path='img_dir/val', seg_map_path='ann_dir/val'),
427
- data_root='CVRPDataset/',
428
- pipeline=[
429
- dict(type='LoadImageFromFile'),
430
- dict(keep_ratio=True, scale=(
431
- 2048,
432
- 1024,
433
- ), type='Resize'),
434
- dict(type='LoadAnnotations'),
435
- dict(type='PackSegInputs'),
436
- ],
437
- type='CVRPDataset'),
438
- num_workers=4,
439
- persistent_workers=True,
440
- sampler=dict(shuffle=False, type='DefaultSampler'))
441
- test_evaluator = dict(
442
- iou_metrics=[
443
- 'mIoU',
444
- 'mDice',
445
- 'mFscore',
446
- ], type='IoUMetric')
447
- test_pipeline = [
448
- dict(type='LoadImageFromFile'),
449
- dict(keep_ratio=True, scale=(
450
- 2048,
451
- 1024,
452
- ), type='Resize'),
453
- dict(type='LoadAnnotations'),
454
- dict(type='PackSegInputs'),
455
- ]
456
- train_cfg = dict(max_iters=20000, type='IterBasedTrainLoop', val_interval=500)
457
- train_dataloader = dict(
458
- batch_size=2,
459
- dataset=dict(
460
- data_prefix=dict(
461
- img_path='img_dir/train', seg_map_path='ann_dir/train'),
462
- data_root='CVRPDataset/',
463
- pipeline=[
464
- dict(type='LoadImageFromFile'),
465
- dict(type='LoadAnnotations'),
466
- dict(
467
- keep_ratio=True,
468
- ratio_range=(
469
- 0.5,
470
- 2.0,
471
- ),
472
- scale=(
473
- 2048,
474
- 1024,
475
- ),
476
- type='RandomResize'),
477
- dict(
478
- cat_max_ratio=0.75, crop_size=(
479
- 512,
480
- 512,
481
- ), type='RandomCrop'),
482
- dict(prob=0.5, type='RandomFlip'),
483
- dict(type='PhotoMetricDistortion'),
484
- dict(type='PackSegInputs'),
485
- ],
486
- type='CVRPDataset'),
487
- num_workers=2,
488
- persistent_workers=True,
489
- sampler=dict(shuffle=True, type='InfiniteSampler'))
490
- train_pipeline = [
491
- dict(type='LoadImageFromFile'),
492
- dict(type='LoadAnnotations'),
493
- dict(
494
- keep_ratio=True,
495
- ratio_range=(
496
- 0.5,
497
- 2.0,
498
- ),
499
- scale=(
500
- 2048,
501
- 1024,
502
- ),
503
- type='RandomResize'),
504
- dict(cat_max_ratio=0.75, crop_size=(
505
- 512,
506
- 512,
507
- ), type='RandomCrop'),
508
- dict(prob=0.5, type='RandomFlip'),
509
- dict(type='PhotoMetricDistortion'),
510
- dict(type='PackSegInputs'),
511
- ]
512
- tta_model = dict(type='SegTTAModel')
513
- tta_pipeline = [
514
- dict(file_client_args=dict(backend='disk'), type='LoadImageFromFile'),
515
- dict(
516
- transforms=[
517
- [
518
- dict(keep_ratio=True, scale_factor=0.5, type='Resize'),
519
- dict(keep_ratio=True, scale_factor=0.75, type='Resize'),
520
- dict(keep_ratio=True, scale_factor=1.0, type='Resize'),
521
- dict(keep_ratio=True, scale_factor=1.25, type='Resize'),
522
- dict(keep_ratio=True, scale_factor=1.5, type='Resize'),
523
- dict(keep_ratio=True, scale_factor=1.75, type='Resize'),
524
- ],
525
- [
526
- dict(direction='horizontal', prob=0.0, type='RandomFlip'),
527
- dict(direction='horizontal', prob=1.0, type='RandomFlip'),
528
- ],
529
- [
530
- dict(type='LoadAnnotations'),
531
- ],
532
- [
533
- dict(type='PackSegInputs'),
534
- ],
535
- ],
536
- type='TestTimeAug'),
537
- ]
538
- val_cfg = dict(type='ValLoop')
539
- val_dataloader = dict(
540
- batch_size=1,
541
- dataset=dict(
542
- data_prefix=dict(img_path='img_dir/val', seg_map_path='ann_dir/val'),
543
- data_root='CVRPDataset/',
544
- pipeline=[
545
- dict(type='LoadImageFromFile'),
546
- dict(keep_ratio=True, scale=(
547
- 2048,
548
- 1024,
549
- ), type='Resize'),
550
- dict(type='LoadAnnotations'),
551
- dict(type='PackSegInputs'),
552
- ],
553
- type='CVRPDataset'),
554
- num_workers=4,
555
- persistent_workers=True,
556
- sampler=dict(shuffle=False, type='DefaultSampler'))
557
- val_evaluator = dict(
558
- iou_metrics=[
559
- 'mIoU',
560
- 'mDice',
561
- 'mFscore',
562
- ], type='IoUMetric')
563
- vis_backends = [
564
- dict(type='LocalVisBackend'),
565
- ]
566
- visualizer = dict(
567
- name='visualizer',
568
- type='SegLocalVisualizer',
569
- vis_backends=[
570
- dict(type='LocalVisBackend'),
571
- ])
572
- work_dir = './work_dirs/CVRPDataset_mask2former'