| | CUDNN_BENCHMARK: false |
| | DATALOADER: |
| | ASPECT_RATIO_GROUPING: true |
| | FILTER_EMPTY_ANNOTATIONS: true |
| | NUM_WORKERS: 4 |
| | REPEAT_THRESHOLD: 0.0 |
| | SAMPLER_TRAIN: TrainingSampler |
| | DATASETS: |
| | PRECOMPUTED_PROPOSAL_TOPK_TEST: 1000 |
| | PRECOMPUTED_PROPOSAL_TOPK_TRAIN: 2000 |
| | PROPOSAL_FILES_TEST: [] |
| | PROPOSAL_FILES_TRAIN: [] |
| | TEST: [] |
| | TRAIN: |
| | - coco_lvis_no_part_train |
| | - coco_lvis_paco_part_train |
| | - ppp_train |
| | - ppp_val |
| | - entity_train_lr_with_cls |
| | - entity_train_lr_no_cls |
| | - textocr_train |
| | - mhp_train |
| | GLOBAL: |
| | HACK: 1.0 |
| | INPUT: |
| | COLOR_AUG_SSD: false |
| | CROP: |
| | ENABLED: false |
| | SINGLE_CATEGORY_MAX_AREA: 1.0 |
| | SIZE: |
| | - 0.9 |
| | - 0.9 |
| | TYPE: relative_range |
| | DATASET_MAPPER_NAME: coco_panoptic_lsj |
| | FORMAT: RGB |
| | IMAGE_SIZE: 1024 |
| | MASK_FORMAT: polygon |
| | MAX_SCALE: 2.0 |
| | MAX_SIZE_TEST: 1333 |
| | MAX_SIZE_TRAIN: 1333 |
| | MIN_SCALE: 0.1 |
| | MIN_SIZE_TEST: 800 |
| | MIN_SIZE_TRAIN: |
| | - 800 |
| | MIN_SIZE_TRAIN_SAMPLING: choice |
| | RANDOM_FLIP: horizontal |
| | SIZE_DIVISIBILITY: -1 |
| | MODEL: |
| | ANCHOR_GENERATOR: |
| | ANGLES: |
| | - - -90 |
| | - 0 |
| | - 90 |
| | ASPECT_RATIOS: |
| | - - 0.5 |
| | - 1.0 |
| | - 2.0 |
| | NAME: DefaultAnchorGenerator |
| | OFFSET: 0.0 |
| | SIZES: |
| | - - 32 |
| | - 64 |
| | - 128 |
| | - 256 |
| | - 512 |
| | BACKBONE: |
| | FREEZE_AT: 0 |
| | NAME: D2SwinTransformer |
| | DEVICE: cuda |
| | FPN: |
| | FUSE_TYPE: sum |
| | IN_FEATURES: [] |
| | NORM: '' |
| | OUT_CHANNELS: 256 |
| | KEYPOINT_ON: false |
| | LOAD_PROPOSALS: false |
| | MASK_FORMER: |
| | CLASS_WEIGHT: 0.0 |
| | CLIP: ViT-L-14-336/openai |
| | DEC_LAYERS: 10 |
| | DEEP_SUPERVISION: true |
| | DICE_WEIGHT: 5.0 |
| | DIM_FEEDFORWARD: 2048 |
| | DROPOUT: 0.0 |
| | ENC_LAYERS: 0 |
| | ENFORCE_INPUT_PROJ: false |
| | HIDDEN_DIM: 256 |
| | IMPORTANCE_SAMPLE_RATIO: 0.75 |
| | MASK_WEIGHT: 5.0 |
| | NHEADS: 8 |
| | NO_OBJECT_WEIGHT: 0.1 |
| | NUM_OBJECT_QUERIES: 200 |
| | NUM_PART_QUERIES: 50 |
| | NUM_TEXT_QUERIES: 50 |
| | OVERSAMPLE_RATIO: 3.0 |
| | PRE_NORM: false |
| | SEM_EMBED_DIM: 768 |
| | SIZE_DIVISIBILITY: 32 |
| | TEST: |
| | INSTANCE_ON: true |
| | OBJECT_MASK_THRESHOLD: 0.8 |
| | OVERLAP_THRESHOLD: 0.8 |
| | PANOPTIC_ON: true |
| | SEMANTIC_ON: true |
| | SEM_SEG_POSTPROCESSING_BEFORE_INFERENCE: false |
| | TRAIN_NUM_POINTS: 12544 |
| | TRANSFORMER_DECODER_NAME: MultiScaleMaskedTransformerDecoderPlus |
| | TRANSFORMER_IN_FEATURE: multi_scale_pixel_decoder |
| | MASK_ON: false |
| | META_ARCHITECTURE: MaskFormerPlusNoSem |
| | MULTI_DATASET_TRAIN: true |
| | PANOPTIC_FPN: |
| | COMBINE: |
| | ENABLED: true |
| | INSTANCES_CONFIDENCE_THRESH: 0.5 |
| | OVERLAP_THRESH: 0.5 |
| | STUFF_AREA_LIMIT: 4096 |
| | INSTANCE_LOSS_WEIGHT: 1.0 |
| | PIXEL_MEAN: |
| | - 123.675 |
| | - 116.28 |
| | - 103.53 |
| | PIXEL_STD: |
| | - 58.395 |
| | - 57.12 |
| | - 57.375 |
| | PROPOSAL_GENERATOR: |
| | MIN_SIZE: 0 |
| | NAME: RPN |
| | RESNETS: |
| | DEFORM_MODULATED: false |
| | DEFORM_NUM_GROUPS: 1 |
| | DEFORM_ON_PER_STAGE: |
| | - false |
| | - false |
| | - false |
| | - false |
| | DEPTH: 50 |
| | NORM: FrozenBN |
| | NUM_GROUPS: 1 |
| | OUT_FEATURES: |
| | - res2 |
| | - res3 |
| | - res4 |
| | - res5 |
| | RES2_OUT_CHANNELS: 256 |
| | RES4_DILATION: 1 |
| | RES5_DILATION: 1 |
| | RES5_MULTI_GRID: |
| | - 1 |
| | - 1 |
| | - 1 |
| | STEM_OUT_CHANNELS: 64 |
| | STEM_TYPE: basic |
| | STRIDE_IN_1X1: false |
| | WIDTH_PER_GROUP: 64 |
| | RETINANET: |
| | BBOX_REG_LOSS_TYPE: smooth_l1 |
| | BBOX_REG_WEIGHTS: &id002 |
| | - 1.0 |
| | - 1.0 |
| | - 1.0 |
| | - 1.0 |
| | FOCAL_LOSS_ALPHA: 0.25 |
| | FOCAL_LOSS_GAMMA: 2.0 |
| | IN_FEATURES: |
| | - p3 |
| | - p4 |
| | - p5 |
| | - p6 |
| | - p7 |
| | IOU_LABELS: |
| | - 0 |
| | - -1 |
| | - 1 |
| | IOU_THRESHOLDS: |
| | - 0.4 |
| | - 0.5 |
| | NMS_THRESH_TEST: 0.5 |
| | NORM: '' |
| | NUM_CLASSES: 80 |
| | NUM_CONVS: 4 |
| | PRIOR_PROB: 0.01 |
| | SCORE_THRESH_TEST: 0.05 |
| | SMOOTH_L1_LOSS_BETA: 0.1 |
| | TOPK_CANDIDATES_TEST: 1000 |
| | ROI_BOX_CASCADE_HEAD: |
| | BBOX_REG_WEIGHTS: |
| | - &id001 |
| | - 10.0 |
| | - 10.0 |
| | - 5.0 |
| | - 5.0 |
| | - - 20.0 |
| | - 20.0 |
| | - 10.0 |
| | - 10.0 |
| | - - 30.0 |
| | - 30.0 |
| | - 15.0 |
| | - 15.0 |
| | IOUS: |
| | - 0.5 |
| | - 0.6 |
| | - 0.7 |
| | ROI_BOX_HEAD: |
| | BBOX_REG_LOSS_TYPE: smooth_l1 |
| | BBOX_REG_LOSS_WEIGHT: 1.0 |
| | BBOX_REG_WEIGHTS: *id001 |
| | CLS_AGNOSTIC_BBOX_REG: false |
| | CONV_DIM: 256 |
| | FC_DIM: 1024 |
| | FED_LOSS_FREQ_WEIGHT_POWER: 0.5 |
| | FED_LOSS_NUM_CLASSES: 50 |
| | NAME: '' |
| | NORM: '' |
| | NUM_CONV: 0 |
| | NUM_FC: 0 |
| | POOLER_RESOLUTION: 14 |
| | POOLER_SAMPLING_RATIO: 0 |
| | POOLER_TYPE: ROIAlignV2 |
| | SMOOTH_L1_BETA: 0.0 |
| | TRAIN_ON_PRED_BOXES: false |
| | USE_FED_LOSS: false |
| | USE_SIGMOID_CE: false |
| | ROI_HEADS: |
| | BATCH_SIZE_PER_IMAGE: 512 |
| | IN_FEATURES: |
| | - res4 |
| | IOU_LABELS: |
| | - 0 |
| | - 1 |
| | IOU_THRESHOLDS: |
| | - 0.5 |
| | NAME: Res5ROIHeads |
| | NMS_THRESH_TEST: 0.5 |
| | NUM_CLASSES: 80 |
| | POSITIVE_FRACTION: 0.25 |
| | PROPOSAL_APPEND_GT: true |
| | SCORE_THRESH_TEST: 0.05 |
| | ROI_KEYPOINT_HEAD: |
| | CONV_DIMS: |
| | - 512 |
| | - 512 |
| | - 512 |
| | - 512 |
| | - 512 |
| | - 512 |
| | - 512 |
| | - 512 |
| | LOSS_WEIGHT: 1.0 |
| | MIN_KEYPOINTS_PER_IMAGE: 1 |
| | NAME: KRCNNConvDeconvUpsampleHead |
| | NORMALIZE_LOSS_BY_VISIBLE_KEYPOINTS: true |
| | NUM_KEYPOINTS: 17 |
| | POOLER_RESOLUTION: 14 |
| | POOLER_SAMPLING_RATIO: 0 |
| | POOLER_TYPE: ROIAlignV2 |
| | ROI_MASK_HEAD: |
| | CLS_AGNOSTIC_MASK: false |
| | CONV_DIM: 256 |
| | NAME: MaskRCNNConvUpsampleHead |
| | NORM: '' |
| | NUM_CONV: 0 |
| | POOLER_RESOLUTION: 14 |
| | POOLER_SAMPLING_RATIO: 0 |
| | POOLER_TYPE: ROIAlignV2 |
| | RPN: |
| | BATCH_SIZE_PER_IMAGE: 256 |
| | BBOX_REG_LOSS_TYPE: smooth_l1 |
| | BBOX_REG_LOSS_WEIGHT: 1.0 |
| | BBOX_REG_WEIGHTS: *id002 |
| | BOUNDARY_THRESH: -1 |
| | CONV_DIMS: |
| | - -1 |
| | HEAD_NAME: StandardRPNHead |
| | IN_FEATURES: |
| | - res4 |
| | IOU_LABELS: |
| | - 0 |
| | - -1 |
| | - 1 |
| | IOU_THRESHOLDS: |
| | - 0.3 |
| | - 0.7 |
| | LOSS_WEIGHT: 1.0 |
| | NMS_THRESH: 0.7 |
| | POSITIVE_FRACTION: 0.5 |
| | POST_NMS_TOPK_TEST: 1000 |
| | POST_NMS_TOPK_TRAIN: 2000 |
| | PRE_NMS_TOPK_TEST: 6000 |
| | PRE_NMS_TOPK_TRAIN: 12000 |
| | SMOOTH_L1_BETA: 0.0 |
| | SEM_SEG_HEAD: |
| | ASPP_CHANNELS: 256 |
| | ASPP_DILATIONS: |
| | - 6 |
| | - 12 |
| | - 18 |
| | ASPP_DROPOUT: 0.1 |
| | COMMON_STRIDE: 4 |
| | CONVS_DIM: 256 |
| | DEFORMABLE_TRANSFORMER_ENCODER_IN_FEATURES: |
| | - res3 |
| | - res4 |
| | - res5 |
| | DEFORMABLE_TRANSFORMER_ENCODER_N_HEADS: 8 |
| | DEFORMABLE_TRANSFORMER_ENCODER_N_POINTS: 4 |
| | IGNORE_VALUE: 255 |
| | IN_FEATURES: |
| | - res2 |
| | - res3 |
| | - res4 |
| | - res5 |
| | LOSS_TYPE: hard_pixel_mining |
| | LOSS_WEIGHT: 1.0 |
| | MASK_DIM: 256 |
| | NAME: MaskFormerHead |
| | NORM: GN |
| | NUM_CLASSES: 1 |
| | PIXEL_DECODER_NAME: MSDeformAttnPixelDecoder |
| | PROJECT_CHANNELS: |
| | - 48 |
| | PROJECT_FEATURES: |
| | - res2 |
| | TRANSFORMER_ENC_LAYERS: 6 |
| | USE_DEPTHWISE_SEPARABLE_CONV: false |
| | SWIN: |
| | APE: false |
| | ATTN_DROP_RATE: 0.0 |
| | DEPTHS: |
| | - 2 |
| | - 2 |
| | - 18 |
| | - 2 |
| | DROP_PATH_RATE: 0.3 |
| | DROP_RATE: 0.0 |
| | EMBED_DIM: 192 |
| | MLP_RATIO: 4.0 |
| | NUM_HEADS: |
| | - 6 |
| | - 12 |
| | - 24 |
| | - 48 |
| | OUT_FEATURES: |
| | - res2 |
| | - res3 |
| | - res4 |
| | - res5 |
| | PATCH_NORM: true |
| | PATCH_SIZE: 4 |
| | PRETRAIN_IMG_SIZE: 384 |
| | QKV_BIAS: true |
| | QK_SCALE: null |
| | USE_CHECKPOINT: false |
| | WINDOW_SIZE: 12 |
| | WEIGHTS: weights/coco_panoptic_swinl_100ep/model_final.pkl |
| | OUTPUT_DIR: runs/swinl-all_data-q200+50+50-res1024-bs16-poly50k-nosem-hasnoobj-debug |
| | SEED: -1 |
| | SOLVER: |
| | AMP: |
| | ENABLED: true |
| | BACKBONE_MULTIPLIER: 0.1 |
| | BASE_LR: 0.0001 |
| | BASE_LR_END: 0.0 |
| | BIAS_LR_FACTOR: 1.0 |
| | CHECKPOINT_PERIOD: 5000 |
| | CLIP_GRADIENTS: |
| | CLIP_TYPE: full_model |
| | CLIP_VALUE: 0.01 |
| | ENABLED: true |
| | NORM_TYPE: 2.0 |
| | GAMMA: 0.1 |
| | IMS_PER_BATCH: 16 |
| | LR_SCHEDULER_NAME: WarmupPolyLR |
| | MAX_ITER: 100000 |
| | MOMENTUM: 0.9 |
| | NESTEROV: false |
| | NUM_DECAYS: 3 |
| | OPTIMIZER: ADAMW |
| | POLY_LR_CONSTANT_ENDING: 0.0 |
| | POLY_LR_POWER: 0.9 |
| | REFERENCE_WORLD_SIZE: 0 |
| | RESCALE_INTERVAL: false |
| | STEPS: |
| | - 655556 |
| | - 710184 |
| | WARMUP_FACTOR: 1.0 |
| | WARMUP_ITERS: 10 |
| | WARMUP_METHOD: linear |
| | WEIGHT_DECAY: 0.05 |
| | WEIGHT_DECAY_BIAS: null |
| | WEIGHT_DECAY_EMBED: 0.0 |
| | WEIGHT_DECAY_NORM: 0.0 |
| | TEST: |
| | AUG: |
| | ENABLED: false |
| | FLIP: true |
| | MAX_SIZE: 4000 |
| | MIN_SIZES: |
| | - 400 |
| | - 500 |
| | - 600 |
| | - 700 |
| | - 800 |
| | - 900 |
| | - 1000 |
| | - 1100 |
| | - 1200 |
| | DETECTIONS_PER_IMAGE: 100 |
| | EVAL_PERIOD: 100000000 |
| | EXPECTED_RESULTS: [] |
| | KEYPOINT_OKS_SIGMAS: [] |
| | PRECISE_BN: |
| | ENABLED: false |
| | NUM_ITER: 200 |
| | VERSION: 2 |
| | VIS_PERIOD: 0 |
| | WANDB: |
| | NAME: swinl-all_data-q200+50+50-res1024-bs16-poly50k-nosem-hasnoobj-debug |
| | PROJECT: mask2former |
| |
|