---
# Training / evaluation / export configuration for the model identified below
# as `pdx_model_name: PP-DocLayoutV3` (architecture: DETR).
#
# Layout: capitalised top-level keys configure named components (model parts,
# datasets, readers, optimiser); lower-case top-level keys are global scalars.
#
# NOTE(review): several values are absolute paths under /root/work/... and are
# specific to the machine that produced this file; adjust before reuse.

# --- Model wiring: component names used by the DETR architecture -----------
DETR:
  backbone: PPHGNetV2
  detr_head: DocLayoutV3Head
  neck: MaskHybridEncoder
  post_process: DocLayoutV3PostProcess
  transformer: DocLayoutV3Transformer

# --- Head and loss ----------------------------------------------------------
DocLayoutV3Head:
  loss:
    aux_loss: true
    # Per-term loss weights.
    loss_coeff:
      bbox: 5
      class: 4
      dice: 5
      giou: 2
      mask: 5
      order: 50
    matcher:
      # Matching-cost weights (same terms as loss_coeff, without `order`).
      matcher_coeff:
        bbox: 5
        class: 4
        dice: 5
        giou: 2
        mask: 5
      name: HungarianMatcher
    name: DocLayoutV3Loss
    use_focal_loss: true
    use_vfl: true
    vfl_iou_type: mask

# --- Metric and post-processing ---------------------------------------------
DocLayoutV3Metric:
  eval_mask: false

DocLayoutV3PostProcess:
  mask_stride: 4
  num_top_queries: 300
  resize_mask: false

# --- Transformer decoder ----------------------------------------------------
DocLayoutV3Transformer:
  activation: relu
  box_noise_scale: 1.0
  dim_feedforward: 1024
  dropout: 0.0
  feat_strides: [8, 16, 32]
  label_noise_ratio: 0.5
  learnt_init_query: false
  mask_enhanced: true
  nhead: 8
  num_denoising: 0
  num_levels: 3
  num_queries: 300
  position_embed_type: sine

# --- Evaluation data --------------------------------------------------------
EvalDataset:
  anno_path: annotations/instance_val.json
  dataset_dir: /root/work/paddleocr-det/PaddleX/paddlex/dataset/handwriting
  image_dir: images
  name: COCOInstSegDataset

EvalReader:
  batch_size: 1
  drop_last: false
  sample_transforms:
    - Decode: {}
    - Resize:
        interp: 2
        keep_ratio: false
        target_size: [800, 800]
    - NormalizeImage:
        mean: [0.0, 0.0, 0.0]
        # Plain string `none` (YAML null would be spelled `null` or `~`).
        norm_type: none
        std: [1.0, 1.0, 1.0]
    - Permute: {}
  shuffle: false

# --- Learning-rate schedule -------------------------------------------------
LearningRate:
  base_lr: 0.0001
  schedulers:
    - !PiecewiseDecay
      gamma: [1.0]
      milestones: [100]
      use_warmup: true
      values: null
    - !LinearWarmup
      epochs: null
      epochs_first: false
      start_factor: 0.001
      steps: 200

# --- Neck (encoder) ---------------------------------------------------------
MaskHybridEncoder:
  encoder_layer:
    activation: gelu
    d_model: 256
    dim_feedforward: 1024
    dropout: 0.0
    name: TransformerLayer
    nhead: 8
  expansion: 1.0
  hidden_dim: 256
  mask_feat_channels: [64, 64]
  num_encoder_layers: 1
  use_encoder_idx: [3]

# --- Optimiser --------------------------------------------------------------
OptimizerBuilder:
  clip_grad_by_norm: 0.1
  optimizer:
    type: AdamW
    weight_decay: 0.0001
  regularizer: false

# --- Backbone ---------------------------------------------------------------
PPHGNetV2:
  arch: L
  freeze_at: 0
  freeze_norm: true
  freeze_stem_only: true
  lr_mult_list: [0.0, 0.05, 0.05, 0.05, 0.05]
  return_idx: [0, 1, 2, 3]

# --- Inference (test) data --------------------------------------------------
TestDataset: !ImageFolder
  anno_path: annotations/instance_val.json
  dataset_dir: /root/work/paddleocr-det/PaddleX/paddlex/dataset/handwriting
  image_dir: ''
  sample_num: -1
  use_default_label: null

TestReader:
  batch_size: 1
  drop_last: false
  inputs_def:
    image_shape: [3, 800, 800]
  sample_transforms:
    - Decode: {}
    - Resize:
        interp: 2
        keep_ratio: false
        target_size: [800, 800]
    - NormalizeImage:
        mean: [0.0, 0.0, 0.0]
        norm_type: none
        std: [1.0, 1.0, 1.0]
    - Permute: {}
  shuffle: false

# --- Training data ----------------------------------------------------------
TrainDataset:
  anno_path: annotations/instance_train.json
  data_fields:
    - image
    - gt_bbox
    - gt_class
    - gt_poly
    - is_crowd
    - gt_read_order
  dataset_dir: /root/work/paddleocr-det/PaddleX/paddlex/dataset/handwriting
  image_dir: images
  name: COCOInstSegDataset

TrainReader:
  batch_size: 8
  # Applied per batch, after the per-sample transforms below.
  batch_transforms:
    - BatchRandomResize:
        keep_ratio: false
        random_interp: true
        random_size: true
        # 800 is listed four times on purpose in the original file.
        target_size: [672, 704, 736, 768, 800, 800, 800, 800, 832, 864, 896, 928]
    - UnpackMask: {}
    - NormalizeImage:
        mean: [0.0, 0.0, 0.0]
        norm_type: none
        std: [1.0, 1.0, 1.0]
    - NormalizeBox: {}
    - BboxXYXY2XYWH: {}
    - Permute: {}
  collate_batch: false
  drop_last: true
  sample_transforms:
    - Decode: {}
    - Poly2MaskPack:
        del_poly: true
    - RandomDistort:
        prob: 0.8
    - UpdateBBoxFromMask: {}
    - RandomExpand:
        fill_value: [123.675, 116.28, 103.53]
        prob: 0.5
        ratio: 1.5
    - RandomCrop:
        prob: 0.8
        use_box_candidates: true
  shuffle: true
  use_shared_memory: true

# --- Global settings --------------------------------------------------------
amp: false
architecture: DETR
ema_decay: 0.9999
ema_decay_type: exponential
ema_filter_no_grad: true
enable_ce: false
epoch: 200
eval: true
eval_size: [800, 800]
export:
  benchmark: false
  fuse_conv_bn: false
  nms: true
  post_process: true
export_with_pir: true
filename: instancesegmodel_PP-DocLayoutV3
find_unused_parameters: true
fleet: false
hidden_dim: 256
log_iter: 10
metric: DocLayoutV3Metric
norm_type: sync_bn
num_classes: 6
num_prototypes: 32
pdx_model_name: PP-DocLayoutV3
pretrain_weights: /root/work/paddleocr-det/PaddleX/PP-DocLayoutV3_pretrained.pdparams
print_flops: false
print_params: false
profiler_options: null
proposals_path: sniper/proposals.json
resume: null
save_dir: /root/work/paddleocr-det/PaddleX/output
save_prediction_only: false
save_proposals: false
snapshot_epoch: 5
target_metrics: mask
to_static: false
uniform_output_enabled: true
use_ema: true
use_focal_loss: true
use_gpu: true
use_iluvatar_gpu: false
use_mlu: false
use_npu: false
use_vdl: true
use_wandb: false
use_xpu: false
vdl_log_dir: /root/work/paddleocr-det/PaddleX/output
with_mask: true
worker_num: 24