| | Global: |
| | debug: false |
| | use_gpu: true |
| | epoch_num: 200 |
| | log_smooth_window: 20 |
| | print_batch_step: 20 |
| | save_model_dir: '/workspace/checkpoints/14-03-2024' |
| | save_epoch_step: 1 |
| | eval_batch_step: [0, 200] |
| | cal_metric_during_train: true |
| | pretrained_model: /workspace/pretrained/best_accuracy |
| | checkpoints: |
| | save_inference_dir: |
| | use_visualdl: false |
| | infer_img: doc/imgs_words/ch/word_1.jpg |
| | character_dict_path: /workspace/vi_dict.txt |
| | max_text_length: &max_text_length 64 |
| | infer_mode: false |
| | use_space_char: true |
| | distributed: true |
| | save_res_path: '/workspace/checkpoints/14-03-2024/predicts_ppocrv4.txt' |
| |
|
| |
|
| | Optimizer: |
| | name: Adam |
| | beta1: 0.9 |
| | beta2: 0.999 |
| | lr: |
| | name: Cosine |
| | learning_rate: 0.001 |
| | warmup_epoch: 5 |
| | regularizer: |
| | name: L2 |
| | factor: 3.0e-05 |
| |
|
| |
|
| | Architecture: |
| | model_type: rec |
| | algorithm: SVTR_LCNet |
| | Transform: |
| | Backbone: |
| | name: PPLCNetV3 |
| | scale: 0.95 |
| | Head: |
| | name: MultiHead |
| | head_list: |
| | - CTCHead: |
| | Neck: |
| | name: svtr |
| | dims: 120 |
| | depth: 2 |
| | hidden_dims: 120 |
| | kernel_size: [1, 3] |
| | use_guide: True |
| | Head: |
| | fc_decay: 0.00001 |
| | - NRTRHead: |
| | nrtr_dim: 384 |
| | max_text_length: *max_text_length |
| |
|
| | Loss: |
| | name: MultiLoss |
| | loss_config_list: |
| | - CTCLoss: |
| | - NRTRLoss: |
| |
|
| | PostProcess: |
| | name: CTCLabelDecode |
| |
|
| | Metric: |
| | name: RecMetric |
| | main_indicator: acc |
| |
|
| | Train: |
| | dataset: |
| | name: MultiScaleDataSet |
| | ds_width: false |
| | data_dir: /workspace/dataset |
| | ext_op_transform_idx: 1 |
| | label_file_list: |
| | - /workspace/dataset/merge_train_list.txt |
| | transforms: |
| | - DecodeImage: |
| | img_mode: BGR |
| | channel_first: false |
| | - RecConAug: |
| | prob: 0.5 |
| | ext_data_num: 2 |
| | image_shape: [48, 320, 3] |
| | max_text_length: *max_text_length |
| | - RecAug: |
| | - MultiLabelEncode: |
| | gtc_encode: NRTRLabelEncode |
| | - KeepKeys: |
| | keep_keys: |
| | - image |
| | - label_ctc |
| | - label_gtc |
| | - length |
| | - valid_ratio |
| | sampler: |
| | name: MultiScaleSampler |
| | scales: [[320, 32], [320, 48], [320, 64]] |
| | first_bs: &bs 512 |
| | fix_bs: false |
| | divided_factor: [8, 16] |
| | is_training: True |
| | loader: |
| | shuffle: true |
| | batch_size_per_card: *bs |
| | drop_last: true |
| | num_workers: 0 |
| | Eval: |
| | dataset: |
| | name: SimpleDataSet |
| | data_dir: /workspace/dataset |
| | label_file_list: |
| | - /workspace/dataset/merge_val_list.txt |
| | transforms: |
| | - DecodeImage: |
| | img_mode: BGR |
| | channel_first: false |
| | - MultiLabelEncode: |
| | gtc_encode: NRTRLabelEncode |
| | - RecResizeImg: |
| | image_shape: [3, 48, 320] |
| | - KeepKeys: |
| | keep_keys: |
| | - image |
| | - label_ctc |
| | - label_gtc |
| | - length |
| | - valid_ratio |
| | loader: |
| | shuffle: false |
| | drop_last: false |
| | batch_size_per_card: 256 |
| | num_workers: 0 |
| |
|