anhbn committed on
Commit
d250ac2
·
verified ·
1 Parent(s): fb4a8ec

Upload config.yml with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.yml +138 -0
config.yml ADDED
@@ -0,0 +1,138 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ Global:
2
+ debug: false
3
+ use_gpu: true
4
+ epoch_num: 200
5
+ log_smooth_window: 20
6
+ print_batch_step: 20
7
+ save_model_dir: '/workspace/checkpoints/14-03-2024'
8
+ save_epoch_step: 1
9
+ eval_batch_step: [0, 200]
10
+ cal_metric_during_train: true
11
+ pretrained_model: /workspace/pretrained/best_accuracy
12
+ checkpoints:
13
+ save_inference_dir:
14
+ use_visualdl: false
15
+ infer_img: doc/imgs_words/ch/word_1.jpg
16
+ character_dict_path: /workspace/vi_dict.txt
17
+ max_text_length: &max_text_length 64
18
+ infer_mode: false
19
+ use_space_char: true
20
+ distributed: true
21
+ save_res_path: '/workspace/checkpoints/13-03-2024/predicts_ppocrv4.txt'
22
+
23
+
24
+ Optimizer:
25
+ name: Adam
26
+ beta1: 0.9
27
+ beta2: 0.999
28
+ lr:
29
+ name: Cosine
30
+ learning_rate: 0.001
31
+ warmup_epoch: 5
32
+ regularizer:
33
+ name: L2
34
+ factor: 3.0e-05
35
+
36
+
37
+ Architecture:
38
+ model_type: rec
39
+ algorithm: SVTR_LCNet
40
+ Transform:
41
+ Backbone:
42
+ name: PPLCNetV3
43
+ scale: 0.95
44
+ Head:
45
+ name: MultiHead
46
+ head_list:
47
+ - CTCHead:
48
+ Neck:
49
+ name: svtr
50
+ dims: 120
51
+ depth: 2
52
+ hidden_dims: 120
53
+ kernel_size: [1, 3]
54
+ use_guide: True
55
+ Head:
56
+ fc_decay: 0.00001
57
+ - NRTRHead:
58
+ nrtr_dim: 384
59
+ max_text_length: *max_text_length
60
+
61
+ Loss:
62
+ name: MultiLoss
63
+ loss_config_list:
64
+ - CTCLoss:
65
+ - NRTRLoss:
66
+
67
+ PostProcess:
68
+ name: CTCLabelDecode
69
+
70
+ Metric:
71
+ name: RecMetric
72
+ main_indicator: acc
73
+
74
+ Train:
75
+ dataset:
76
+ name: MultiScaleDataSet
77
+ ds_width: false
78
+ data_dir: /workspace/dataset
79
+ ext_op_transform_idx: 1
80
+ label_file_list:
81
+ - /workspace/dataset/merge_train_list.txt
82
+ transforms:
83
+ - DecodeImage:
84
+ img_mode: BGR
85
+ channel_first: false
86
+ - RecConAug:
87
+ prob: 0.5
88
+ ext_data_num: 2
89
+ image_shape: [48, 320, 3]
90
+ max_text_length: *max_text_length
91
+ - RecAug:
92
+ - MultiLabelEncode:
93
+ gtc_encode: NRTRLabelEncode
94
+ - KeepKeys:
95
+ keep_keys:
96
+ - image
97
+ - label_ctc
98
+ - label_gtc
99
+ - length
100
+ - valid_ratio
101
+ sampler:
102
+ name: MultiScaleSampler
103
+ scales: [[320, 32], [320, 48], [320, 64]]
104
+ first_bs: &bs 512
105
+ fix_bs: false
106
+ divided_factor: [8, 16] # [width, height]
107
+ is_training: True
108
+ loader:
109
+ shuffle: true
110
+ batch_size_per_card: *bs
111
+ drop_last: true
112
+ num_workers: 0
113
+ Eval:
114
+ dataset:
115
+ name: SimpleDataSet
116
+ data_dir: /workspace/dataset
117
+ label_file_list:
118
+ - /workspace/dataset/merge_val_list.txt
119
+ transforms:
120
+ - DecodeImage:
121
+ img_mode: BGR
122
+ channel_first: false
123
+ - MultiLabelEncode:
124
+ gtc_encode: NRTRLabelEncode
125
+ - RecResizeImg:
126
+ image_shape: [3, 48, 320]
127
+ - KeepKeys:
128
+ keep_keys:
129
+ - image
130
+ - label_ctc
131
+ - label_gtc
132
+ - length
133
+ - valid_ratio
134
+ loader:
135
+ shuffle: false
136
+ drop_last: false
137
+ batch_size_per_card: 256
138
+ num_workers: 0