kwanwoo02 committed on
Commit
7951901
·
verified ·
1 Parent(s): e0b62ee

Upload folder using huggingface_hub

Browse files
.gitattributes CHANGED
@@ -33,3 +33,9 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ Multilingual_PP-OCRv3_det_infer/inference.pdiparams filter=lfs diff=lfs merge=lfs -text
37
+ Multilingual_PP-OCRv3_det_infer/inference.pdmodel filter=lfs diff=lfs merge=lfs -text
38
+ ch_ppocr_mobile_v2.0_cls_infer/inference.pdiparams filter=lfs diff=lfs merge=lfs -text
39
+ ch_ppocr_mobile_v2.0_cls_infer/inference.pdmodel filter=lfs diff=lfs merge=lfs -text
40
+ korean_PP-OCRv4_rec_infer/inference.pdiparams filter=lfs diff=lfs merge=lfs -text
41
+ korean_PP-OCRv4_rec_infer/inference.pdmodel filter=lfs diff=lfs merge=lfs -text
Color_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45c42c8d3d2d3e27d34b43916357f6a946291712ed4fdbe1651c9b8877a0b5d5
3
+ size 583206801
Detection_config.yaml ADDED
@@ -0,0 +1,326 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ CUDNN_BENCHMARK: false
2
+ DATALOADER:
3
+ ASPECT_RATIO_GROUPING: true
4
+ FILTER_EMPTY_ANNOTATIONS: true
5
+ NUM_WORKERS: 4
6
+ REPEAT_THRESHOLD: 0.0
7
+ SAMPLER_TRAIN: TrainingSampler
8
+ DATASETS:
9
+ PRECOMPUTED_PROPOSAL_TOPK_TEST: 1000
10
+ PRECOMPUTED_PROPOSAL_TOPK_TRAIN: 2000
11
+ PROPOSAL_FILES_TEST: []
12
+ PROPOSAL_FILES_TRAIN: []
13
+ TEST: &id001
14
+ - balloon
15
+ TRAIN: *id001
16
+ GLOBAL:
17
+ HACK: 1.0
18
+ INPUT:
19
+ CROP:
20
+ ENABLED: false
21
+ SIZE:
22
+ - 0.9
23
+ - 0.9
24
+ TYPE: relative_range
25
+ FORMAT: BGR
26
+ MASK_FORMAT: polygon
27
+ MAX_SIZE_TEST: 1333
28
+ MAX_SIZE_TRAIN: 1333
29
+ MIN_SIZE_TEST: 800
30
+ MIN_SIZE_TRAIN:
31
+ - 640
32
+ - 672
33
+ - 704
34
+ - 736
35
+ - 768
36
+ - 800
37
+ MIN_SIZE_TRAIN_SAMPLING: choice
38
+ RANDOM_FLIP: horizontal
39
+ MODEL:
40
+ ANCHOR_GENERATOR:
41
+ ANGLES:
42
+ - - -90
43
+ - 0
44
+ - 90
45
+ ASPECT_RATIOS:
46
+ - - 0.5
47
+ - 1.0
48
+ - 2.0
49
+ NAME: DefaultAnchorGenerator
50
+ OFFSET: 0.0
51
+ SIZES:
52
+ - - 32
53
+ - - 64
54
+ - - 128
55
+ - - 256
56
+ - - 512
57
+ BACKBONE:
58
+ FREEZE_AT: 2
59
+ NAME: build_resnet_fpn_backbone
60
+ DEVICE: cuda
61
+ FPN:
62
+ FUSE_TYPE: sum
63
+ IN_FEATURES:
64
+ - res2
65
+ - res3
66
+ - res4
67
+ - res5
68
+ NORM: ''
69
+ OUT_CHANNELS: 256
70
+ KEYPOINT_ON: false
71
+ LOAD_PROPOSALS: false
72
+ MASK_ON: true
73
+ META_ARCHITECTURE: GeneralizedRCNN
74
+ PANOPTIC_FPN:
75
+ COMBINE:
76
+ ENABLED: true
77
+ INSTANCES_CONFIDENCE_THRESH: 0.5
78
+ OVERLAP_THRESH: 0.5
79
+ STUFF_AREA_LIMIT: 4096
80
+ INSTANCE_LOSS_WEIGHT: 1.0
81
+ PIXEL_MEAN:
82
+ - 103.53
83
+ - 116.28
84
+ - 123.675
85
+ PIXEL_STD:
86
+ - 57.375
87
+ - 57.12
88
+ - 58.395
89
+ PROPOSAL_GENERATOR:
90
+ MIN_SIZE: 0
91
+ NAME: RPN
92
+ RESNETS:
93
+ DEFORM_MODULATED: false
94
+ DEFORM_NUM_GROUPS: 1
95
+ DEFORM_ON_PER_STAGE:
96
+ - false
97
+ - false
98
+ - false
99
+ - false
100
+ DEPTH: 101
101
+ NORM: FrozenBN
102
+ NUM_GROUPS: 32
103
+ OUT_FEATURES:
104
+ - res2
105
+ - res3
106
+ - res4
107
+ - res5
108
+ RES2_OUT_CHANNELS: 256
109
+ RES5_DILATION: 1
110
+ STEM_OUT_CHANNELS: 64
111
+ STRIDE_IN_1X1: false
112
+ WIDTH_PER_GROUP: 8
113
+ RETINANET:
114
+ BBOX_REG_LOSS_TYPE: smooth_l1
115
+ BBOX_REG_WEIGHTS: &id003
116
+ - 1.0
117
+ - 1.0
118
+ - 1.0
119
+ - 1.0
120
+ FOCAL_LOSS_ALPHA: 0.25
121
+ FOCAL_LOSS_GAMMA: 2.0
122
+ IN_FEATURES:
123
+ - p3
124
+ - p4
125
+ - p5
126
+ - p6
127
+ - p7
128
+ IOU_LABELS:
129
+ - 0
130
+ - -1
131
+ - 1
132
+ IOU_THRESHOLDS:
133
+ - 0.4
134
+ - 0.5
135
+ NMS_THRESH_TEST: 0.5
136
+ NORM: ''
137
+ NUM_CLASSES: 80
138
+ NUM_CONVS: 4
139
+ PRIOR_PROB: 0.01
140
+ SCORE_THRESH_TEST: 0.05
141
+ SMOOTH_L1_LOSS_BETA: 0.1
142
+ TOPK_CANDIDATES_TEST: 1000
143
+ ROI_BOX_CASCADE_HEAD:
144
+ BBOX_REG_WEIGHTS:
145
+ - &id002
146
+ - 10.0
147
+ - 10.0
148
+ - 5.0
149
+ - 5.0
150
+ - - 20.0
151
+ - 20.0
152
+ - 10.0
153
+ - 10.0
154
+ - - 30.0
155
+ - 30.0
156
+ - 15.0
157
+ - 15.0
158
+ IOUS:
159
+ - 0.5
160
+ - 0.6
161
+ - 0.7
162
+ ROI_BOX_HEAD:
163
+ BBOX_REG_LOSS_TYPE: smooth_l1
164
+ BBOX_REG_LOSS_WEIGHT: 1.0
165
+ BBOX_REG_WEIGHTS: *id002
166
+ CLS_AGNOSTIC_BBOX_REG: false
167
+ CONV_DIM: 256
168
+ FC_DIM: 1024
169
+ FED_LOSS_FREQ_WEIGHT_POWER: 0.5
170
+ FED_LOSS_NUM_CLASSES: 50
171
+ NAME: FastRCNNConvFCHead
172
+ NORM: ''
173
+ NUM_CONV: 0
174
+ NUM_FC: 2
175
+ POOLER_RESOLUTION: 7
176
+ POOLER_SAMPLING_RATIO: 0
177
+ POOLER_TYPE: ROIAlignV2
178
+ SMOOTH_L1_BETA: 0.0
179
+ TRAIN_ON_PRED_BOXES: false
180
+ USE_FED_LOSS: false
181
+ USE_SIGMOID_CE: false
182
+ ROI_HEADS:
183
+ BATCH_SIZE_PER_IMAGE: 512
184
+ IN_FEATURES:
185
+ - p2
186
+ - p3
187
+ - p4
188
+ - p5
189
+ IOU_LABELS:
190
+ - 0
191
+ - 1
192
+ IOU_THRESHOLDS:
193
+ - 0.5
194
+ NAME: StandardROIHeads
195
+ NMS_THRESH_TEST: 0.5
196
+ NUM_CLASSES: 2
197
+ POSITIVE_FRACTION: 0.25
198
+ PROPOSAL_APPEND_GT: true
199
+ SCORE_THRESH_TEST: 0.05
200
+ ROI_KEYPOINT_HEAD:
201
+ CONV_DIMS:
202
+ - 512
203
+ - 512
204
+ - 512
205
+ - 512
206
+ - 512
207
+ - 512
208
+ - 512
209
+ - 512
210
+ LOSS_WEIGHT: 1.0
211
+ MIN_KEYPOINTS_PER_IMAGE: 1
212
+ NAME: KRCNNConvDeconvUpsampleHead
213
+ NORMALIZE_LOSS_BY_VISIBLE_KEYPOINTS: true
214
+ NUM_KEYPOINTS: 17
215
+ POOLER_RESOLUTION: 14
216
+ POOLER_SAMPLING_RATIO: 0
217
+ POOLER_TYPE: ROIAlignV2
218
+ ROI_MASK_HEAD:
219
+ CLS_AGNOSTIC_MASK: false
220
+ CONV_DIM: 256
221
+ NAME: MaskRCNNConvUpsampleHead
222
+ NORM: ''
223
+ NUM_CONV: 4
224
+ POOLER_RESOLUTION: 14
225
+ POOLER_SAMPLING_RATIO: 0
226
+ POOLER_TYPE: ROIAlignV2
227
+ RPN:
228
+ BATCH_SIZE_PER_IMAGE: 256
229
+ BBOX_REG_LOSS_TYPE: smooth_l1
230
+ BBOX_REG_LOSS_WEIGHT: 1.0
231
+ BBOX_REG_WEIGHTS: *id003
232
+ BOUNDARY_THRESH: -1
233
+ CONV_DIMS:
234
+ - -1
235
+ HEAD_NAME: StandardRPNHead
236
+ IN_FEATURES:
237
+ - p2
238
+ - p3
239
+ - p4
240
+ - p5
241
+ - p6
242
+ IOU_LABELS:
243
+ - 0
244
+ - -1
245
+ - 1
246
+ IOU_THRESHOLDS:
247
+ - 0.3
248
+ - 0.7
249
+ LOSS_WEIGHT: 1.0
250
+ NMS_THRESH: 0.7
251
+ POSITIVE_FRACTION: 0.5
252
+ POST_NMS_TOPK_TEST: 1000
253
+ POST_NMS_TOPK_TRAIN: 1000
254
+ PRE_NMS_TOPK_TEST: 1000
255
+ PRE_NMS_TOPK_TRAIN: 2000
256
+ SMOOTH_L1_BETA: 0.0
257
+ SEM_SEG_HEAD:
258
+ COMMON_STRIDE: 4
259
+ CONVS_DIM: 128
260
+ IGNORE_VALUE: 255
261
+ IN_FEATURES:
262
+ - p2
263
+ - p3
264
+ - p4
265
+ - p5
266
+ LOSS_WEIGHT: 1.0
267
+ NAME: SemSegFPNHead
268
+ NORM: GN
269
+ NUM_CLASSES: 54
270
+ WEIGHTS: detectron2://ImageNetPretrained/FAIR/X-101-32x8d.pkl
271
+ OUTPUT_DIR: ./output
272
+ SEED: -1
273
+ SOLVER:
274
+ AMP:
275
+ ENABLED: false
276
+ BASE_LR: 0.02
277
+ BASE_LR_END: 0.0
278
+ BIAS_LR_FACTOR: 1.0
279
+ CHECKPOINT_PERIOD: 2500
280
+ CLIP_GRADIENTS:
281
+ CLIP_TYPE: value
282
+ CLIP_VALUE: 1.0
283
+ ENABLED: false
284
+ NORM_TYPE: 2.0
285
+ GAMMA: 0.1
286
+ IMS_PER_BATCH: 24
287
+ LR_SCHEDULER_NAME: WarmupMultiStepLR
288
+ MAX_ITER: 270000
289
+ MOMENTUM: 0.9
290
+ NESTEROV: false
291
+ NUM_DECAYS: 3
292
+ REFERENCE_WORLD_SIZE: 0
293
+ RESCALE_INTERVAL: false
294
+ STEPS:
295
+ - 210000
296
+ - 250000
297
+ WARMUP_FACTOR: 0.001
298
+ WARMUP_ITERS: 1000
299
+ WARMUP_METHOD: linear
300
+ WEIGHT_DECAY: 0.0001
301
+ WEIGHT_DECAY_BIAS: null
302
+ WEIGHT_DECAY_NORM: 0.0
303
+ TEST:
304
+ AUG:
305
+ ENABLED: false
306
+ FLIP: true
307
+ MAX_SIZE: 4000
308
+ MIN_SIZES:
309
+ - 400
310
+ - 500
311
+ - 600
312
+ - 700
313
+ - 800
314
+ - 900
315
+ - 1000
316
+ - 1100
317
+ - 1200
318
+ DETECTIONS_PER_IMAGE: 100
319
+ EVAL_PERIOD: 0
320
+ EXPECTED_RESULTS: []
321
+ KEYPOINT_OKS_SIGMAS: []
322
+ PRECISE_BN:
323
+ ENABLED: false
324
+ NUM_ITER: 200
325
+ VERSION: 2
326
+ VIS_PERIOD: 0
Detection_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a23214ba38a08bebb86eb6b6bc050af9dc8f8240ade151c19f84b01d804c06a
3
+ size 835237759
Multilingual_PP-OCRv3_det_infer/inference.pdiparams ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6119e639cade15873ac32eb4bee121b63c811c4d007d9f618baf680aef8b857
3
+ size 2377917
Multilingual_PP-OCRv3_det_infer/inference.pdiparams.info ADDED
Binary file (26.4 kB). View file
 
Multilingual_PP-OCRv3_det_infer/inference.pdmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c49f664c75549678deedcaff8d11f8f2b9f1303ef6c72deccdb98a5ea2104381
3
+ size 1441206
Segmentation_config.yaml ADDED
@@ -0,0 +1,326 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ CUDNN_BENCHMARK: false
2
+ DATALOADER:
3
+ ASPECT_RATIO_GROUPING: true
4
+ FILTER_EMPTY_ANNOTATIONS: true
5
+ NUM_WORKERS: 4
6
+ REPEAT_THRESHOLD: 0.0
7
+ SAMPLER_TRAIN: TrainingSampler
8
+ DATASETS:
9
+ PRECOMPUTED_PROPOSAL_TOPK_TEST: 1000
10
+ PRECOMPUTED_PROPOSAL_TOPK_TRAIN: 2000
11
+ PROPOSAL_FILES_TEST: []
12
+ PROPOSAL_FILES_TRAIN: []
13
+ TEST: &id001
14
+ - balloon
15
+ TRAIN: *id001
16
+ GLOBAL:
17
+ HACK: 1.0
18
+ INPUT:
19
+ CROP:
20
+ ENABLED: false
21
+ SIZE:
22
+ - 0.9
23
+ - 0.9
24
+ TYPE: relative_range
25
+ FORMAT: BGR
26
+ MASK_FORMAT: polygon
27
+ MAX_SIZE_TEST: 1333
28
+ MAX_SIZE_TRAIN: 1333
29
+ MIN_SIZE_TEST: 800
30
+ MIN_SIZE_TRAIN:
31
+ - 640
32
+ - 672
33
+ - 704
34
+ - 736
35
+ - 768
36
+ - 800
37
+ MIN_SIZE_TRAIN_SAMPLING: choice
38
+ RANDOM_FLIP: horizontal
39
+ MODEL:
40
+ ANCHOR_GENERATOR:
41
+ ANGLES:
42
+ - - -90
43
+ - 0
44
+ - 90
45
+ ASPECT_RATIOS:
46
+ - - 0.5
47
+ - 1.0
48
+ - 2.0
49
+ NAME: DefaultAnchorGenerator
50
+ OFFSET: 0.0
51
+ SIZES:
52
+ - - 32
53
+ - - 64
54
+ - - 128
55
+ - - 256
56
+ - - 512
57
+ BACKBONE:
58
+ FREEZE_AT: 2
59
+ NAME: build_resnet_fpn_backbone
60
+ DEVICE: cuda
61
+ FPN:
62
+ FUSE_TYPE: sum
63
+ IN_FEATURES:
64
+ - res2
65
+ - res3
66
+ - res4
67
+ - res5
68
+ NORM: ''
69
+ OUT_CHANNELS: 256
70
+ KEYPOINT_ON: false
71
+ LOAD_PROPOSALS: false
72
+ MASK_ON: true
73
+ META_ARCHITECTURE: GeneralizedRCNN
74
+ PANOPTIC_FPN:
75
+ COMBINE:
76
+ ENABLED: true
77
+ INSTANCES_CONFIDENCE_THRESH: 0.5
78
+ OVERLAP_THRESH: 0.5
79
+ STUFF_AREA_LIMIT: 4096
80
+ INSTANCE_LOSS_WEIGHT: 1.0
81
+ PIXEL_MEAN:
82
+ - 103.53
83
+ - 116.28
84
+ - 123.675
85
+ PIXEL_STD:
86
+ - 57.375
87
+ - 57.12
88
+ - 58.395
89
+ PROPOSAL_GENERATOR:
90
+ MIN_SIZE: 0
91
+ NAME: RPN
92
+ RESNETS:
93
+ DEFORM_MODULATED: false
94
+ DEFORM_NUM_GROUPS: 1
95
+ DEFORM_ON_PER_STAGE:
96
+ - false
97
+ - false
98
+ - false
99
+ - false
100
+ DEPTH: 101
101
+ NORM: FrozenBN
102
+ NUM_GROUPS: 32
103
+ OUT_FEATURES:
104
+ - res2
105
+ - res3
106
+ - res4
107
+ - res5
108
+ RES2_OUT_CHANNELS: 256
109
+ RES5_DILATION: 1
110
+ STEM_OUT_CHANNELS: 64
111
+ STRIDE_IN_1X1: false
112
+ WIDTH_PER_GROUP: 8
113
+ RETINANET:
114
+ BBOX_REG_LOSS_TYPE: smooth_l1
115
+ BBOX_REG_WEIGHTS: &id003
116
+ - 1.0
117
+ - 1.0
118
+ - 1.0
119
+ - 1.0
120
+ FOCAL_LOSS_ALPHA: 0.25
121
+ FOCAL_LOSS_GAMMA: 2.0
122
+ IN_FEATURES:
123
+ - p3
124
+ - p4
125
+ - p5
126
+ - p6
127
+ - p7
128
+ IOU_LABELS:
129
+ - 0
130
+ - -1
131
+ - 1
132
+ IOU_THRESHOLDS:
133
+ - 0.4
134
+ - 0.5
135
+ NMS_THRESH_TEST: 0.5
136
+ NORM: ''
137
+ NUM_CLASSES: 80
138
+ NUM_CONVS: 4
139
+ PRIOR_PROB: 0.01
140
+ SCORE_THRESH_TEST: 0.05
141
+ SMOOTH_L1_LOSS_BETA: 0.1
142
+ TOPK_CANDIDATES_TEST: 1000
143
+ ROI_BOX_CASCADE_HEAD:
144
+ BBOX_REG_WEIGHTS:
145
+ - &id002
146
+ - 10.0
147
+ - 10.0
148
+ - 5.0
149
+ - 5.0
150
+ - - 20.0
151
+ - 20.0
152
+ - 10.0
153
+ - 10.0
154
+ - - 30.0
155
+ - 30.0
156
+ - 15.0
157
+ - 15.0
158
+ IOUS:
159
+ - 0.5
160
+ - 0.6
161
+ - 0.7
162
+ ROI_BOX_HEAD:
163
+ BBOX_REG_LOSS_TYPE: smooth_l1
164
+ BBOX_REG_LOSS_WEIGHT: 1.0
165
+ BBOX_REG_WEIGHTS: *id002
166
+ CLS_AGNOSTIC_BBOX_REG: false
167
+ CONV_DIM: 256
168
+ FC_DIM: 1024
169
+ FED_LOSS_FREQ_WEIGHT_POWER: 0.5
170
+ FED_LOSS_NUM_CLASSES: 50
171
+ NAME: FastRCNNConvFCHead
172
+ NORM: ''
173
+ NUM_CONV: 0
174
+ NUM_FC: 2
175
+ POOLER_RESOLUTION: 7
176
+ POOLER_SAMPLING_RATIO: 0
177
+ POOLER_TYPE: ROIAlignV2
178
+ SMOOTH_L1_BETA: 0.0
179
+ TRAIN_ON_PRED_BOXES: false
180
+ USE_FED_LOSS: false
181
+ USE_SIGMOID_CE: false
182
+ ROI_HEADS:
183
+ BATCH_SIZE_PER_IMAGE: 512
184
+ IN_FEATURES:
185
+ - p2
186
+ - p3
187
+ - p4
188
+ - p5
189
+ IOU_LABELS:
190
+ - 0
191
+ - 1
192
+ IOU_THRESHOLDS:
193
+ - 0.5
194
+ NAME: StandardROIHeads
195
+ NMS_THRESH_TEST: 0.5
196
+ NUM_CLASSES: 1
197
+ POSITIVE_FRACTION: 0.25
198
+ PROPOSAL_APPEND_GT: true
199
+ SCORE_THRESH_TEST: 0.05
200
+ ROI_KEYPOINT_HEAD:
201
+ CONV_DIMS:
202
+ - 512
203
+ - 512
204
+ - 512
205
+ - 512
206
+ - 512
207
+ - 512
208
+ - 512
209
+ - 512
210
+ LOSS_WEIGHT: 1.0
211
+ MIN_KEYPOINTS_PER_IMAGE: 1
212
+ NAME: KRCNNConvDeconvUpsampleHead
213
+ NORMALIZE_LOSS_BY_VISIBLE_KEYPOINTS: true
214
+ NUM_KEYPOINTS: 17
215
+ POOLER_RESOLUTION: 14
216
+ POOLER_SAMPLING_RATIO: 0
217
+ POOLER_TYPE: ROIAlignV2
218
+ ROI_MASK_HEAD:
219
+ CLS_AGNOSTIC_MASK: false
220
+ CONV_DIM: 256
221
+ NAME: MaskRCNNConvUpsampleHead
222
+ NORM: ''
223
+ NUM_CONV: 4
224
+ POOLER_RESOLUTION: 14
225
+ POOLER_SAMPLING_RATIO: 0
226
+ POOLER_TYPE: ROIAlignV2
227
+ RPN:
228
+ BATCH_SIZE_PER_IMAGE: 256
229
+ BBOX_REG_LOSS_TYPE: smooth_l1
230
+ BBOX_REG_LOSS_WEIGHT: 1.0
231
+ BBOX_REG_WEIGHTS: *id003
232
+ BOUNDARY_THRESH: -1
233
+ CONV_DIMS:
234
+ - -1
235
+ HEAD_NAME: StandardRPNHead
236
+ IN_FEATURES:
237
+ - p2
238
+ - p3
239
+ - p4
240
+ - p5
241
+ - p6
242
+ IOU_LABELS:
243
+ - 0
244
+ - -1
245
+ - 1
246
+ IOU_THRESHOLDS:
247
+ - 0.3
248
+ - 0.7
249
+ LOSS_WEIGHT: 1.0
250
+ NMS_THRESH: 0.7
251
+ POSITIVE_FRACTION: 0.5
252
+ POST_NMS_TOPK_TEST: 1000
253
+ POST_NMS_TOPK_TRAIN: 1000
254
+ PRE_NMS_TOPK_TEST: 1000
255
+ PRE_NMS_TOPK_TRAIN: 2000
256
+ SMOOTH_L1_BETA: 0.0
257
+ SEM_SEG_HEAD:
258
+ COMMON_STRIDE: 4
259
+ CONVS_DIM: 128
260
+ IGNORE_VALUE: 255
261
+ IN_FEATURES:
262
+ - p2
263
+ - p3
264
+ - p4
265
+ - p5
266
+ LOSS_WEIGHT: 1.0
267
+ NAME: SemSegFPNHead
268
+ NORM: GN
269
+ NUM_CLASSES: 54
270
+ WEIGHTS: detectron2://ImageNetPretrained/FAIR/X-101-32x8d.pkl
271
+ OUTPUT_DIR: ./output
272
+ SEED: -1
273
+ SOLVER:
274
+ AMP:
275
+ ENABLED: false
276
+ BASE_LR: 0.02
277
+ BASE_LR_END: 0.0
278
+ BIAS_LR_FACTOR: 1.0
279
+ CHECKPOINT_PERIOD: 2500
280
+ CLIP_GRADIENTS:
281
+ CLIP_TYPE: value
282
+ CLIP_VALUE: 1.0
283
+ ENABLED: false
284
+ NORM_TYPE: 2.0
285
+ GAMMA: 0.1
286
+ IMS_PER_BATCH: 24
287
+ LR_SCHEDULER_NAME: WarmupMultiStepLR
288
+ MAX_ITER: 270000
289
+ MOMENTUM: 0.9
290
+ NESTEROV: false
291
+ NUM_DECAYS: 3
292
+ REFERENCE_WORLD_SIZE: 0
293
+ RESCALE_INTERVAL: false
294
+ STEPS:
295
+ - 210000
296
+ - 250000
297
+ WARMUP_FACTOR: 0.001
298
+ WARMUP_ITERS: 1000
299
+ WARMUP_METHOD: linear
300
+ WEIGHT_DECAY: 0.0001
301
+ WEIGHT_DECAY_BIAS: null
302
+ WEIGHT_DECAY_NORM: 0.0
303
+ TEST:
304
+ AUG:
305
+ ENABLED: false
306
+ FLIP: true
307
+ MAX_SIZE: 4000
308
+ MIN_SIZES:
309
+ - 400
310
+ - 500
311
+ - 600
312
+ - 700
313
+ - 800
314
+ - 900
315
+ - 1000
316
+ - 1100
317
+ - 1200
318
+ DETECTIONS_PER_IMAGE: 100
319
+ EVAL_PERIOD: 0
320
+ EXPECTED_RESULTS: []
321
+ KEYPOINT_OKS_SIGMAS: []
322
+ PRECISE_BN:
323
+ ENABLED: false
324
+ NUM_ITER: 200
325
+ VERSION: 2
326
+ VIS_PERIOD: 0
Segmentation_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e72a9006b291a08f8c162a325cbdbddeecb6e708f9e4adb3d1702a11c9ba169d
3
+ size 856189263
ch_ppocr_mobile_v2.0_cls_infer/inference.pdiparams ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1efda1b80e174b4fcb168a035ac96c1af4938892bd86a55f300a6027105d08c
3
+ size 539978
ch_ppocr_mobile_v2.0_cls_infer/inference.pdiparams.info ADDED
Binary file (18.5 kB). View file
 
ch_ppocr_mobile_v2.0_cls_infer/inference.pdmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c4337ec61722a20b1dca2e5bfaffc313c0592bc89ad6e0d45168224186f6683
3
+ size 1624487
korean_PP-OCRv4_rec_infer/inference.pdiparams ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea4f4762582336e9b85653b016c5b1091223c947fafd282161fa3145ecb72d1d
3
+ size 23920621
korean_PP-OCRv4_rec_infer/inference.pdiparams.info ADDED
Binary file (95.7 kB). View file
 
korean_PP-OCRv4_rec_infer/inference.pdmodel ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:992eed58af98ed6125065027e52fbc69b570e6c2e74610ec240e8a2436151ada
3
+ size 353760