Luis J Camargo committed on
Commit
b7745a8
·
1 Parent(s): cec97f0

feat: Add default configuration for the PaddleOCR-VL-1.5 pipeline.

Browse files
Files changed (1) hide show
  1. default.yaml +85 -0
default.yaml ADDED
@@ -0,0 +1,85 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+ pipeline_name: PaddleOCR-VL-1.5
3
+
4
+ batch_size: 64
5
+
6
+ use_queues: True
7
+
8
+ use_doc_preprocessor: False
9
+ use_layout_detection: True
10
+ use_chart_recognition: False
11
+ use_seal_recognition: False
12
+ format_block_content: False
13
+ merge_layout_blocks: True
14
+ markdown_ignore_labels:
15
+ - number
16
+ - footnote
17
+ - header
18
+ - header_image
19
+ - footer
20
+ - footer_image
21
+ - aside_text
22
+
23
+ SubModules:
24
+ LayoutDetection:
25
+ module_name: layout_detection
26
+ model_name: PP-DocLayoutV3
27
+ model_dir: null
28
+ batch_size: 8
29
+ threshold: 0.3
30
+ layout_nms: True
31
+ layout_unclip_ratio: [1.0, 1.0]
32
+ layout_merge_bboxes_mode:
33
+ 0: "union" # abstract
34
+ 1: "union" # algorithm
35
+ 2: "union" # aside_text
36
+ 3: "large" # chart
37
+ 4: "union" # content
38
+ 5: "large" # display_formula
39
+ 6: "large" # doc_title
40
+ 7: "union" # figure_title
41
+ 8: "union" # footer
42
+ 9: "union" # footer_image
43
+ 10: "union" # footnote
44
+ 11: "union" # formula_number
45
+ 12: "union" # header
46
+ 13: "union" # header_image
47
+ 14: "union" # image
48
+ 15: "large" # inline_formula
49
+ 16: "union" # number
50
+ 17: "large" # paragraph_title
51
+ 18: "union" # reference
52
+ 19: "union" # reference_content
53
+ 20: "union" # seal
54
+ 21: "union" # table
55
+ 22: "union" # text
56
+ 23: "union" # vertical_text
57
+ 24: "union" # vision_footnote
58
+ VLRecognition:
59
+ module_name: vl_recognition
60
+ model_name: PaddleOCR-VL-1.5-0.9B
61
+ model_dir: null
62
+ batch_size: 4096
63
+ genai_config:
64
+ backend: native
65
+
66
+ SubPipelines:
67
+ DocPreprocessor:
68
+ pipeline_name: doc_preprocessor
69
+ batch_size: 8
70
+ use_doc_orientation_classify: True
71
+ use_doc_unwarping: True
72
+ SubModules:
73
+ DocOrientationClassify:
74
+ module_name: doc_text_orientation
75
+ model_name: PP-LCNet_x1_0_doc_ori
76
+ model_dir: null
77
+ batch_size: 8
78
+ DocUnwarping:
79
+ module_name: image_unwarping
80
+ model_name: UVDoc
81
+ model_dir: null
82
+
83
+ Serving:
84
+ extra:
85
+ max_num_input_imgs: null