# pp-stv3.yaml — PP-StructureV3 pipeline configuration.
# Added in "first commit" as a new 227-line file.
# Top-level settings of the PP-StructureV3 pipeline.
pipeline_name: PP-StructureV3

batch_size: 8

# Feature switches (all enabled in this configuration).
use_doc_preprocessor: true
use_seal_recognition: true
use_table_recognition: true
use_formula_recognition: true
use_chart_recognition: true
use_region_detection: true

# Serving-related options.
# NOTE(review): nesting was reconstructed from a flattened copy of this file;
# confirm that `extra` belongs under `Serving`.
Serving:
  extra:
    # null leaves the value unset here; presumably the consumer then applies
    # its own default or no limit — TODO confirm.
    max_num_input_imgs: null

# Modules configured directly on the top-level pipeline.
# NOTE(review): nesting was reconstructed from a flattened copy of this file;
# verify the hierarchy against the upstream PP-StructureV3 configuration.
SubModules:
  LayoutDetection:
    module_name: layout_detection
    model_name: PP-DocLayout_plus-L
    model_dir: null
    batch_size: 8
    # Per-class threshold, keyed by class id; the trailing comment on each
    # entry names the class.
    threshold:
      0: 0.3  # paragraph_title
      1: 0.5  # image
      2: 0.4  # text
      3: 0.5  # number
      4: 0.5  # abstract
      5: 0.5  # content
      6: 0.5  # figure_table_chart_title
      7: 0.3  # formula
      8: 0.5  # table
      9: 0.5  # reference
      10: 0.5  # doc_title
      11: 0.5  # footnote
      12: 0.5  # header
      13: 0.5  # algorithm
      14: 0.5  # footer
      15: 0.45  # seal
      16: 0.5  # chart
      17: 0.5  # formula_number
      18: 0.5  # aside_text
      19: 0.5  # reference_content
    layout_nms: true
    layout_unclip_ratio: [1.0, 1.0]
    # Per-class box-merge mode, keyed by the same class ids as `threshold`.
    layout_merge_bboxes_mode:
      0: "large"  # paragraph_title
      1: "large"  # image
      2: "union"  # text
      3: "union"  # number
      4: "union"  # abstract
      5: "union"  # content
      6: "union"  # figure_table_chart_title
      7: "large"  # formula
      8: "union"  # table
      9: "union"  # reference
      10: "union"  # doc_title
      11: "union"  # footnote
      12: "union"  # header
      13: "union"  # algorithm
      14: "union"  # footer
      15: "union"  # seal
      16: "large"  # chart
      17: "union"  # formula_number
      18: "union"  # aside_text
      19: "union"  # reference_content
  ChartRecognition:
    module_name: chart_recognition
    model_name: PP-Chart2Table
    model_dir: null
    batch_size: 1
  # Uses the same module_name as LayoutDetection but a different model, and a
  # single merge mode instead of a per-class map.
  RegionDetection:
    module_name: layout_detection
    model_name: PP-DocBlockLayout
    model_dir: null
    layout_nms: true
    layout_merge_bboxes_mode: "small"

# Nested pipelines, each with its own switches and SubModules/SubPipelines.
# NOTE(review): nesting was reconstructed from a flattened copy of this file;
# verify the hierarchy against the upstream PP-StructureV3 configuration.
SubPipelines:
  DocPreprocessor:
    pipeline_name: doc_preprocessor
    batch_size: 8
    use_doc_orientation_classify: true
    use_doc_unwarping: true
    SubModules:
      DocOrientationClassify:
        module_name: doc_text_orientation
        model_name: PP-LCNet_x1_0_doc_ori
        model_dir: null
        batch_size: 8
      DocUnwarping:
        module_name: image_unwarping
        model_name: UVDoc
        model_dir: null

  GeneralOCR:
    pipeline_name: OCR
    batch_size: 8
    text_type: general
    use_doc_preprocessor: false
    use_textline_orientation: true
    SubModules:
      TextDetection:
        module_name: text_detection
        model_name: PP-OCRv5_server_det
        model_dir: null
        limit_side_len: 736
        limit_type: min
        max_side_limit: 4000
        thresh: 0.3
        box_thresh: 0.6
        unclip_ratio: 1.5
      TextLineOrientation:
        module_name: textline_orientation
        model_name: PP-LCNet_x1_0_textline_ori
        model_dir: null
        batch_size: 8
      TextRecognition:
        module_name: text_recognition
        model_name: PP-OCRv5_server_rec
        model_dir: null
        batch_size: 8
        score_thresh: 0.0

  TableRecognition:
    pipeline_name: table_recognition_v2
    use_layout_detection: false
    use_doc_preprocessor: false
    use_ocr_model: false
    SubModules:
      TableClassification:
        module_name: table_classification
        model_name: PP-LCNet_x1_0_table_cls
        model_dir: null

      WiredTableStructureRecognition:
        module_name: table_structure_recognition
        model_name: SLANeXt_wired
        model_dir: null

      WirelessTableStructureRecognition:
        module_name: table_structure_recognition
        model_name: SLANet_plus
        model_dir: null

      WiredTableCellsDetection:
        module_name: table_cells_detection
        model_name: RT-DETR-L_wired_table_cell_det
        model_dir: null

      WirelessTableCellsDetection:
        module_name: table_cells_detection
        model_name: RT-DETR-L_wireless_table_cell_det
        model_dir: null

      TableOrientationClassify:
        module_name: doc_text_orientation
        model_name: PP-LCNet_x1_0_doc_ori
        model_dir: null
    SubPipelines:
      # Same models as the GeneralOCR pipeline above, but with no pipeline-level
      # batch_size and a TextDetection box_thresh of 0.4 instead of 0.6.
      GeneralOCR:
        pipeline_name: OCR
        text_type: general
        use_doc_preprocessor: false
        use_textline_orientation: true
        SubModules:
          TextDetection:
            module_name: text_detection
            model_name: PP-OCRv5_server_det
            model_dir: null
            limit_side_len: 736
            limit_type: min
            max_side_limit: 4000
            thresh: 0.3
            box_thresh: 0.4
            unclip_ratio: 1.5
          TextLineOrientation:
            module_name: textline_orientation
            model_name: PP-LCNet_x1_0_textline_ori
            model_dir: null
            batch_size: 8
          TextRecognition:
            module_name: text_recognition
            model_name: PP-OCRv5_server_rec
            model_dir: null
            batch_size: 8
            score_thresh: 0.0

  SealRecognition:
    pipeline_name: seal_recognition
    batch_size: 8
    use_layout_detection: false
    use_doc_preprocessor: false
    SubPipelines:
      SealOCR:
        pipeline_name: OCR
        batch_size: 8
        text_type: seal
        use_doc_preprocessor: false
        use_textline_orientation: false
        SubModules:
          TextDetection:
            module_name: seal_text_detection
            model_name: PP-OCRv4_server_seal_det
            model_dir: null
            limit_side_len: 736
            limit_type: min
            max_side_limit: 4000
            thresh: 0.2
            box_thresh: 0.6
            unclip_ratio: 0.5
          TextRecognition:
            module_name: text_recognition
            model_name: PP-OCRv5_server_rec
            model_dir: null
            batch_size: 8
            # Written as integer 0 here; the other TextRecognition entries
            # use 0.0.
            score_thresh: 0

  FormulaRecognition:
    pipeline_name: formula_recognition
    batch_size: 8
    use_layout_detection: false
    use_doc_preprocessor: false
    SubModules:
      FormulaRecognition:
        module_name: formula_recognition
        model_name: PP-FormulaNet_plus-L
        model_dir: null
        batch_size: 8
# (web page residue, not part of the configuration)
# Reference in New Issue
# Block a user