| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102 |
- pipeline_name: layout_parsing
- use_doc_preprocessor: True
- use_seal_recognition: True
- use_table_recognition: True
- use_formula_recognition: False
- SubModules:
- LayoutDetection:
- module_name: layout_detection
- model_name: RT-DETR-H_layout_17cls
- model_dir: null
- SubPipelines:
- DocPreprocessor:
- pipeline_name: doc_preprocessor
- use_doc_orientation_classify: True
- use_doc_unwarping: True
- SubModules:
- DocOrientationClassify:
- module_name: doc_text_orientation
- model_name: PP-LCNet_x1_0_doc_ori
- model_dir: null
- DocUnwarping:
- module_name: image_unwarping
- model_name: UVDoc
- model_dir: null
- GeneralOCR:
- pipeline_name: OCR
- text_type: general
- use_doc_preprocessor: False
- use_textline_orientation: False
- SubModules:
- TextDetection:
- module_name: text_detection
- model_name: PP-OCRv5_server_det
- model_dir: null
- limit_side_len: 960
- limit_type: max
- max_side_limit: 4000
- thresh: 0.3
- box_thresh: 0.6
- unclip_ratio: 1.5
-
- TextRecognition:
- module_name: text_recognition
- model_name: PP-OCRv5_server_rec
- model_dir: null
- batch_size: 6
- score_thresh: 0
- TableRecognition:
- pipeline_name: table_recognition
- use_layout_detection: False
- use_doc_preprocessor: False
- use_ocr_model: False
- SubModules:
- TableStructureRecognition:
- module_name: table_structure_recognition
- model_name: SLANet_plus
- model_dir: null
- SealRecognition:
- pipeline_name: seal_recognition
- use_layout_detection: False
- use_doc_preprocessor: False
- SubPipelines:
- SealOCR:
- pipeline_name: OCR
- text_type: seal
- use_doc_preprocessor: False
- use_textline_orientation: False
- SubModules:
- TextDetection:
- module_name: seal_text_detection
- model_name: PP-OCRv4_server_seal_det
- model_dir: null
- limit_side_len: 736
- limit_type: min
- max_side_limit: 4000
- thresh: 0.2
- box_thresh: 0.6
- unclip_ratio: 0.5
- TextRecognition:
- module_name: text_recognition
- model_name: PP-OCRv4_server_rec
- model_dir: null
- batch_size: 1
- score_thresh: 0
-
- FormulaRecognition:
- pipeline_name: formula_recognition
- use_layout_detection: False
- use_doc_preprocessor: False
- SubModules:
- FormulaRecognition:
- module_name: formula_recognition
- model_name: PP-FormulaNet-L
- model_dir: null
- batch_size: 5
|