|
|
@@ -1,127 +0,0 @@
|
|
|
-
|
|
|
-pipeline_name: table_recognition_v2
|
|
|
-
|
|
|
-use_doc_preprocessor: False
|
|
|
-use_layout_detection: True
|
|
|
-use_ocr_model: True
|
|
|
-
|
|
|
-SubModules:
|
|
|
- LayoutDetection:
|
|
|
- module_name: layout_detection
|
|
|
- model_name: PP-DocLayout_plus-L
|
|
|
- model_dir: null
|
|
|
- batch_size: 1
|
|
|
- threshold:
|
|
|
- 0: 0.3 # paragraph_title
|
|
|
- 1: 0.5 # image
|
|
|
- 2: 0.4 # text
|
|
|
- 3: 0.5 # number
|
|
|
- 4: 0.5 # abstract
|
|
|
- 5: 0.5 # content
|
|
|
- 6: 0.5 # figure_table_chart_title
|
|
|
- 7: 0.3 # formula
|
|
|
- 8: 0.5 # table
|
|
|
- 9: 0.5 # reference
|
|
|
- 10: 0.5 # doc_title
|
|
|
- 11: 0.5 # footnote
|
|
|
- 12: 0.5 # header
|
|
|
- 13: 0.5 # algorithm
|
|
|
- 14: 0.5 # footer
|
|
|
- 15: 0.45 # seal
|
|
|
- 16: 0.5 # chart
|
|
|
- 17: 0.5 # formula_number
|
|
|
- 18: 0.5 # aside_text
|
|
|
- 19: 0.5 # reference_content
|
|
|
- layout_nms: True
|
|
|
- layout_unclip_ratio: [1.0, 1.0]
|
|
|
- layout_merge_bboxes_mode:
|
|
|
- 0: "large" # paragraph_title
|
|
|
- 1: "large" # image
|
|
|
- 2: "union" # text
|
|
|
- 3: "union" # number
|
|
|
- 4: "union" # abstract
|
|
|
- 5: "union" # content
|
|
|
- 6: "union" # figure_table_chart_title
|
|
|
- 7: "large" # formula
|
|
|
- 8: "union" # table
|
|
|
- 9: "union" # reference
|
|
|
- 10: "union" # doc_title
|
|
|
- 11: "union" # footnote
|
|
|
- 12: "union" # header
|
|
|
- 13: "union" # algorithm
|
|
|
- 14: "union" # footer
|
|
|
- 15: "union" # seal
|
|
|
- 16: "large" # chart
|
|
|
- 17: "union" # formula_number
|
|
|
- 18: "union" # aside_text
|
|
|
- 19: "union" # reference_content
|
|
|
-
|
|
|
- TableOrientationClassify:
|
|
|
- module_name: doc_text_orientation
|
|
|
- model_name: PP-LCNet_x1_0_doc_ori
|
|
|
- model_dir: null
|
|
|
-
|
|
|
- TableClassification:
|
|
|
- module_name: table_classification
|
|
|
- model_name: PP-LCNet_x1_0_table_cls
|
|
|
- model_dir: null
|
|
|
-
|
|
|
- WiredTableStructureRecognition:
|
|
|
- module_name: table_structure_recognition
|
|
|
- model_name: SLANeXt_wired
|
|
|
- model_dir: null
|
|
|
-
|
|
|
- WirelessTableStructureRecognition:
|
|
|
- module_name: table_structure_recognition
|
|
|
- model_name: SLANeXt_wireless
|
|
|
- model_dir: null
|
|
|
-
|
|
|
- WiredTableCellsDetection:
|
|
|
- module_name: table_cells_detection
|
|
|
- model_name: RT-DETR-L_wired_table_cell_det
|
|
|
- model_dir: null
|
|
|
-
|
|
|
- WirelessTableCellsDetection:
|
|
|
- module_name: table_cells_detection
|
|
|
- model_name: RT-DETR-L_wireless_table_cell_det
|
|
|
- model_dir: null
|
|
|
-
|
|
|
-SubPipelines:
|
|
|
- DocPreprocessor:
|
|
|
- pipeline_name: doc_preprocessor
|
|
|
- use_doc_orientation_classify: False
|
|
|
- use_doc_unwarping: False
|
|
|
- SubModules:
|
|
|
- DocOrientationClassify:
|
|
|
- module_name: doc_text_orientation
|
|
|
- model_name: PP-LCNet_x1_0_doc_ori
|
|
|
- model_dir: null
|
|
|
-
|
|
|
- DocUnwarping:
|
|
|
- module_name: image_unwarping
|
|
|
- model_name: UVDoc
|
|
|
- model_dir: null
|
|
|
-
|
|
|
- GeneralOCR:
|
|
|
- pipeline_name: OCR
|
|
|
- text_type: general
|
|
|
- use_doc_preprocessor: False
|
|
|
- use_textline_orientation: False
|
|
|
- SubModules:
|
|
|
- TextDetection:
|
|
|
- module_name: text_detection
|
|
|
- model_name: PP-OCRv5_server_det
|
|
|
- model_dir: null
|
|
|
- limit_side_len: 1600
|
|
|
- limit_type: max
|
|
|
- max_side_limit: 4000
|
|
|
- thresh: 0.3
|
|
|
- box_thresh: 0.4
|
|
|
- unclip_ratio: 1.5
|
|
|
-
|
|
|
- TextRecognition:
|
|
|
- module_name: text_recognition
|
|
|
- model_name: PP-OCRv5_server_rec
|
|
|
- model_dir: null
|
|
|
- batch_size: 1
|
|
|
- score_thresh: 0
|