|
|
@@ -44,6 +44,7 @@ class ElementProcessors:
|
|
|
vl_recognizer: Any,
|
|
|
table_cell_matcher: Optional[Any] = None,
|
|
|
wired_table_recognizer: Optional[Any] = None,
|
|
|
+ table_classifier: Optional[Any] = None,
|
|
|
):
|
|
|
"""
|
|
|
初始化元素处理器
|
|
|
@@ -54,12 +55,14 @@ class ElementProcessors:
|
|
|
vl_recognizer: VL识别器(表格、公式)
|
|
|
table_cell_matcher: 表格单元格匹配器
|
|
|
wired_table_recognizer: 有线表格识别器(可选)
|
|
|
+ table_classifier: 表格分类器(区分有线/无线表格,可选)
|
|
|
"""
|
|
|
self.preprocessor = preprocessor
|
|
|
self.ocr_recognizer = ocr_recognizer
|
|
|
self.vl_recognizer = vl_recognizer
|
|
|
self.table_cell_matcher = table_cell_matcher
|
|
|
self.wired_table_recognizer = wired_table_recognizer
|
|
|
+ self.table_classifier = table_classifier
|
|
|
|
|
|
def _convert_ocr_details_to_absolute(
|
|
|
self,
|