瀏覽代碼

feat: 添加可选的表格分类器参数以支持有线/无线表格的区分

zhch158_admin 3 天之前
父節點
當前提交
768858cbff
共有 1 個文件被更改,包括 3 次插入和 0 次删除
  1. +3 -0
      ocr_tools/universal_doc_parser/core/element_processors.py

+ 3 - 0
ocr_tools/universal_doc_parser/core/element_processors.py

@@ -44,6 +44,7 @@ class ElementProcessors:
         vl_recognizer: Any,
         table_cell_matcher: Optional[Any] = None,
         wired_table_recognizer: Optional[Any] = None,
+        table_classifier: Optional[Any] = None,
     ):
         """
         初始化元素处理器
@@ -54,12 +55,14 @@ class ElementProcessors:
             vl_recognizer: VL识别器(表格、公式)
             table_cell_matcher: 表格单元格匹配器
             wired_table_recognizer: 有线表格识别器(可选)
+            table_classifier: 表格分类器(区分有线/无线表格,可选)
         """
         self.preprocessor = preprocessor
         self.ocr_recognizer = ocr_recognizer
         self.vl_recognizer = vl_recognizer
         self.table_cell_matcher = table_cell_matcher
         self.wired_table_recognizer = wired_table_recognizer
+        self.table_classifier = table_classifier
     
     def _convert_ocr_details_to_absolute(
         self,