Explorar o código

feat: 添加BBoxExtractor以计算OCR文本的倾斜角度并记录信息

zhch158_admin hai 5 días
pai
achega
05d07bb9ef
Modificouse 1 ficheiro con 4 adicións e 0 borrados
  1. 4 0
      ocr_tools/universal_doc_parser/core/pipeline_manager_v2.py

+ 4 - 0
ocr_tools/universal_doc_parser/core/pipeline_manager_v2.py

@@ -57,6 +57,7 @@ except ImportError:
     TableCellMatcher = None
     TextMatcher = None
 
+from ocr_utils.bbox_utils import BBoxExtractor
 
 class EnhancedDocPipeline:
     """增强版文档处理流水线"""
@@ -350,6 +351,9 @@ class EnhancedDocPipeline:
             logger.info(f"📝 Page {page_idx}: OCR detected {len(all_ocr_spans)} text spans")
         except Exception as e:
             logger.warning(f"⚠️ Full-page OCR failed: {e}")
+
+        skew_angle = BBoxExtractor.calculate_skew_angle(all_ocr_spans)
+        logger.info(f"📊 Wired table skew angle: {skew_angle:.3f}°")
         
         # 4. 将 OCR spans 匹配到 layout blocks
         matched_spans = SpanMatcher.match_spans_to_blocks(