Prechádzať zdrojové kódy

feat(MinerUWiredTableRecognizer): 更新单元格提取方法,简化OCR边缘补偿参数传递

zhch158_admin pred 2 týždňami
rodič
commit
dc9ae52f78

+ 2 - 5
ocr_tools/universal_doc_parser/models/adapters/mineru_wired_table.py

@@ -379,7 +379,7 @@ class MinerUWiredTableRecognizer:
             # Step 2: 使用连通域法提取单元格 (替换了原来的投影法)
             debug_prefix = f"{dbg.prefix}_grid" if dbg.prefix else "grid"
             
-            # 传入原图的实际尺寸、裁剪padding和OCR结果
+            # 传入原图的实际尺寸和裁剪padding
             bboxes = self.grid_recovery.compute_cells_from_lines(
                 hpred_up, 
                 vpred_up, 
@@ -389,14 +389,11 @@ class MinerUWiredTableRecognizer:
                 debug_dir=debug_dir,
                 debug_prefix=debug_prefix,
                 crop_padding=10,  # 传递 padding 值(与 element_processors.py 中的 crop_padding 保持一致)
-                ocr_bboxes=ocr_boxes,  # 🆕 传递OCR结果用于边缘补偿
-                enable_ocr_edge_compensation=True  # 🆕 启用OCR边缘补偿
             )
-            # bboxes = self.grid_recovery.compute_cells_from_lines(hpred_up, vpred_up, upscale) # Original call
             if not bboxes:
                 raise RuntimeError("未能提取出单元格")
 
-            # Step 2.3: 🆕 多源单元格融合(UNet + RT-DETR ), ocr边缘补偿在前面compute_cells_from_lines完成
+            # Step 2.3: 🆕 多源单元格融合(UNet + RT-DETR + OCR边缘补偿)
             fusion_stats = {}
             if self.cell_fusion_engine:
                 try: