hai 2 semanas · 4c56f9c64a
--- a/zhch/universal_doc_parser/tests/test_layout_detector.py
+++ b/zhch/universal_doc_parser/tests/test_layout_detector.py
@@ -0,0 +1,128 @@
 
				+"""
			
 
				+布局检测器测试脚本
			
 
				+"""
			
 
				+
			
 
				+import sys
			
 
				+from pathlib import Path
			
 
				+import cv2
			
 
				+import random
			
 
				+
			
 
				# Put the project root (the directory above this tests/ folder) on sys.path
				# so that the `models` package can be imported. The path is resolved first:
				# a relative __file__ could otherwise make parents[1] fail or leave a
				# relative entry in sys.path that breaks after a chdir.
				project_root = Path(__file__).resolve().parents[1]
				sys.path.insert(0, str(project_root))
			
 
				+
			
 
				+from models.adapters import PaddleLayoutDetector
			
 
				+
			
 
				+
			
 
				def _draw_detections(img, results):
				    """Return a copy of *img* with one labelled box drawn per detection.

				    Each entry of *results* is read through its 'bbox', 'category' and
				    'confidence' keys. Every category gets one random colour, chosen the
				    first time that category is encountered.
				    """
				    font = cv2.FONT_HERSHEY_SIMPLEX
				    font_scale = 0.5
				    text_thickness = 1

				    category_colors = {}
				    vis_img = img.copy()

				    for res in results:
				        cat = res['category']
				        if cat not in category_colors:
				            category_colors[cat] = (
				                random.randint(50, 255),
				                random.randint(50, 255),
				                random.randint(50, 255),
				            )
				        color = category_colors[cat]

				        # OpenCV drawing calls require integer pixel coordinates; cast
				        # defensively in case the detector returns floats (TODO confirm
				        # the bbox element type against the adapter).
				        x1, y1, x2, y2 = (int(v) for v in res['bbox'])

				        # Bounding box outline.
				        cv2.rectangle(vis_img, (x1, y1), (x2, y2), color, 2)

				        # Label: filled background strip above the box, then white text.
				        label = f"{cat} {res['confidence']:.2f}"
				        label_size, _ = cv2.getTextSize(label, font, font_scale, text_thickness)
				        cv2.rectangle(
				            vis_img,
				            (x1, y1 - label_size[1] - 4),
				            (x1 + label_size[0], y1),
				            color,
				            -1,
				        )
				        cv2.putText(
				            vis_img,
				            label,
				            (x1, y1 - 2),
				            font,
				            font_scale,
				            (255, 255, 255),
				            text_thickness,
				        )

				    return vis_img


				def test_layout_detector():
				    """Run the Paddle layout detector on one sample page and report results.

				    Steps: build and initialize the detector, load the sample image, run
				    detection, print every region and a per-category count, and write an
				    annotated copy of the image to ``output/`` next to this file.

				    The model and image paths are machine-specific absolute paths. If the
				    image cannot be read, a message is printed and the function returns
				    early without raising. The detector is always cleaned up once it has
				    been initialized, including on early return or error.
				    """
				    from collections import Counter

				    # Test configuration.
				    config = {
				        'model_dir': '/Users/zhch158/workspace/repository.git/PaddleX/zhch/unified_pytorch_models/Layout/RT-DETR-H_layout_17cls.onnx',
				        'device': 'cpu',
				        'conf': 0.25
				    }

				    # Initialize the detector.
				    print("🔧 Initializing detector...")
				    detector = PaddleLayoutDetector(config)
				    detector.initialize()

				    try:
				        # Load the test image.
				        img_path = "/Users/zhch158/workspace/data/流水分析/B用户_扫描流水/PaddleOCR_VL_Results/B用户_扫描流水/B用户_扫描流水_page_001.png"
				        print(f"\n📖 Loading image: {img_path}")
				        img = cv2.imread(img_path)

				        # cv2.imread signals failure by returning None instead of raising.
				        if img is None:
				            print(f"❌ Failed to load image: {img_path}")
				            return

				        print(f"   Image shape: {img.shape}")

				        # Run detection.
				        print("\n🔍 Detecting layout...")
				        results = detector.detect(img)

				        print(f"\n✅ 检测到 {len(results)} 个区域:")
				        for i, res in enumerate(results, 1):
				            print(f"  [{i}] {res['category']}: "
				                  f"score={res['confidence']:.3f}, "
				                  f"bbox={res['bbox']}, "
				                  f"size={res['raw']['width']}x{res['raw']['height']}, "
				                  f"original={res['raw']['original_category_name']}")

				        # Per-category counts.
				        category_counts = Counter(res['category'] for res in results)

				        print("\n📊 类别统计 (MinerU格式):")
				        for cat, count in sorted(category_counts.items()):
				            print(f"  - {cat}: {count}")

				        # Visualize the detections.
				        if len(results) > 0:
				            print("\n🎨 Generating visualization...")
				            vis_img = _draw_detections(img, results)

				            # Save the annotated image.
				            output_dir = Path(__file__).parent / "output"
				            output_dir.mkdir(exist_ok=True)
				            output_path = output_dir / f"{Path(img_path).stem}_layout_vis.jpg"

				            # cv2.imwrite reports failure through its return value.
				            if cv2.imwrite(str(output_path), vis_img):
				                print(f"💾 Visualization saved to: {output_path}")
				            else:
				                print(f"❌ Failed to save visualization: {output_path}")
				    finally:
				        # Release detector resources on every exit path.
				        detector.cleanup()

				    print("\n✅ 测试完成!")
			
 
				+
			
 
				+
			
 
				# Run the layout-detector check when this file is executed as a script.
				if __name__ == "__main__":
				    test_layout_detector()