|
|
@@ -0,0 +1,153 @@
|
|
|
+# OCR validation tool configuration file
|
|
|
+
|
|
|
+# Style configuration: base font size, color palette and layout defaults
|
|
|
+styles:
|
|
|
+  font_size: 8
|
|
|
+
|
|
|
+  colors:
|
|
|
+    primary: "#0288d1"
|
|
|
+    secondary: "#ff9800"
|
|
|
+    success: "#4caf50"
|
|
|
+    error: "#f44336"
|
|
|
+    warning: "#ff9800"  # same value as colors.secondary
|
|
|
+    background: "#fafafa"
|
|
|
+    text: "#333333"
|
|
|
+
|
|
|
+  layout:
|
|
|
+    default_zoom: 1.0
|
|
|
+    default_height: 800
|
|
|
+    sidebar_width: 1  # NOTE(review): content_width is fractional (0.65) but this is 1 - confirm the intended unit/ratio
|
|
|
+    content_width: 0.65
|
|
|
+
|
|
|
+# UI configuration: page title, icon, layout mode and initial sidebar state
|
|
|
+ui:
|
|
|
+  page_title: "OCR可视化校验工具"
|
|
|
+  page_icon: "🔍"
|
|
|
+  layout: "wide"
|
|
|
+  sidebar_state: "expanded"
|
|
|
+
|
|
|
+# OCR data configuration
|
|
|
+ocr:
|
|
|
+  min_text_length: 2
|
|
|
+  default_confidence: 1.0
|
|
|
+  exclude_texts: ["Picture", ""]  # the second entry is the empty string
|
|
|
+
|
|
|
+  # Image orientation detection settings
|
|
|
+  orientation_detection:
|
|
|
+    enabled: true
|
|
|
+    confidence_threshold: 0.3  # confidence threshold
|
|
|
+    methods: ["opencv_analysis"]  # detection methods
|
|
|
+    cache_results: true  # cache the detection results
|
|
|
+
|
|
|
+  # Per-tool OCR configuration: display name, JSON layout and field-name mapping
|
|
|
+  tools:
|
|
|
+    dots_ocr:
|
|
|
+      name: "Dots OCR"
|
|
|
+      description: "专业VLM OCR"
|
|
|
+      json_structure: "array"  # the JSON output is an array
|
|
|
+      text_field: "text"
|
|
|
+      bbox_field: "bbox"
|
|
|
+      category_field: "category"
|
|
|
+      confidence_field: "confidence"
|
|
|
+      # Rotation handling
|
|
|
+      rotation:
|
|
|
+        coordinates_are_pre_rotated: false  # coordinates are not pre-rotated
|
|
|
+
|
|
|
+    ppstructv3:
|
|
|
+      name: "PPStructV3"
|
|
|
+      description: "PaddleOCR PP-StructureV3"
|
|
|
+      json_structure: "object"  # the JSON output is an object
|
|
|
+      parsing_results_field: "parsing_res_list"
|
|
|
+      text_field: "block_content"
|
|
|
+      bbox_field: "block_bbox"
|
|
|
+      rec_texts_field: "overall_ocr_res.rec_texts"  # for text blocks inside tables
|
|
|
+      rec_boxes_field: "overall_ocr_res.rec_boxes"  # for text blocks inside tables
|
|
|
+      category_field: "block_label"
|
|
|
+      confidence_field: "confidence"
|
|
|
+      # Rotation handling
|
|
|
+      rotation:
|
|
|
+        coordinates_are_pre_rotated: true  # coordinates are already pre-rotated
|
|
|
+
|
|
|
+    table_recognition_v2:
|
|
|
+      name: "TableRecognitionV2"
|
|
|
+      description: "PaddleOCR Table Recognition V2"
|
|
|
+      json_structure: "object"
|
|
|
+      parsing_results_field: "table_res_list"
|
|
|
+      text_field: "pred_html"
|
|
|
+      bbox_field: "cell_box_list"  # the earlier value "cell_box_listox" was a typo
|
|
|
+      rec_texts_field: "table_ocr_pred.rec_texts"  # for text blocks inside tables
|
|
|
+      rec_boxes_field: "table_ocr_pred.rec_boxes"  # for text blocks inside tables
|
|
|
+      category_field: "type"
|
|
|
+      confidence_field: "confidence"
|
|
|
+      rotation:
|
|
|
+        coordinates_are_pre_rotated: true
|
|
|
+
|
|
|
+    mineru:
|
|
|
+      name: "MinerU"
|
|
|
+      description: "MinerU OCR"
|
|
|
+      json_structure: "array"  # the JSON output is an array
|
|
|
+      text_field: "text"
|
|
|
+      bbox_field: "bbox"
|
|
|
+      category_field: "type"
|
|
|
+      confidence_field: "confidence"
|
|
|
+      # Table-related fields
|
|
|
+      table_body_field: "table_body"
|
|
|
+      table_cells_field: "table_cells"
|
|
|
+      img_path_field: "img_path"
|
|
|
+      # Rotation handling
|
|
|
+      rotation:
|
|
|
+        coordinates_are_pre_rotated: false
|
|
|
+
|
|
|
+  # Rules for auto-detecting the tool type, listed from highest to lowest priority
|
|
|
+  auto_detection:
|
|
|
+    enabled: true
|
|
|
+    rules:
|
|
|
+      # Table Recognition V2 - highest priority
|
|
|
+      - tool_type: "table_recognition_v2"
|
|
|
+        conditions:
|
|
|
+          - type: "field_exists"
|
|
|
+            field: "table_res_list"
|
|
|
+          - type: "field_not_exists"
|
|
|
+            field: "parsing_res_list"
|
|
|
+        priority: 1  # rank follows the rule order; presumably lower number = higher priority - confirm against the loader
|
|
|
+
|
|
|
+      # PPStructV3 - second priority
|
|
|
+      - tool_type: "ppstructv3"
|
|
|
+        conditions:
|
|
|
+          - type: "field_exists"
|
|
|
+            field: "parsing_res_list"
|
|
|
+          - type: "field_exists"
|
|
|
+            field: "doc_preprocessor_res"
|
|
|
+        priority: 2
|
|
|
+
|
|
|
+      # MinerU - third priority
|
|
|
+      - tool_type: "mineru"
|
|
|
+        conditions:
|
|
|
+          - type: "field_exists"
|
|
|
+            field: "page_idx"
|
|
|
+          - type: "field_exists"
|
|
|
+            field: "type"
|
|
|
+          - type: "json_structure"
|
|
|
+            structure: "array"
|
|
|
+        priority: 3
|
|
|
+
|
|
|
+      # Dots OCR - lowest priority (default fallback)
|
|
|
+      - tool_type: "dots_ocr"
|
|
|
+        conditions:
|
|
|
+          - type: "json_structure"
|
|
|
+            structure: "array"
|
|
|
+          - type: "field_exists"
|
|
|
+            field: "category"
|
|
|
+        priority: 4
|
|
|
+
|
|
|
+# Path for pre-validation result files
|
|
|
+pre_validation:
|
|
|
+  out_dir: "./output/pre_validation/"
|
|
|
+
|
|
|
+data_sources:  # list of YAML file names; presumably one config per data set - verify against the loader
|
|
|
+  - 德_内蒙古银行照.yaml
|
|
|
+  - 对公_招商银行图.yaml
|
|
|
+  - A用户_单元格扫描流水.yaml
|
|
|
+  - B用户_扫描流水.yaml
|
|
|
+  - 至远彩色_2023年报.yaml
|
|
|
+
|