|
@@ -26,15 +26,6 @@ ui:
|
|
|
layout: "wide"
|
|
layout: "wide"
|
|
|
sidebar_state: "expanded"
|
|
sidebar_state: "expanded"
|
|
|
|
|
|
|
|
-# 文件路径配置
|
|
|
|
|
-paths:
|
|
|
|
|
- ocr_out_dir: "/Users/zhch158/workspace/data/至远彩色印刷工业有限公司/data_DotsOCR_Results"
|
|
|
|
|
- # ocr_out_dir: "/Users/zhch158/workspace/data/至远彩色印刷工业有限公司/data_PPStructureV3_Results"
|
|
|
|
|
- src_img_dir: "/Users/zhch158/workspace/data/至远彩色印刷工业有限公司/data_PPStructureV3_Results/2023年度报告母公司"
|
|
|
|
|
- supported_image_formats: [".png", ".jpg", ".jpeg"]
|
|
|
|
|
- # 预校验结果文件路径
|
|
|
|
|
- pre_validation_dir: "./output/pre_validation/"
|
|
|
|
|
-
|
|
|
|
|
# OCR数据配置
|
|
# OCR数据配置
|
|
|
ocr:
|
|
ocr:
|
|
|
min_text_length: 2
|
|
min_text_length: 2
|
|
@@ -82,4 +73,58 @@ ocr:
|
|
|
- field_exists: "parsing_res_list" # 如果存在该字段,判断为ppstructv3
|
|
- field_exists: "parsing_res_list" # 如果存在该字段,判断为ppstructv3
|
|
|
tool_type: "ppstructv3"
|
|
tool_type: "ppstructv3"
|
|
|
- json_is_array: true # 如果JSON是数组,判断为dots_ocr
|
|
- json_is_array: true # 如果JSON是数组,判断为dots_ocr
|
|
|
- tool_type: "dots_ocr"
|
|
|
|
|
|
|
+ tool_type: "dots_ocr"
|
|
|
|
|
+
|
|
|
|
|
+data_sources:
|
|
|
|
|
+ - name: "A用户_单元格扫描流水"
|
|
|
|
|
+ ocr_tool: "dots_ocr"
|
|
|
|
|
+ ocr_out_dir: "/Users/zhch158/workspace/data/流水分析/A用户_单元格扫描流水/data_DotsOCR_Results"
|
|
|
|
|
+ src_img_dir: "/Users/zhch158/workspace/data/流水分析/A用户_单元格扫描流水/data_DotsOCR_Results/A用户_单元格扫描流水"
|
|
|
|
|
+ description: "A用户使用Dots OCR的单元格扫描结果"
|
|
|
|
|
+
|
|
|
|
|
+ - name: "A用户_单元格扫描流水"
|
|
|
|
|
+ ocr_tool: "ppstructv3"
|
|
|
|
|
+ ocr_out_dir: "/Users/zhch158/workspace/data/流水分析/A用户_单元格扫描流水/data_PPStructureV3_Results"
|
|
|
|
|
+ src_img_dir: "/Users/zhch158/workspace/data/流水分析/A用户_单元格扫描流水/data_PPStructureV3_Results/A用户_单元格扫描流水"
|
|
|
|
|
+ description: "A用户使用PPStructV3的单元格扫描结果"
|
|
|
|
|
+
|
|
|
|
|
+ - name: "A用户_单元格图片合成"
|
|
|
|
|
+ ocr_tool: "dots_ocr"
|
|
|
|
|
+ ocr_out_dir: "/Users/zhch158/workspace/data/流水分析/A用户_单元格图片合成/data_DotsOCR_Results"
|
|
|
|
|
+ src_img_dir: "/Users/zhch158/workspace/data/流水分析/A用户_单元格图片合成/data_DotsOCR_Results/A用户_单元格图片合成"
|
|
|
|
|
+ description: "A用户使用Dots OCR的单元格图片合成结果"
|
|
|
|
|
+
|
|
|
|
|
+ - name: "A用户_单元格图片合成"
|
|
|
|
|
+ ocr_tool: "ppstructv3"
|
|
|
|
|
+ ocr_out_dir: "/Users/zhch158/workspace/data/流水分析/A用户_单元格图片合成/data_PPStructureV3_Results"
|
|
|
|
|
+ src_img_dir: "/Users/zhch158/workspace/data/流水分析/A用户_单元格图片合成/data_PPStructureV3_Results/A用户_单元格图片合成"
|
|
|
|
|
+ description: "A用户使用PPStructV3的单元格图片合成结果"
|
|
|
|
|
+
|
|
|
|
|
+ - name: "B用户_扫描流水"
|
|
|
|
|
+ ocr_tool: "dots_ocr"
|
|
|
|
|
+ ocr_out_dir: "/Users/zhch158/workspace/data/流水分析/B用户_扫描流水/data_DotsOCR_Results"
|
|
|
|
|
+ src_img_dir: "/Users/zhch158/workspace/data/流水分析/B用户_扫描流水/data_DotsOCR_Results/B用户_扫描流水"
|
|
|
|
|
+ description: "B用户使用Dots OCR的扫描结果"
|
|
|
|
|
+
|
|
|
|
|
+ - name: "B用户_扫描流水"
|
|
|
|
|
+ ocr_tool: "ppstructv3"
|
|
|
|
|
+ ocr_out_dir: "/Users/zhch158/workspace/data/流水分析/B用户_扫描流水/data_PPStructureV3_Results"
|
|
|
|
|
+ src_img_dir: "/Users/zhch158/workspace/data/流水分析/B用户_扫描流水/data_PPStructureV3_Results/B用户_扫描流水"
|
|
|
|
|
+ description: "B用户使用PPStructV3的扫描结果"
|
|
|
|
|
+
|
|
|
|
|
+ - name: "B用户_图片合成流水"
|
|
|
|
|
+ ocr_tool: "dots_ocr"
|
|
|
|
|
+ ocr_out_dir: "/Users/zhch158/workspace/data/流水分析/B用户_图片合成流水/data_DotsOCR_Results"
|
|
|
|
|
+ src_img_dir: "/Users/zhch158/workspace/data/流水分析/B用户_图片合成流水/data_DotsOCR_Results/B用户_图片合成流水"
|
|
|
|
|
+ description: "B用户使用Dots OCR的图片合成结果"
|
|
|
|
|
+
|
|
|
|
|
+ - name: "B用户_图片合成流水"
|
|
|
|
|
+ ocr_tool: "ppstructv3"
|
|
|
|
|
+ ocr_out_dir: "/Users/zhch158/workspace/data/流水分析/B用户_图片合成流水/data_PPStructureV3_Results"
|
|
|
|
|
+ src_img_dir: "/Users/zhch158/workspace/data/流水分析/B用户_图片合成流水/data_PPStructureV3_Results/B用户_图片合成流水"
|
|
|
|
|
+ description: "B用户使用PPStructV3的图片合成结果"
|
|
|
|
|
+
|
|
|
|
|
+# 预校验结果文件路径
|
|
|
|
|
+pre_validation:
|
|
|
|
|
+ out_dir: "./output/pre_validation/"
|
|
|
|
|
+
|