Browse Source

feat(processor_configs): 添加yusys_ocr_v4处理器配置,支持银行对账单处理

zhch158_admin 1 tuần trước
mục cha
commit
1594cd3e94
1 tập tin đã thay đổi với 16 bổ sung và 1 xóa
  1. 16 1
      ocr_tools/ocr_batch/processor_configs.yaml

+ 16 - 1
ocr_tools/ocr_batch/processor_configs.yaml

@@ -8,7 +8,22 @@ processors:
   # MinerU vLLM 处理器
   # 基于 MinerU 的多线程批量处理(支持 PDF 和图片)
   # -------------------------------------------------------------------------
-  yusys_ocr:
+  yusys_ocr_v4:
+    script: "/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/main_v2.py"
+    input_arg: "--input"
+    output_arg: "--output_dir"
+    extra_args:
+      - "--config=/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/config/bank_statement_yusys_v4.yaml"
+      - "--pages=1-35"
+      - "--streaming"
+      - "--debug"
+      - "--log_level=DEBUG"
+    output_subdir: "bank_statement_yusys_v4"
+    log_subdir: "logs/bank_statement_yusys_v4"
+    venv: "conda activate mineru2"
+    description: "YUSYS Wired UNET OCR 框架 GLM-OCR"
+
+  yusys_ocr_v3:
     script: "/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/main_v2.py"
     input_arg: "--input"
     output_arg: "--output_dir"