processor_configs.yaml 8.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187
  # ============================================================================
  # PDF batch processor configuration file
  # ============================================================================
  # Processor definitions.
  # Each entry under `processors` is keyed by processor name and carries the
  # same set of fields: script, input_arg, output_arg, extra_args,
  # output_subdir, log_subdir, venv, description.
  # NOTE(review): presumably `script` is launched once per input with
  # `input_arg` / `output_arg` as the CLI flag names and `venv` as the
  # environment activation command - confirm against the batch runner.
  processors:
    # -------------------------------------------------------------------------
    # universal_doc_parser processors (yusys_ocr_v4, yusys_ocr_v3, yusys_mineru)
    # All three run universal_doc_parser/main_v2.py and differ in the --config
    # file, output/log subdirectories and description.
    # -------------------------------------------------------------------------
    yusys_ocr_v4:
      script: "/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/main_v2.py"
      input_arg: "--input"
      output_arg: "--output_dir"
      extra_args:
        - "--config=/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/config/bank_statement_yusys_v4.yaml"
        - "--pages=1-35"
        - "--streaming"
        - "--debug"
        - "--log_level=DEBUG"
      output_subdir: "bank_statement_yusys_v4"
      log_subdir: "logs/bank_statement_yusys_v4"
      venv: "conda activate mineru2"
      description: "YUSYS Wired UNET OCR 框架 GLM-OCR"

    yusys_ocr_v3:
      script: "/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/main_v2.py"
      input_arg: "--input"
      output_arg: "--output_dir"
      extra_args:
        - "--config=/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/config/bank_statement_yusys_v3.yaml"
        # Disabled alternative: v2 config
        # - "--config=/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/config/bank_statement_yusys_v2.yaml"
        - "--pages=1-35"
        - "--streaming"
        - "--debug"
        - "--log_level=DEBUG"
      output_subdir: "bank_statement_yusys_v3"
      log_subdir: "logs/bank_statement_yusys_v3"
      # Disabled alternative: v2 output/log locations
      # output_subdir: "bank_statement_yusys_v2"
      # log_subdir: "logs/bank_statement_yusys_v2"
      venv: "conda activate mineru2"
      description: "YUSYS Wired UNET OCR 框架"

    yusys_mineru:
      script: "/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/main_v2.py"
      input_arg: "--input"
      output_arg: "--output_dir"
      extra_args:
        - "--config=/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/config/bank_statement_mineru_vl.yaml"
        # Disabled alternative: v2 config
        # - "--config=/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/config/bank_statement_yusys_v2.yaml"
        - "--pages=1-35"
        - "--streaming"
        - "--debug"
        - "--log_level=DEBUG"
      output_subdir: "bank_statement_mineru_vl"
      log_subdir: "logs/bank_statement_mineru_vl"
      # Disabled alternative: v2 output/log locations
      # output_subdir: "bank_statement_yusys_v2"
      # log_subdir: "logs/bank_statement_yusys_v2"
      venv: "conda activate mineru2"
      description: "YUSYS MinerU OCR 框架"

    # -------------------------------------------------------------------------
    # PaddleOCR-VL processor
    # -------------------------------------------------------------------------
    paddleocr_vl_single_process:
      script: "/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/paddle_vl_tool/main.py"
      input_arg: "--input"
      output_arg: "--output_dir"
      extra_args:
        - "--pipeline=/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/paddle_common/config/PaddleOCR-VL-Client.yaml"
        - "--device=cpu"
        # - "--no-adapter"
      output_subdir: "paddleocr_vl_results"
      log_subdir: "logs/paddleocr_vl"  # newly added: log subdirectory
      venv: "source /Users/zhch158/workspace/repository.git/PaddleX/paddle_env/bin/activate"
      description: "PaddleOCR-VL 处理器 - 视觉语言模型OCR"

    # -------------------------------------------------------------------------
    # PP-StructureV3 local processor
    # -------------------------------------------------------------------------
    ppstructurev3_single_process:
      script: "/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/ppstructure_tool/main.py"
      input_arg: "--input"
      output_arg: "--output_dir"
      extra_args:
        - "--pipeline=/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/paddle_common/config/PP-StructureV3-zhch.yaml"
        - "--device=cpu"
      output_subdir: "ppstructurev3_results"
      log_subdir: "logs/ppstructurev3"
      venv: "conda activate paddle"
      description: "PP-StructureV3 处理器 - 本地处理"

    # NOTE(review): the description says GPU-accelerated, but no `--device`
    # argument is passed here (the CPU entries pass `--device=cpu`), and the
    # input flag is `--input_file` rather than `--input`. The paths live under
    # /home/ubuntu, unlike every other entry - presumably this entry targets a
    # different host; confirm it is still in use.
    ppstructurev3_gpu:
      script: "/home/ubuntu/zhch/PaddleX/zhch/ppstructurev3_single_process.py"
      input_arg: "--input_file"
      output_arg: "--output_dir"
      extra_args:
        - "--pipeline=/home/ubuntu/zhch/PaddleX/zhch/my_config/PP-StructureV3.yaml"
      output_subdir: "ppstructurev3_gpu_results"
      log_subdir: "logs/ppstructurev3_gpu"
      venv: "conda activate paddle"
      description: "PP-StructureV3 处理器 - GPU加速"

    # -------------------------------------------------------------------------
    # PP-StructureV3 CPU processor
    # Explicitly runs on CPU.
    # NOTE(review): script and extra_args are identical to
    # ppstructurev3_single_process; only venv, output_subdir, log_subdir and
    # description differ - confirm both entries are needed.
    # -------------------------------------------------------------------------
    ppstructurev3_cpu:
      script: "/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/ppstructure_tool/main.py"
      input_arg: "--input"
      output_arg: "--output_dir"
      extra_args:
        - "--pipeline=/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/paddle_common/config/PP-StructureV3-zhch.yaml"
        - "--device=cpu"
      output_subdir: "ppstructurev3_cpu_results"
      log_subdir: "logs/ppstructurev3_cpu"
      venv: "source /Users/zhch158/workspace/repository.git/PaddleX/paddle_env/bin/activate"
      description: "PP-StructureV3 处理器 - CPU处理"

    # -------------------------------------------------------------------------
    # PP-StructureV3 API client (default)
    # Calls a remote service over its HTTP API.
    # -------------------------------------------------------------------------
    ppstructurev3_single_client:
      script: "/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/ppstructure_tool/api_client.py"
      input_arg: "--input"
      output_arg: "--output_dir"
      extra_args:
        - "--api_url=http://10.192.72.11:20026/layout-parsing"
        - "--timeout=300"
      output_subdir: "ppstructurev3_client_results"
      log_subdir: "logs/ppstructurev3_client"
      venv: "source /Users/zhch158/workspace/repository.git/PaddleX/paddle_env/bin/activate"
      description: "PP-StructureV3 HTTP API 客户端 - 远程服务"

    # -------------------------------------------------------------------------
    # MinerU vLLM processor
    # MinerU-based multi-threaded batch processing (supports PDF and images).
    # -------------------------------------------------------------------------
    mineru_vllm:
      script: "/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/mineru_vl_tool/main.py"
      input_arg: "--input"
      output_arg: "--output_dir"
      extra_args:
        - "--server_url=http://10.192.72.11:20006"
        - "--timeout=300"
        - "--batch_size=1"
      output_subdir: "mineru_vllm_results"
      log_subdir: "logs/mineru_vllm"
      venv: "conda activate mineru2"
      description: "MinerU vLLM 处理器 - 支持PDF和图片"

    # -------------------------------------------------------------------------
    # DotsOCR vLLM processor
    # DotsOCR-based batch processing (supports PDF and images).
    # -------------------------------------------------------------------------
    dotsocr_vllm:
      script: "/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/dots.ocr_vl_tool/main.py"
      input_arg: "--input"
      output_arg: "--output_dir"
      extra_args:
        - "--ip=10.192.72.11"
        - "--port=8101"
        - "--model_name=DotsOCR"
        - "--prompt_mode=prompt_layout_all_en"
        - "--batch_size=1"
        - "--max_workers=1"
        - "--dpi=200"
      output_subdir: "dotsocr_vllm_results"
      log_subdir: "logs/dotsocr_vllm"
      venv: "conda activate py312"
      description: "DotsOCR vLLM 处理器 - 支持PDF和图片"
  # ============================================================================
  # Global settings
  # ============================================================================
  global:
    # Base directory of the PDF files
    base_dir: "/Users/zhch158/workspace/data/流水分析"
    # Default output subdirectory name (used when a processor does not set one)
    output_subdir: "results"
    # Global logging settings (newly added)
    log_dir: "logs"  # global log directory (relative to base_dir)
    log_retention_days: 30  # number of days logs are kept
    log_level: "INFO"  # log level: DEBUG, INFO, WARNING, ERROR