|
|
@@ -21,7 +21,7 @@ processors:
|
|
|
- "--log_level=DEBUG"
|
|
|
output_subdir: "bank_statement_yusys_v4"
|
|
|
log_subdir: "logs/bank_statement_yusys_v4"
|
|
|
- venv: "conda activate mineru2"
|
|
|
+ venv: "conda activate mineru"
|
|
|
description: "YUSYS Wired UNET OCR 框架 GLM-OCR"
|
|
|
|
|
|
yusys_ocr_v3:
|
|
|
@@ -40,7 +40,7 @@ processors:
|
|
|
log_subdir: "logs/bank_statement_yusys_v3"
|
|
|
# output_subdir: "bank_statement_yusys_v2"
|
|
|
# log_subdir: "logs/bank_statement_yusys_v2"
|
|
|
- venv: "conda activate mineru2"
|
|
|
+ venv: "conda activate mineru"
|
|
|
description: "YUSYS Wired UNET OCR 框架"
|
|
|
|
|
|
yusys_mineru:
|
|
|
@@ -59,7 +59,7 @@ processors:
|
|
|
log_subdir: "logs/bank_statement_mineru_vl"
|
|
|
# output_subdir: "bank_statement_yusys_v2"
|
|
|
# log_subdir: "logs/bank_statement_yusys_v2"
|
|
|
- venv: "conda activate mineru2"
|
|
|
+ venv: "conda activate mineru"
|
|
|
description: "YUSYS MinerU OCR 框架"
|
|
|
|
|
|
yusys_ocr_local:
|
|
|
@@ -75,9 +75,25 @@ processors:
|
|
|
- "--log_level=DEBUG"
|
|
|
output_subdir: "bank_statement_yusys_local"
|
|
|
log_subdir: "logs/bank_statement_yusys_local"
|
|
|
- venv: "conda activate mineru2"
|
|
|
+ venv: "conda activate mineru"
|
|
|
description: "YUSYS(local) Wired UNET OCR GLM-OCR"
|
|
|
|
|
|
+ yusys_glmocr_local:
|
|
|
+ script: "/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/main_v2.py"
|
|
|
+ input_arg: "--input"
|
|
|
+ output_arg: "--output_dir"
|
|
|
+ scene_arg: "--scene"
|
|
|
+ extra_args:
|
|
|
+ - "--config=/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/config/bank_statement_glm_vl_local.yaml"
|
|
|
+ - "--pages=1-35"
|
|
|
+ - "--streaming"
|
|
|
+ - "--debug"
|
|
|
+ - "--log_level=DEBUG"
|
|
|
+ output_subdir: "bank_statement_yusys_glmocr_local"
|
|
|
+ log_subdir: "logs/bank_statement_yusys_glmocr_local"
|
|
|
+ venv: "conda activate mineru"
|
|
|
+ description: "YUSYS(local) OCR GLM-OCR VLM"
|
|
|
+
|
|
|
yusys_paddleocr_local:
|
|
|
script: "/Users/zhch158/workspace/repository.git/ocr_platform/ocr_tools/universal_doc_parser/main_v2.py"
|
|
|
input_arg: "--input"
|
|
|
@@ -91,7 +107,7 @@ processors:
|
|
|
- "--log_level=DEBUG"
|
|
|
output_subdir: "bank_statement_yusys_paddleocr_local"
|
|
|
log_subdir: "logs/bank_statement_yusys_paddleocr_local"
|
|
|
- venv: "conda activate mineru2"
|
|
|
+ venv: "conda activate mineru"
|
|
|
description: "YUSYS(local) Wired UNET OCR PaddleOCR-VL"
|
|
|
|
|
|
# -------------------------------------------------------------------------
|
|
|
@@ -182,7 +198,7 @@ processors:
|
|
|
- "--batch_size=1"
|
|
|
output_subdir: "mineru_vllm_results"
|
|
|
log_subdir: "logs/mineru_vllm"
|
|
|
- venv: "conda activate mineru2"
|
|
|
+ venv: "conda activate mineru"
|
|
|
description: "MinerU vLLM 处理器 - 支持PDF和图片"
|
|
|
|
|
|
# -------------------------------------------------------------------------
|