1 月之前 · 5bbe299ec9
--- a/ocr_tools/remove_watermark_tool/remove_watermark.py
+++ b/ocr_tools/remove_watermark_tool/remove_watermark.py
@@ -2,35 +2,42 @@
 
				 银行流水水印去除工具
			
 
				 
			
 
				 支持 PDF 和常见图片格式（jpg/png/tif/bmp/webp）。
			
 
				-- 输入 PDF → 输出去水印 PDF（扫描件）或直接复制（文字型）
			
 
				-- 输入图片 → 输出去水印图片（保持原格式）
			
 
				-适用于福建农信、邮储银行等带有半透明文字水印的银行流水单。
			
 
				+参数默认从与 main_v2 相同的场景 YAML 读取（preprocessor.watermark_removal），
			
 
				+命令行仅用于输入/输出、批量、预览及少量覆盖项。
			
 
				 
			
 
				 用法:
			
 
				-    # 处理单个 PDF 或图片
			
 
				+    # 使用默认场景配置（bank_statement_yusys_local.yaml）
			
 
				     python remove_watermark.py input.pdf
			
 
				-    python remove_watermark.py input.jpg
			
 
				 
			
 
				-    # 指定输出路径
			
 
				-    python remove_watermark.py input.pdf -o output.pdf
			
 
				+    # 指定场景配置（与 Pipeline 一致）
			
 
				+    python remove_watermark.py input.png -c ../universal_doc_parser/config/bank_statement_yusys_local.yaml
			
 
				 
			
 
				-    # 指定页面范围（支持 "1-5,7,9-12" 格式）
			
 
				-    python remove_watermark.py input.pdf --page-range 1-3
			
 
				+    # 保存调试图（before/after/compare/meta）
			
 
				+    python remove_watermark.py input.png -o ./out --debug
			
 
				 
			
 
				-    # 调整去除阈值（默认 160，范围建议 140-180）
			
 
				+    # 临时覆盖阈值（其余仍来自配置文件）
			
 
				     python remove_watermark.py input.pdf --threshold 170
			
 
				 
			
 
				-    # 批量处理目录下所有 PDF 和图片
			
 
				-    python remove_watermark.py /path/to/dir/ --batch
			
 
				-
			
 
				-    # 预览单页/图片效果（不保存，直接展示对比图）
			
 
				+    # 预览
			
 
				     python remove_watermark.py input.pdf --preview --page 0
			
 
				-    python remove_watermark.py input.jpg --preview
			
 
				+
			
 
				+    # 批量
			
 
				+    python remove_watermark.py /path/to/dir/ --batch -o ./cleaned
			
 
				+
			
 
				+    # 对比 threshold vs masked_adaptive（输出三联图）
			
 
				+    python remove_watermark.py page_002.png --compare-methods -o ./method_compare
			
 
				 """
			
 
				 import argparse
			
 
				+import copy
			
 
				+import json
			
 
				 import sys
			
 
				+from dataclasses import dataclass
			
 
				 from pathlib import Path
			
 
				-from typing import Optional
			
 
				+from typing import Any, Dict, Optional
			
 
				+
			
 
				+import cv2
			
 
				+import numpy as np
			
 
				+import yaml
			
 
				 
			
 
				 # 将 ocr_platform 根目录加入 sys.path，以便导入 ocr_utils
			
 
				 _repo_root = Path(__file__).parents[2]
			
@@ -40,7 +47,10 @@ if str(_repo_root) not in sys.path:
 
				 from loguru import logger
			
 
				 from ocr_utils.watermark_utils import (
			
 
				     detect_watermark,
			
 
				-    remove_watermark_from_image,
			
 
				+    remove_watermark_from_image_rgb,
			
 
				+    render_watermark_mask_overlay,
			
 
				+    save_watermark_removal_debug,
			
 
				+    save_watermark_mask_debug_layers,
			
 
				     scan_pdf_watermark_xobjs,
			
 
				     remove_txt_pdf_watermark,
			
 
				 )
			
@@ -48,6 +58,190 @@ from ocr_utils.watermark_utils import (
 
				 # 支持的图片后缀（小写）
			
 
				 IMAGE_SUFFIXES = {".jpg", ".jpeg", ".png", ".tif", ".tiff", ".bmp", ".webp"}
			
 
				 
			
 
				+_DEFAULT_CONFIG_PATH = (
			
 
				+    _repo_root
			
 
				+    / "ocr_tools/universal_doc_parser/config/bank_statement_yusys_local.yaml"
			
 
				+)
			
 
				+
			
 
				+
			
 
				+@dataclass
			
 
				+class WatermarkToolSettings:
			
 
				+    """从场景 YAML 解析的水印处理参数（与 Pipeline preprocessor 对齐）。"""
			
 
				+
			
 
				+    threshold: int = 160
			
 
				+    morph_close_kernel: int = 0
			
 
				+    dpi: int = 200
			
 
				+    method: str = "threshold"
			
 
				+    contrast_enhancement: Optional[Dict[str, Any]] = None
			
 
				+    debug_options: Optional[Dict[str, Any]] = None
			
 
				+    watermark_enabled: bool = True
			
 
				+    watermark_config: Optional[Dict[str, Any]] = None
			
 
				+
			
 
				+    @property
			
 
				+    def debug_image_format(self) -> str:
			
 
				+        opts = self.debug_options or {}
			
 
				+        return str(opts.get("image_format") or "png").lstrip(".")
			
 
				+
			
 
				+
			
 
				+def load_watermark_settings(config_path: Path) -> WatermarkToolSettings:
			
 
				+    """
			
 
				+    从 universal_doc_parser 场景配置读取 preprocessor.watermark_removal 与 input.dpi。
			
 
				+
			
 
				+    不依赖完整 ConfigManager，避免仅调试水印时强依赖 layout/ocr 等段。
			
 
				+    """
			
 
				+    config_path = Path(config_path)
			
 
				+    if not config_path.is_file():
			
 
				+        raise FileNotFoundError(f"配置文件不存在: {config_path}")
			
 
				+
			
 
				+    with open(config_path, encoding="utf-8") as f:
			
 
				+        raw = yaml.safe_load(f) or {}
			
 
				+
			
 
				+    preprocessor = raw.get("preprocessor") or {}
			
 
				+    wm = preprocessor.get("watermark_removal") or {}
			
 
				+    input_cfg = raw.get("input") or {}
			
 
				+
			
 
				+    contrast = wm.get("contrast_enhancement")
			
 
				+    if contrast is not None and not isinstance(contrast, dict):
			
 
				+        contrast = None
			
 
				+
			
 
				+    wm_full = copy.deepcopy(wm)
			
 
				+    return WatermarkToolSettings(
			
 
				+        threshold=int(wm.get("threshold", 160)),
			
 
				+        morph_close_kernel=int(wm.get("morph_close_kernel", 0)),
			
 
				+        dpi=int(input_cfg.get("dpi", 200)),
			
 
				+        method=str(wm.get("method") or "threshold"),
			
 
				+        contrast_enhancement=copy.deepcopy(contrast) if contrast else None,
			
 
				+        debug_options=copy.deepcopy(wm.get("debug_options"))
			
 
				+        if wm.get("debug_options")
			
 
				+        else None,
			
 
				+        watermark_enabled=bool(wm.get("enabled", True)),
			
 
				+        watermark_config=wm_full,
			
 
				+    )
			
 
				+
			
 
				+
			
 
				+def resolve_watermark_settings(
			
 
				+    config_path: Path,
			
 
				+    *,
			
 
				+    threshold: Optional[int] = None,
			
 
				+    morph_close_kernel: Optional[int] = None,
			
 
				+    dpi: Optional[int] = None,
			
 
				+    no_contrast: bool = False,
			
 
				+    text_black_target: Optional[int] = None,
			
 
				+    method: Optional[str] = None,
			
 
				+) -> WatermarkToolSettings:
			
 
				+    """加载配置并应用命令行覆盖。"""
			
 
				+    settings = load_watermark_settings(config_path)
			
 
				+
			
 
				+    if threshold is not None:
			
 
				+        settings.threshold = threshold
			
 
				+    if morph_close_kernel is not None:
			
 
				+        settings.morph_close_kernel = morph_close_kernel
			
 
				+    if dpi is not None:
			
 
				+        settings.dpi = dpi
			
 
				+    if method is not None:
			
 
				+        settings.method = method
			
 
				+        if settings.watermark_config is not None:
			
 
				+            settings.watermark_config["method"] = method
			
 
				+
			
 
				+    if no_contrast and settings.contrast_enhancement:
			
 
				+        settings.contrast_enhancement = copy.deepcopy(settings.contrast_enhancement)
			
 
				+        settings.contrast_enhancement["enabled"] = False
			
 
				+    elif text_black_target is not None:
			
 
				+        if not settings.contrast_enhancement:
			
 
				+            settings.contrast_enhancement = {"enabled": True, "method": "text_restore"}
			
 
				+        else:
			
 
				+            settings.contrast_enhancement = copy.deepcopy(settings.contrast_enhancement)
			
 
				+        settings.contrast_enhancement["enabled"] = True
			
 
				+        settings.contrast_enhancement["text_black_target"] = text_black_target
			
 
				+
			
 
				+    return settings
			
 
				+
			
 
				+
			
 
				+def _watermark_removal_cfg_for_method(
			
 
				+    settings: WatermarkToolSettings,
			
 
				+    method: str,
			
 
				+) -> Dict[str, Any]:
			
 
				+    """构造指定 method 的 watermark_removal 配置副本。"""
			
 
				+    cfg = copy.deepcopy(settings.watermark_config or {})
			
 
				+    cfg["method"] = method
			
 
				+    cfg["threshold"] = settings.threshold
			
 
				+    cfg["morph_close_kernel"] = settings.morph_close_kernel
			
 
				+    return cfg
			
 
				+
			
 
				+
			
 
				+def _apply_image_watermark_removal(
			
 
				+    img_np: np.ndarray,
			
 
				+    *,
			
 
				+    settings: WatermarkToolSettings,
			
 
				+    contrast_enhancement: Optional[Dict[str, Any]] = None,
			
 
				+    apply_watermark_removal: bool = True,
			
 
				+    removal_debug: Optional[Dict[str, Any]] = None,
			
 
				+) -> np.ndarray:
			
 
				+    """与 universal_doc_parser 一致的 RGB 去水印 + 可选对比度增强。"""
			
 
				+    wm_cfg = _watermark_removal_cfg_for_method(settings, settings.method)
			
 
				+    return np.asarray(
			
 
				+        remove_watermark_from_image_rgb(
			
 
				+            img_np,
			
 
				+            threshold=settings.threshold,
			
 
				+            morph_close_kernel=settings.morph_close_kernel,
			
 
				+            contrast_enhancement=contrast_enhancement,
			
 
				+            apply_watermark_removal=apply_watermark_removal,
			
 
				+            watermark_removal_cfg=wm_cfg,
			
 
				+            removal_debug=removal_debug,
			
 
				+            return_pil=False,
			
 
				+        )
			
 
				+    )
			
 
				+
			
 
				+
			
 
				+def _active_contrast_enhancement(
			
 
				+    settings: WatermarkToolSettings,
			
 
				+) -> Optional[Dict[str, Any]]:
			
 
				+    ce = settings.contrast_enhancement
			
 
				+    if not ce or not ce.get("enabled", False):
			
 
				+        return None
			
 
				+    return ce
			
 
				+
			
 
				+
			
 
				+def _maybe_save_watermark_debug(
			
 
				+    before: np.ndarray,
			
 
				+    after: np.ndarray,
			
 
				+    debug_output_dir: Path,
			
 
				+    page_name: str,
			
 
				+    *,
			
 
				+    settings: WatermarkToolSettings,
			
 
				+    contrast_enhancement: Optional[Dict[str, Any]] = None,
			
 
				+    removal_debug: Optional[Dict[str, Any]] = None,
			
 
				+) -> None:
			
 
				+    """保存调试图到 debug_comparison/watermark_removal/（与 pipeline 相同布局）。"""
			
 
				+    params: Dict[str, Any] = {
			
 
				+        "method": settings.method,
			
 
				+        "threshold": settings.threshold,
			
 
				+        "morph_close_kernel": settings.morph_close_kernel,
			
 
				+    }
			
 
				+    if contrast_enhancement:
			
 
				+        params["contrast_enhancement"] = contrast_enhancement
			
 
				+    if removal_debug:
			
 
				+        for key in ("mode", "T_wm", "T_protect", "wm_mask_ratio", "white_pixel_ratio"):
			
 
				+            if key in removal_debug:
			
 
				+                params[key] = removal_debug[key]
			
 
				+
			
 
				+    mask_overlay = None
			
 
				+    if removal_debug and "wm_mask" in removal_debug:
			
 
				+        mask_overlay = render_watermark_mask_overlay(
			
 
				+            before, removal_debug["wm_mask"]
			
 
				+        )
			
 
				+
			
 
				+    save_watermark_removal_debug(
			
 
				+        before,
			
 
				+        after,
			
 
				+        debug_output_dir,
			
 
				+        page_name,
			
 
				+        processing_params=params,
			
 
				+        image_format=settings.debug_image_format,
			
 
				+        save_compare=True,
			
 
				+        mask_overlay=mask_overlay,
			
 
				+    )
			
 
				+
			
 
				 
			
 
				 def _try_remove_txt_pdf_watermark(input_path: Path, output_path: Path) -> int:
			
 
				     """
			
@@ -81,11 +275,12 @@ def _try_remove_txt_pdf_watermark(input_path: Path, output_path: Path) -> int:
 
				 def process_document(
			
 
				     input_path: Path,
			
 
				     output_path: Path,
			
 
				-    threshold: int = 160,
			
 
				-    morph_close_kernel: int = 0,
			
 
				-    dpi: int = 200,
			
 
				+    settings: WatermarkToolSettings,
			
 
				     page_range: Optional[str] = None,
			
 
				     force_image: bool = False,
			
 
				+    save_debug: bool = False,
			
 
				+    debug_output_dir: Optional[Path] = None,
			
 
				+    apply_watermark_removal: Optional[bool] = None,
			
 
				 ) -> int:
			
 
				     """
			
 
				     统一处理函数：支持 PDF（扫描件）和图片，去除水印后保存。
			
@@ -99,23 +294,27 @@ def process_document(
 
				     Args:
			
 
				         input_path: 输入文件路径（PDF 或图片）
			
 
				         output_path: 输出文件路径
			
 
				-        threshold: 灰度阈值（140-180），越大保守，越小激进
			
 
				-        morph_close_kernel: 形态学闭运算核大小，0 跳过
			
 
				-        dpi: PDF 渲染分辨率
			
 
				+        settings: 水印配置（含 method / threshold / mask / adaptive）
			
 
				         page_range: 页面范围字符串，如 "1-5,7,9-12"（从 1 开始，仅对 PDF 有效）
			
 
				         force_image: 强制对文字型 PDF 使用图像化处理（会失去文字可搜索性，
			
 
				                      但能处理水印嵌在内容流中的情况）
			
 
				+        save_debug: 是否保存 before/after/compare/meta 到 debug_comparison/watermark_removal/
			
 
				+        debug_output_dir: 调试图根目录，默认 output_path 的父目录
			
 
				+        apply_watermark_removal: 默认取 settings.watermark_enabled
			
 
				 
			
 
				     Returns:
			
 
				         实际处理的页/图片数
			
 
				     """
			
 
				     import shutil
			
 
				-    import numpy as np
			
 
				     from io import BytesIO
			
 
				     from PIL import Image
			
 
				     from ocr_utils.pdf_utils import PDFUtils
			
 
				 
			
 
				     is_pdf = input_path.suffix.lower() == ".pdf"
			
 
				+    dpi = settings.dpi
			
 
				+    contrast_enhancement = _active_contrast_enhancement(settings)
			
 
				+    if apply_watermark_removal is None:
			
 
				+        apply_watermark_removal = settings.watermark_enabled
			
 
				 
			
 
				     # 统一加载 + 分类（PDF 用 MinerU pdf_classify，图片直接读取）
			
 
				     images, pdf_type, pdf_doc, renderer = PDFUtils.load_and_classify_document(
			
@@ -161,12 +360,22 @@ def process_document(
 
				 
			
 
				     logger.info(
			
 
				         f"{'📄' if is_pdf else '🖼️ '} 处理: {input_path.name}  "
			
 
				-        f"共 {len(images)} {'页' if is_pdf else '张'}  threshold={threshold}"
			
 
				+        f"共 {len(images)} {'页' if is_pdf else '张'}  "
			
 
				+        f"method={settings.method} threshold={settings.threshold}"
			
 
				+    )
			
 
				+
			
 
				+    contrast_only = (
			
 
				+        not apply_watermark_removal
			
 
				+        and contrast_enhancement
			
 
				+        and contrast_enhancement.get("enabled", False)
			
 
				     )
			
 
				 
			
 
				     # 水印检测（仅用第一页/图判断，同一文档水印通常一致）
			
 
				     # _known_has_wm 已在 txt 分支设置时，跳过重复检测
			
 
				-    if _known_has_wm is not None:
			
 
				+    if contrast_only:
			
 
				+        has_wm = True
			
 
				+        logger.info("📋 配置关闭去水印，仅应用 contrast_enhancement")
			
 
				+    elif _known_has_wm is not None:
			
 
				         has_wm = _known_has_wm
			
 
				         logger.info("🔍 检测到水印，启动去水印处理" if has_wm else "✅ 未检测到水印，跳过")
			
 
				     else:
			
@@ -185,6 +394,7 @@ def process_document(
 
				                 return 1
			
 
				 
			
 
				     output_path.parent.mkdir(parents=True, exist_ok=True)
			
 
				+    debug_root = debug_output_dir or output_path.parent
			
 
				 
			
 
				     if is_pdf:
			
 
				         # 逐页处理后重新打包为 PDF
			
@@ -197,13 +407,31 @@ def process_document(
 
				         for i, img_dict in enumerate(images):
			
 
				             pil_img = img_dict["img_pil"]
			
 
				             img_np = np.array(pil_img)
			
 
				+            page_name = f"{input_path.stem}_page_{i + 1:03d}"
			
 
				 
			
 
				             if has_wm:
			
 
				-                cleaned_gray = remove_watermark_from_image(
			
 
				-                    img_np, threshold=threshold,
			
 
				-                    morph_close_kernel=morph_close_kernel, return_pil=False,
			
 
				+                before = img_np.copy()
			
 
				+                removal_dbg: Dict[str, Any] = {}
			
 
				+                cleaned_rgb = _apply_image_watermark_removal(
			
 
				+                    img_np,
			
 
				+                    settings=settings,
			
 
				+                    contrast_enhancement=contrast_enhancement,
			
 
				+                    apply_watermark_removal=apply_watermark_removal,
			
 
				+                    removal_debug=removal_dbg,
			
 
				+                )
			
 
				+                if save_debug:
			
 
				+                    _maybe_save_watermark_debug(
			
 
				+                        before,
			
 
				+                        cleaned_rgb,
			
 
				+                        debug_root,
			
 
				+                        page_name,
			
 
				+                        settings=settings,
			
 
				+                        contrast_enhancement=contrast_enhancement,
			
 
				+                        removal_debug=removal_dbg,
			
 
				+                    )
			
 
				+                out_pil = Image.fromarray(
			
 
				+                    cv2.cvtColor(cleaned_rgb, cv2.COLOR_BGR2RGB)
			
 
				                 )
			
 
				-                out_pil = Image.fromarray(cleaned_gray).convert("RGB")
			
 
				             else:
			
 
				                 out_pil = pil_img
			
 
				 
			
@@ -223,11 +451,27 @@ def process_document(
 
				     else:
			
 
				         # 图片：有水印则去除后保存
			
 
				         img_np = np.array(images[0]["img_pil"])
			
 
				-        cleaned_gray = remove_watermark_from_image(
			
 
				-            img_np, threshold=threshold,
			
 
				-            morph_close_kernel=morph_close_kernel, return_pil=False,
			
 
				+        before = img_np.copy()
			
 
				+        removal_dbg = {}
			
 
				+        cleaned_rgb = _apply_image_watermark_removal(
			
 
				+            img_np,
			
 
				+            settings=settings,
			
 
				+            contrast_enhancement=contrast_enhancement,
			
 
				+            apply_watermark_removal=apply_watermark_removal,
			
 
				+            removal_debug=removal_dbg,
			
 
				         )
			
 
				-        Image.fromarray(cleaned_gray, mode="L").save(str(output_path))
			
 
				+        if save_debug:
			
 
				+            _maybe_save_watermark_debug(
			
 
				+                before,
			
 
				+                cleaned_rgb,
			
 
				+                debug_root,
			
 
				+                input_path.stem,
			
 
				+                settings=settings,
			
 
				+                contrast_enhancement=contrast_enhancement,
			
 
				+                removal_debug=removal_dbg,
			
 
				+            )
			
 
				+        out_rgb = cv2.cvtColor(cleaned_rgb, cv2.COLOR_BGR2RGB)
			
 
				+        Image.fromarray(out_rgb).save(str(output_path))
			
 
				 
			
 
				     logger.info(f"✅ 保存到: {output_path}")
			
 
				     return len(images)
			
@@ -235,13 +479,11 @@ def process_document(
 
				 
			
 
				 def preview_page(
			
 
				     input_path: Path,
			
 
				+    settings: WatermarkToolSettings,
			
 
				     page_idx: int = 0,
			
 
				-    threshold: int = 160,
			
 
				-    dpi: int = 200,
			
 
				 ):
			
 
				     """展示单页原图与去水印对比（需要 matplotlib）。支持 PDF 和图片文件。"""
			
 
				     try:
			
 
				-        import numpy as np
			
 
				         import matplotlib.pyplot as plt
			
 
				         import matplotlib
			
 
				         matplotlib.rcParams['font.sans-serif'] = ['Arial Unicode MS', 'SimHei', 'sans-serif']
			
@@ -259,7 +501,7 @@ def preview_page(
 
				         doc = fitz.open(str(input_path))
			
 
				         if page_idx >= len(doc):
			
 
				             raise ValueError(f"页码 {page_idx} 超出范围（共 {len(doc)} 页）")
			
 
				-        mat = fitz.Matrix(dpi / 72, dpi / 72)
			
 
				+        mat = fitz.Matrix(settings.dpi / 72, settings.dpi / 72)
			
 
				         page = doc[page_idx]
			
 
				         pix = page.get_pixmap(matrix=mat, alpha=False)
			
 
				         img_np = np.frombuffer(pix.samples, dtype=np.uint8).reshape(pix.h, pix.w, 3)
			
@@ -271,56 +513,261 @@ def preview_page(
 
				     else:
			
 
				         raise ValueError(f"不支持的文件格式: {suffix}")
			
 
				 
			
 
				-    cleaned = remove_watermark_from_image(img_np, threshold=threshold, return_pil=False)
			
 
				+    contrast = _active_contrast_enhancement(settings)
			
 
				+    cleaned_rgb = _apply_image_watermark_removal(
			
 
				+        img_np,
			
 
				+        settings=settings,
			
 
				+        contrast_enhancement=contrast,
			
 
				+        apply_watermark_removal=settings.watermark_enabled,
			
 
				+    )
			
 
				+    cleaned = cv2.cvtColor(cleaned_rgb, cv2.COLOR_BGR2GRAY)
			
 
				 
			
 
				     fig, axes = plt.subplots(1, 2, figsize=(20, 14))
			
 
				     axes[0].imshow(img_np)
			
 
				     axes[0].set_title(title_orig, fontsize=14)
			
 
				     axes[0].axis('off')
			
 
				 
			
 
				+    subtitle = f"method={settings.method}, threshold={settings.threshold}"
			
 
				+    if contrast:
			
 
				+        subtitle += f", contrast={contrast.get('method', 'on')}"
			
 
				     axes[1].imshow(cleaned, cmap='gray')
			
 
				-    axes[1].set_title(f"去水印后  threshold={threshold}", fontsize=14)
			
 
				+    axes[1].set_title(f"去水印后  {subtitle}", fontsize=14)
			
 
				     axes[1].axis('off')
			
 
				 
			
 
				     plt.tight_layout()
			
 
				     plt.show()
			
 
				 
			
 
				 
			
 
				+def _run_process_document(
			
 
				+    input_path: Path,
			
 
				+    output_path: Path,
			
 
				+    settings: WatermarkToolSettings,
			
 
				+    *,
			
 
				+    page_range: Optional[str] = None,
			
 
				+    force_image: bool = False,
			
 
				+    save_debug: bool = False,
			
 
				+    debug_output_dir: Optional[Path] = None,
			
 
				+) -> int:
			
 
				+    return process_document(
			
 
				+        input_path,
			
 
				+        output_path,
			
 
				+        settings,
			
 
				+        page_range=page_range,
			
 
				+        force_image=force_image,
			
 
				+        save_debug=save_debug,
			
 
				+        debug_output_dir=debug_output_dir,
			
 
				+    )
			
 
				+
			
 
				+
			
 
				+def compare_watermark_methods(
			
 
				+    input_path: Path,
			
 
				+    output_dir: Path,
			
 
				+    settings: WatermarkToolSettings,
			
 
				+) -> Dict[str, str]:
			
 
				+    """
			
 
				+    同一张图对比 threshold 与 masked_adaptive，输出三联图与 meta。
			
 
				+
			
 
				+    Returns:
			
 
				+        各输出文件路径
			
 
				+    """
			
 
				+    from PIL import Image
			
 
				+
			
 
				+    output_dir.mkdir(parents=True, exist_ok=True)
			
 
				+    stem = input_path.stem
			
 
				+    img_rgb = np.array(Image.open(str(input_path)).convert("RGB"))
			
 
				+    contrast = _active_contrast_enhancement(settings)
			
 
				+
			
 
				+    paths: Dict[str, str] = {}
			
 
				+    results: Dict[str, np.ndarray] = {}
			
 
				+
			
 
				+    for method in ("threshold", "masked_adaptive"):
			
 
				+        sub = copy.deepcopy(settings)
			
 
				+        sub.method = method
			
 
				+        dbg: Dict[str, Any] = {}
			
 
				+        out = _apply_image_watermark_removal(
			
 
				+            img_rgb,
			
 
				+            settings=sub,
			
 
				+            contrast_enhancement=contrast,
			
 
				+            removal_debug=dbg,
			
 
				+        )
			
 
				+        out_rgb = cv2.cvtColor(out, cv2.COLOR_BGR2RGB)
			
 
				+        results[method] = out_rgb
			
 
				+        out_path = output_dir / f"{stem}_cleaned_{method}.png"
			
 
				+        Image.fromarray(out_rgb).save(str(out_path))
			
 
				+        paths[method] = str(out_path)
			
 
				+        meta_path = output_dir / f"{stem}_meta_{method}.json"
			
 
				+        meta = {
			
 
				+            "method": method,
			
 
				+            "threshold": settings.threshold,
			
 
				+            "mask_mode": dbg.get("mask_mode"),
			
 
				+            "direction_filter": dbg.get("direction_filter"),
			
 
				+            "whiten_mode": dbg.get("whiten_mode"),
			
 
				+            "T_wm": dbg.get("T_wm"),
			
 
				+            "T_protect": dbg.get("T_protect"),
			
 
				+            "mode": dbg.get("mode"),
			
 
				+            "midtone_ratio": dbg.get("midtone_ratio"),
			
 
				+            "wm_candidate_ratio": dbg.get("wm_candidate_ratio"),
			
 
				+            "geom_mask_ratio": dbg.get("geom_mask_ratio"),
			
 
				+            "geom_candidate_ratio": dbg.get("geom_candidate_ratio"),
			
 
				+            "wm_mask_ratio": dbg.get("wm_mask_ratio"),
			
 
				+            "white_pixel_ratio": dbg.get("white_pixel_ratio"),
			
 
				+            "hough_kept_lines": dbg.get("hough_kept_lines"),
			
 
				+            "hough_diag_candidates": dbg.get("hough_diag_candidates"),
			
 
				+            "hough_total_lines": dbg.get("hough_total_lines"),
			
 
				+            "dominant_angles": dbg.get("dominant_angles"),
			
 
				+            "whiten_gray_low": dbg.get("whiten_gray_low"),
			
 
				+        }
			
 
				+        meta_path.write_text(
			
 
				+            json.dumps(meta, ensure_ascii=False, indent=2), encoding="utf-8"
			
 
				+        )
			
 
				+        paths[f"meta_{method}"] = str(meta_path)
			
 
				+        if method == "masked_adaptive":
			
 
				+            layer_paths = save_watermark_mask_debug_layers(
			
 
				+                img_rgb, output_dir, stem, dbg, image_format="png"
			
 
				+            )
			
 
				+            paths.update(layer_paths)
			
 
				+
			
 
				+    h = max(results["threshold"].shape[0], results["masked_adaptive"].shape[0])
			
 
				+
			
 
				+    def _resize_rgb(arr: np.ndarray) -> np.ndarray:
			
 
				+        if arr.shape[0] == h:
			
 
				+            return arr
			
 
				+        scale = h / arr.shape[0]
			
 
				+        w = int(arr.shape[1] * scale)
			
 
				+        return cv2.resize(arr, (w, h))
			
 
				+
			
 
				+    triple = np.hstack(
			
 
				+        [_resize_rgb(img_rgb)]
			
 
				+        + [_resize_rgb(results[m]) for m in ("threshold", "masked_adaptive")]
			
 
				+    )
			
 
				+    compare_path = output_dir / f"{stem}_compare_orig_threshold_masked.png"
			
 
				+    cv2.imwrite(
			
 
				+        str(compare_path),
			
 
				+        cv2.cvtColor(triple, cv2.COLOR_RGB2BGR),
			
 
				+    )
			
 
				+    paths["compare_triple"] = str(compare_path)
			
 
				+    logger.info(f"✅ 方法对比已保存: {compare_path}")
			
 
				+    return paths
			
 
				+
			
 
				+
			
 
				 def main():
			
 
				     parser = argparse.ArgumentParser(
			
 
				-        description="银行流水水印去除工具",
			
 
				+        description="银行流水水印去除工具（参数默认来自场景 YAML，与 main_v2 Pipeline 一致）",
			
 
				         formatter_class=argparse.RawDescriptionHelpFormatter,
			
 
				         epilog=__doc__,
			
 
				     )
			
 
				     parser.add_argument("input", type=Path, help="输入 PDF / 图片文件或目录（批量模式）")
			
 
				-    parser.add_argument("-o", "--output", type=Path, default=None,
			
 
				-                        help="输出路径（单文件模式；默认在原文件名后加 _cleaned）")
			
 
				-    parser.add_argument("--threshold", type=int, default=160,
			
 
				-                        help="灰度阈值 (140-180)，默认 160")
			
 
				-    parser.add_argument("--morph-kernel", type=int, default=2,
			
 
				-                        help="形态学闭运算核大小，0 跳过，默认 2")
			
 
				-    parser.add_argument("--dpi", type=int, default=200,
			
 
				-                        help="渲染 DPI，默认 200")
			
 
				-    parser.add_argument("--batch", action="store_true",
			
 
				-                        help="批量模式：处理目录下所有 PDF 和图片")
			
 
				-    parser.add_argument("--preview", action="store_true",
			
 
				-                        help="预览模式：展示单页对比图（不保存）")
			
 
				-    parser.add_argument("--page", type=int, default=0,
			
 
				-                        help="预览页码（0-based），默认第 0 页")
			
 
				-    parser.add_argument("--page-range", type=str, default=None,
			
 
				-                        help="处理页面范围，如 '1-3,5,7-9'（从 1 开始，仅对 PDF 有效）")
			
 
				-    parser.add_argument("--force-image", action="store_true",
			
 
				-                        help="强制对文字型 PDF 使用图像化处理（会失去可搜索性，适用于 XObject 方法无法去除的内联水印）")
			
 
				+    parser.add_argument(
			
 
				+        "-c",
			
 
				+        "--config",
			
 
				+        type=Path,
			
 
				+        default=_DEFAULT_CONFIG_PATH,
			
 
				+        help=f"场景配置文件，读取 preprocessor.watermark_removal（默认: {_DEFAULT_CONFIG_PATH.name}）",
			
 
				+    )
			
 
				+    parser.add_argument(
			
 
				+        "-o",
			
 
				+        "--output",
			
 
				+        type=Path,
			
 
				+        default=None,
			
 
				+        help="输出路径（单文件模式；默认在原文件名后加 _cleaned）",
			
 
				+    )
			
 
				+    parser.add_argument("--batch", action="store_true", help="批量处理目录下所有 PDF 和图片")
			
 
				+    parser.add_argument("--preview", action="store_true", help="预览模式：展示单页对比图（不保存）")
			
 
				+    parser.add_argument("--page", type=int, default=0, help="预览页码（0-based）")
			
 
				+    parser.add_argument(
			
 
				+        "--page-range",
			
 
				+        type=str,
			
 
				+        default=None,
			
 
				+        help="PDF 页面范围，如 '1-3,5,7-9'（从 1 开始）",
			
 
				+    )
			
 
				+    parser.add_argument(
			
 
				+        "--force-image",
			
 
				+        action="store_true",
			
 
				+        help="文字型 PDF 强制走图像去水印（失去可搜索性）",
			
 
				+    )
			
 
				+    parser.add_argument(
			
 
				+        "--debug",
			
 
				+        action="store_true",
			
 
				+        help="保存调试图到 debug_comparison/watermark_removal/",
			
 
				+    )
			
 
				+    parser.add_argument(
			
 
				+        "--debug-dir",
			
 
				+        type=Path,
			
 
				+        default=None,
			
 
				+        help="调试图根目录（默认 -o 的父目录；格式见配置文件 debug_options.image_format）",
			
 
				+    )
			
 
				+    # 以下为覆盖配置文件的少量旋钮（未指定则完全使用 YAML）
			
 
				+    override = parser.add_argument_group("覆盖配置文件（可选）")
			
 
				+    override.add_argument(
			
 
				+        "--threshold",
			
 
				+        type=int,
			
 
				+        default=None,
			
 
				+        help="覆盖 watermark_removal.threshold（140-180）",
			
 
				+    )
			
 
				+    override.add_argument(
			
 
				+        "--morph-kernel",
			
 
				+        type=int,
			
 
				+        default=None,
			
 
				+        help="覆盖 watermark_removal.morph_close_kernel",
			
 
				+    )
			
 
				+    override.add_argument("--dpi", type=int, default=None, help="覆盖 input.dpi")
			
 
				+    override.add_argument("--no-contrast", action="store_true", help="关闭 contrast_enhancement")
			
 
				+    override.add_argument(
			
 
				+        "--text-black-target",
			
 
				+        type=int,
			
 
				+        default=None,
			
 
				+        help="覆盖 contrast_enhancement.text_black_target（text_restore）",
			
 
				+    )
			
 
				+    override.add_argument(
			
 
				+        "--method",
			
 
				+        type=str,
			
 
				+        default=None,
			
 
				+        choices=["threshold", "masked", "masked_adaptive"],
			
 
				+        help="覆盖 watermark_removal.method",
			
 
				+    )
			
 
				+    parser.add_argument(
			
 
				+        "--compare-methods",
			
 
				+        action="store_true",
			
 
				+        help="对比 threshold 与 masked_adaptive，输出三联图到 -o 目录",
			
 
				+    )
			
 
				 
			
 
				     args = parser.parse_args()
			
 
				 
			
 
				-    if args.preview:
			
 
				-        preview_page(
			
 
				-            args.input,
			
 
				-            page_idx=args.page,
			
 
				+    try:
			
 
				+        settings = resolve_watermark_settings(
			
 
				+            args.config,
			
 
				             threshold=args.threshold,
			
 
				+            morph_close_kernel=args.morph_kernel,
			
 
				             dpi=args.dpi,
			
 
				+            no_contrast=args.no_contrast,
			
 
				+            text_black_target=args.text_black_target,
			
 
				+            method=args.method,
			
 
				         )
			
 
				+    except FileNotFoundError as e:
			
 
				+        logger.error(str(e))
			
 
				+        sys.exit(1)
			
 
				+
			
 
				+    logger.info(
			
 
				+        f"📋 配置: {args.config} | method={settings.method} | "
			
 
				+        f"threshold={settings.threshold} | morph_kernel={settings.morph_close_kernel} | "
			
 
				+        f"dpi={settings.dpi} | contrast={settings.contrast_enhancement}"
			
 
				+    )
			
 
				+
			
 
				+    if args.compare_methods:
			
 
				+        input_path = args.input
			
 
				+        if not input_path.is_file():
			
 
				+            logger.error(f"文件不存在: {input_path}")
			
 
				+            sys.exit(1)
			
 
				+        out_dir = args.output or (
			
 
				+            input_path.parent / "debug_comparison" / "watermark_method_compare"
			
 
				+        )
			
 
				+        paths = compare_watermark_methods(input_path, out_dir, settings)
			
 
				+        for k, v in paths.items():
			
 
				+            logger.info(f"  {k}: {v}")
			
 
				+        return
			
 
				+
			
 
				+    if args.preview:
			
 
				+        preview_page(args.input, settings, page_idx=args.page)
			
 
				         return
			
 
				 
			
 
				     if args.batch:
			
@@ -345,7 +792,15 @@ def main():
 
				         for file in all_files:
			
 
				             out_file = out_dir / f"{file.stem}_cleaned{file.suffix}"
			
 
				             try:
			
 
				-                process_document(file, out_file, args.threshold, args.morph_kernel, args.dpi, args.page_range, args.force_image)
			
 
				+                _run_process_document(
			
 
				+                    file,
			
 
				+                    out_file,
			
 
				+                    settings,
			
 
				+                    page_range=args.page_range,
			
 
				+                    force_image=args.force_image,
			
 
				+                    save_debug=args.debug,
			
 
				+                    debug_output_dir=args.debug_dir or out_dir,
			
 
				+                )
			
 
				             except Exception as e:
			
 
				                 logger.error(f"❌ 处理失败 {file.name}: {e}")
			
 
				         logger.info(f"✅ 批量处理完成，共 {len(all_files)} 个文件 -> {out_dir}")
			
@@ -360,7 +815,15 @@ def main():
 
				         )
			
 
				         suffix = input_path.suffix.lower()
			
 
				         if suffix == ".pdf" or suffix in IMAGE_SUFFIXES:
			
 
				-            process_document(input_path, output_path, args.threshold, args.morph_kernel, args.dpi, args.page_range, args.force_image)
			
 
				+            _run_process_document(
			
 
				+                input_path,
			
 
				+                output_path,
			
 
				+                settings,
			
 
				+                page_range=args.page_range,
			
 
				+                force_image=args.force_image,
			
 
				+                save_debug=args.debug,
			
 
				+                debug_output_dir=args.debug_dir or output_path.parent,
			
 
				+            )
			
 
				         else:
			
 
				             logger.error(f"不支持的文件格式: {suffix}，支持 PDF 和 {IMAGE_SUFFIXES}")
			
 
				             sys.exit(1)
			
@@ -379,14 +842,15 @@ if __name__ == "__main__":
 
				             # 文字PDF测试
			
 
				             # "input": "/Users/zhch158/workspace/data/流水分析/提取自赤峰黄金2023年报.pdf",
			
 
				             # "input": "/Users/zhch158/workspace/data/测试文字PDF-水印.pdf",
			
 
				-            "input": "/Users/zhch158/workspace/data/非结构化文档识别统一平台（ocr_platform）-交易流水识别，财报识别.pdf",
			
 
				+            # "input": "/Users/zhch158/workspace/data/非结构化文档识别统一平台（ocr_platform）-交易流水识别，财报识别.pdf",
			
 
				+            "input": "/Users/zhch158/workspace/data/流水分析/彭_广东兴宁农村商业银行/bank_statement_yusys_local/彭_广东兴宁农村商业银行/彭_广东兴宁农村商业银行_page_002.png",
			
 
				             # "output": "./output/杨万益_福建农信",
			
 
				             # 页面范围（可选，支持 "1-5,7" 语法，仅对 PDF 有效）
			
 
				             # "page_range": "3",  # 仅处理第 1 页（对应 --page-range 参数）
			
 
				-            "dpi": 200,
			
 
				-            "threshold": 160,
			
 
				-            "morph_kernel": 0,  # 遮罩替换模式下不需要闭运算
			
 
				-            # "preview": True,
			
 
				+            "config": str(_DEFAULT_CONFIG_PATH),
			
 
				+            "preview": True,
			
 
				+            "debug": True,
			
 
				+            "compare-methods": True,
			
 
				         }
			
 
				 
			
 
				         # 构造参数（注意 input 是位置参数，morph_kernel 对应 --morph-kernel）