7 ساعت پیش · 62bfdb256f
--- a/ocr_tools/lab/cell_preprocess_lab/aggregate_recommendation.json
+++ b/ocr_tools/lab/cell_preprocess_lab/aggregate_recommendation.json
@@ -0,0 +1,117 @@
 
				+{
			
 
				+  "min_hit_score": 0.9,
			
 
				+  "per_case": [
			
 
				+    {
			
 
				+      "report": "output/彭_广东兴宁农村商业银行/cell219_sweep/cell219_lines_AT存折取款/sweep_report.json",
			
 
				+      "input": "/Users/zhch158/workspace/data/流水分析/彭_广东兴宁农村商业银行/bank_statement_yusys_local/debug/table_recognition_wired/tablecell_ocr/彭_广东兴宁农村商业银行_page_002_0/cell219_lines_AT存折取款_raw.png",
			
 
				+      "target": "ATM存折取款",
			
 
				+      "qualified_count": 2,
			
 
				+      "top_tag": "threshold_t150_c0_ob_u128_det0.5",
			
 
				+      "top_score": 0.951827,
			
 
				+      "top_text": "ATM存折取款"
			
 
				+    },
			
 
				+    {
			
 
				+      "report": "output/彭_广东兴宁农村商业银行/cell071_sweep/cell071_empty_empty/sweep_report.json",
			
 
				+      "input": "/Users/zhch158/workspace/data/流水分析/彭_广东兴宁农村商业银行/bank_statement_yusys_local/debug/table_recognition_wired/tablecell_ocr/彭_广东兴宁农村商业银行_page_001_0/cell071_empty_empty_raw.png",
			
 
				+      "target": "20241224",
			
 
				+      "qualified_count": 16,
			
 
				+      "top_tag": "threshold_t150_cl_1.0_8_ob_u192_det0.5",
			
 
				+      "top_score": 0.995878,
			
 
				+      "top_text": "20241224"
			
 
				+    },
			
 
				+    {
			
 
				+      "report": "output/彭_广东兴宁农村商业银行/cell007_sweep/cell007_whole_longer_易型交类/sweep_report.json",
			
 
				+      "input": "/Users/zhch158/workspace/data/流水分析/彭_广东兴宁农村商业银行/bank_statement_yusys_local/debug/table_recognition_wired/tablecell_ocr/彭_广东兴宁农村商业银行_page_002_0/cell007_whole_longer_易型交类_raw.png",
			
 
				+      "target": "交易类型",
			
 
				+      "qualified_count": 35,
			
 
				+      "top_tag": "threshold_t150_cl_1.0_8_oa_u96_det0.5",
			
 
				+      "top_score": 0.999876,
			
 
				+      "top_text": "交易类型"
			
 
				+    },
			
 
				+    {
			
 
				+      "report": "output/彭_广东兴宁农村商业银行/cell007_p005_sweep/cell007_empty_empty/sweep_report.json",
			
 
				+      "input": "/Users/zhch158/workspace/data/流水分析/彭_广东兴宁农村商业银行/bank_statement_yusys_local/debug/table_recognition_wired/tablecell_ocr/彭_广东兴宁农村商业银行_page_005_0/cell007_empty_empty_raw.png",
			
 
				+      "target": "交易类型",
			
 
				+      "qualified_count": 43,
			
 
				+      "top_tag": "threshold_t150_cl_1.0_8_oa_u96_det0.5",
			
 
				+      "top_score": 0.999915,
			
 
				+      "top_text": "交易类型"
			
 
				+    },
			
 
				+    {
			
 
				+      "report": "output/钟_广东陆丰农村商业银行/cell077_sweep/cell077_empty_empty/sweep_report.json",
			
 
				+      "input": "/Users/zhch158/workspace/data/流水分析/钟_广东陆丰农村商业银行/bank_statement_yusys_local/debug/table_recognition_wired/tablecell_ocr/钟_广东陆丰农村商业银行_page_001_0/cell077_empty_empty_raw.png",
			
 
				+      "target": "专项资金",
			
 
				+      "qualified_count": 29,
			
 
				+      "top_tag": "threshold_t155_cl_1.0_8_ob_u96_det0.5",
			
 
				+      "top_score": 0.999815,
			
 
				+      "top_text": "专项资金"
			
 
				+    },
			
 
				+    {
			
 
				+      "report": "output/钟_广东陆丰农村商业银行/cell217_sweep/cell217_empty_empty/sweep_report.json",
			
 
				+      "input": "/Users/zhch158/workspace/data/流水分析/钟_广东陆丰农村商业银行/bank_statement_yusys_local/debug/table_recognition_wired/tablecell_ocr/钟_广东陆丰农村商业银行_page_001_0/cell217_empty_empty_raw.png",
			
 
				+      "target": "专项资金",
			
 
				+      "qualified_count": 53,
			
 
				+      "top_tag": "threshold_t155_cl_1.0_8_ob_u96_det0.5",
			
 
				+      "top_score": 0.999855,
			
 
				+      "top_text": "专项资金"
			
 
				+    },
			
 
				+    {
			
 
				+      "report": "output/钟_广东陆丰农村商业银行/cell017_sweep/cell017_empty_empty/sweep_report.json",
			
 
				+      "input": "/Users/zhch158/workspace/data/流水分析/钟_广东陆丰农村商业银行/bank_statement_yusys_local/debug/table_recognition_wired/tablecell_ocr/钟_广东陆丰农村商业银行_page_003_0/cell017_empty_empty_raw.png",
			
 
				+      "target": "专项资金",
			
 
				+      "qualified_count": 53,
			
 
				+      "top_tag": "threshold_t155_cl_1.0_8_ob_u96_det0.5",
			
 
				+      "top_score": 0.999575,
			
 
				+      "top_text": "专项资金"
			
 
				+    }
			
 
				+  ],
			
 
				+  "intersection_tags": [],
			
 
				+  "intersection_count": 0,
			
 
				+  "recommended_tag": "threshold_t150_cl_1.0_8_ob_u96_det0.5",
			
 
				+  "pick_reason": "无全局 tag 交集，按各 case 榜首做分字段多数票（跳过 baseline）",
			
 
				+  "majority_fields": {
			
 
				+    "method": "threshold",
			
 
				+    "threshold": 150,
			
 
				+    "contrast_cfg": {
			
 
				+      "method": "clahe",
			
 
				+      "clip_limit": 1.0,
			
 
				+      "tile_grid_size": 8
			
 
				+    },
			
 
				+    "contrast_order": "before_upscale",
			
 
				+    "upscale": 96,
			
 
				+    "det_db_box_thresh": 0.5
			
 
				+  },
			
 
				+  "pass1_cell_preprocess": {
			
 
				+    "watermark": {
			
 
				+      "enabled": true,
			
 
				+      "method": "threshold",
			
 
				+      "threshold": 150
			
 
				+    },
			
 
				+    "upscale_min_side": 96,
			
 
				+    "contrast": {
			
 
				+      "enabled": true,
			
 
				+      "method": "clahe",
			
 
				+      "clip_limit": 1.0,
			
 
				+      "tile_grid_size": 8
			
 
				+    },
			
 
				+    "enhance_retry": {
			
 
				+      "enabled": true,
			
 
				+      "contrast": {
			
 
				+        "enabled": true,
			
 
				+        "method": "clahe",
			
 
				+        "clip_limit": 1.0,
			
 
				+        "tile_grid_size": 4
			
 
				+      }
			
 
				+    }
			
 
				+  },
			
 
				+  "pass2_enhance_retry": {
			
 
				+    "enabled": true,
			
 
				+    "contrast": {
			
 
				+      "enabled": true,
			
 
				+      "method": "clahe",
			
 
				+      "clip_limit": 1.0,
			
 
				+      "tile_grid_size": 4
			
 
				+    }
			
 
				+  },
			
 
				+  "pass2_tag": "threshold_t150_cl_1.0_8_ob_u96_det0.5"
			
 
				+}
			
--- a/ocr_tools/lab/cell_preprocess_lab/cell_sweep.py
+++ b/ocr_tools/lab/cell_preprocess_lab/cell_sweep.py
@@ -24,6 +24,10 @@
 
				 
			
 
				     # 指定目标文字，自动统计 HIT 命中率
			
 
				     python cell_sweep.py /path/to/tablecell_ocr/ -o ./out --best-only -t "交易类型"
			
 
				+
			
 
				+    # 多 case 批量扫描 + 汇总 Pass1/Pass2 建议
			
 
				+    python cell_sweep.py --cases sweep_cases.json
			
 
				+    python cell_sweep.py --aggregate-only --cases sweep_cases.json
			
 
				 """
			
 
				 from __future__ import annotations
			
 
				 
			
@@ -392,6 +396,32 @@ def _match_hit(text: str, target: Optional[str]) -> Optional[str]:
 
				     return None
			
 
				 
			
 
				 
			
 
				+def _collect_qualified_hits(
			
 
				+    results: List[Dict[str, Any]],
			
 
				+    target: Optional[str],
			
 
				+    *,
			
 
				+    min_score: float = 0.9,
			
 
				+    ocr_mode: str = "det_rec",
			
 
				+) -> List[Dict[str, Any]]:
			
 
				+    """命中 target 且 score > min_score 的组合（按 tag 去重，保留最高分）。"""
			
 
				+    if not target:
			
 
				+        return []
			
 
				+    by_tag: Dict[str, Dict[str, Any]] = {}
			
 
				+    for r in results:
			
 
				+        if r.get("ocr_mode") != ocr_mode:
			
 
				+            continue
			
 
				+        if not _match_hit(r.get("text", "") or "", target):
			
 
				+            continue
			
 
				+        score = float(r.get("score") or 0)
			
 
				+        if score <= min_score:
			
 
				+            continue
			
 
				+        tag = str(r.get("tag") or "")
			
 
				+        prev = by_tag.get(tag)
			
 
				+        if prev is None or score > float(prev.get("score") or 0):
			
 
				+            by_tag[tag] = r
			
 
				+    return sorted(by_tag.values(), key=lambda x: -(float(x.get("score") or 0)))
			
 
				+
			
 
				+
			
 
				 def run_sweep(
			
 
				     input_path: Path,
			
 
				     out_dir: Path,
			
@@ -408,6 +438,7 @@ def run_sweep(
 
				     save_images: bool,
			
 
				     run_baseline: bool,
			
 
				     baseline_upscale: int,
			
 
				+    min_hit_score: float = 0.9,
			
 
				 ) -> Dict[str, Any]:
			
 
				     resolved = resolve_input_image(input_path, prefer_raw=prefer_raw)
			
 
				     raw = cv2.imread(str(resolved))
			
@@ -499,13 +530,34 @@ def run_sweep(
 
				                     row["match"] = m
			
 
				                     hits.append(row)
			
 
				 
			
 
				+    qualified_hits = _collect_qualified_hits(
			
 
				+        results, target, min_score=min_hit_score, ocr_mode="det_rec"
			
 
				+    )
			
 
				     report = {
			
 
				         "input": str(resolved),
			
 
				         "input_requested": str(input_path),
			
 
				         "output_dir": str(cell_out),
			
 
				         "target": target,
			
 
				+        "min_hit_score": min_hit_score,
			
 
				         "total_trials": total,
			
 
				         "hits": hits,
			
 
				+        "hits_target_score_above": [
			
 
				+            {
			
 
				+                "tag": r.get("tag"),
			
 
				+                "score": r.get("score"),
			
 
				+                "text": r.get("text"),
			
 
				+                "match": r.get("match"),
			
 
				+                "method": r.get("method"),
			
 
				+                "threshold": r.get("threshold"),
			
 
				+                "contrast_method": r.get("contrast_method"),
			
 
				+                "contrast_order": r.get("contrast_order"),
			
 
				+                "contrast_cfg": r.get("contrast_cfg"),
			
 
				+                "upscale": r.get("upscale"),
			
 
				+                "det_db_box_thresh": r.get("det_db_box_thresh"),
			
 
				+                "ocr_mode": r.get("ocr_mode"),
			
 
				+            }
			
 
				+            for r in qualified_hits
			
 
				+        ],
			
 
				         "all_results": results,
			
 
				     }
			
 
				     report_path = cell_out / "sweep_report.json"
			
@@ -513,28 +565,57 @@ def run_sweep(
 
				         json.dumps(report, ensure_ascii=False, indent=2), encoding="utf-8"
			
 
				     )
			
 
				 
			
 
				-    # ── 结论报告：按 OCR score 排序，分组对比 ──
			
 
				-    _print_conclusions(stem, results, target)
			
 
				+    _print_conclusions(stem, results, target, min_hit_score=min_hit_score)
			
 
				 
			
 
				     return report
			
 
				 
			
 
				 
			
 
				+def _sorted_summary_labels(values: set) -> List[str]:
			
 
				+    """将可能含 None 的集合转为可排序的展示标签（baseline 行字段常为 None）。"""
			
 
				+    labels: List[str] = []
			
 
				+    if None in values:
			
 
				+        labels.append("baseline")
			
 
				+    labels.extend(sorted(str(v) for v in values if v is not None))
			
 
				+    return labels
			
 
				+
			
 
				+
			
 
				+def _format_param_row(r: Dict[str, Any]) -> str:
			
 
				+    """单行参数组合描述。"""
			
 
				+    cfg = r.get("contrast_cfg") or {}
			
 
				+    cm = r.get("contrast_method", "none")
			
 
				+    extra = ""
			
 
				+    if cm == "clahe":
			
 
				+        extra = f" cl={cfg.get('clip_limit')} tile={cfg.get('tile_grid_size')}"
			
 
				+    elif cm == "text_restore":
			
 
				+        extra = f" t={cfg.get('text_black_target')} bg={cfg.get('background_threshold')}"
			
 
				+    elif cm == "gamma":
			
 
				+        extra = f" g={cfg.get('gamma')}"
			
 
				+    elif cm == "linear":
			
 
				+        extra = f" b={cfg.get('black_percentile')} w={cfg.get('white_percentile')}"
			
 
				+    order = "放大前" if r.get("contrast_order") == "before_upscale" else "放大后"
			
 
				+    return (
			
 
				+        f"wm={r.get('method')} thresh={r.get('threshold', 'd')} contrast={cm}{extra} "
			
 
				+        f"order={order} upscale={r.get('upscale')} det={r.get('det_db_box_thresh')}"
			
 
				+    )
			
 
				+
			
 
				+
			
 
				 def _print_conclusions(
			
 
				     stem: str,
			
 
				     results: List[Dict[str, Any]],
			
 
				     target: Optional[str],
			
 
				+    *,
			
 
				+    min_hit_score: float = 0.9,
			
 
				 ) -> None:
			
 
				-    """打印实验结论：按 OCR score 排序，分组展示最优组合。"""
			
 
				+    """先列出命中 target 且 score>阈值的全部参数组合，再输出结论。"""
			
 
				     if not results:
			
 
				         return
			
 
				 
			
 
				     print(f"\n{'='*70}")
			
 
				     print(f"  实验结论: {stem}")
			
 
				     if target:
			
 
				-        print(f"  目标文字: {target}")
			
 
				+        print(f"  目标文字: {target!r}  阈值: score > {min_hit_score} (det_rec)")
			
 
				     print(f"{'='*70}")
			
 
				 
			
 
				-    # 取 det_rec 模式的结果（优先用检测+识别完整结果）
			
 
				     dr_results = [r for r in results if r.get("ocr_mode") == "det_rec" and r.get("text")]
			
 
				     if not dr_results:
			
 
				         dr_results = [r for r in results if r.get("text")]
			
@@ -543,77 +624,88 @@ def _print_conclusions(
 
				         print("  (无有效 OCR 结果)")
			
 
				         return
			
 
				 
			
 
				-    # ── 1. 全局 Top-5 ──
			
 
				-    scored = sorted(dr_results, key=lambda r: -(r.get("score") or 0))
			
 
				-    print("\n  全局 OCR 得分 Top-5:")
			
 
				-    for i, r in enumerate(scored[:5], 1):
			
 
				-        print(f"    {i}. score={r.get('score', 0):.4f}  text={r.get('text', '')!r}")
			
 
				-        print(f"       tag={r.get('tag', '')}")
			
 
				-
			
 
				-    # ── 2. 按 contrast 方法分组最佳 ──
			
 
				-    print("\n  按 contrast 方法分组最优（score 最高）:")
			
 
				-    groups: Dict[str, List[Dict[str, Any]]] = {}
			
 
				-    for r in scored:
			
 
				-        cm = r.get("contrast_method", "?")
			
 
				-        groups.setdefault(cm, []).append(r)
			
 
				-
			
 
				-    for cm in sorted(groups.keys()):
			
 
				-        best = groups[cm][0]
			
 
				-        wm = best.get("method", "?")
			
 
				-        print(f"    [{cm}] 最佳: score={best.get('score', 0):.4f} "
			
 
				-              f"wm={wm} upscale={best.get('upscale')} "
			
 
				-              f"text={best.get('text', '')!r}")
			
 
				-
			
 
				-    # ── 3. 有 watermark 处理 vs 无 watermark 处理对比 ──
			
 
				-    print("\n  去水印开关对比（同 contrast 方法，最高 score）:")
			
 
				-    wm_groups: Dict[str, Dict[str, Any]] = {}
			
 
				-    for r in scored:
			
 
				-        cm = r.get("contrast_method", "?")
			
 
				-        wm = r.get("method", "?") if r.get("method") != "none" else "无去水印"
			
 
				-        key = f"{cm}|{wm}"
			
 
				-        cur_score = r.get("score") or 0
			
 
				-        prev_score = (wm_groups.get(key) or {}).get("score") or 0
			
 
				-        if key not in wm_groups or cur_score > prev_score:
			
 
				-            wm_groups[key] = r
			
 
				-
			
 
				-    for cm in sorted(set(r.get("contrast_method", "?") for r in scored)):
			
 
				-        wm_rows = [r for k, r in wm_groups.items() if k.startswith(cm + "|")]
			
 
				-        if wm_rows:
			
 
				-            best_row = max(wm_rows, key=lambda r: r.get("score") or 0)
			
 
				-            wm_label = "无去水印" if best_row.get("method") == "none" else best_row.get("method", "?")
			
 
				-            print(f"    [{cm}] 最优: wm={wm_label}  score={best_row.get('score', 0):.4f} "
			
 
				-                  f"text={best_row.get('text', '')!r}")
			
 
				-
			
 
				-    # ── 4. 放大顺序对比 ──
			
 
				-    print("\n  放大前/后对比（同方法，最高 score）:")
			
 
				-    order_data: Dict[str, Dict[str, Any]] = {}
			
 
				-    for r in scored:
			
 
				-        cm = r.get("contrast_method", "?")
			
 
				-        co = r.get("contrast_order", "?")
			
 
				-        key = f"{cm}|{co}"
			
 
				-        cur_score = r.get("score") or 0
			
 
				-        prev_score = (order_data.get(key) or {}).get("score") or 0
			
 
				-        if key not in order_data or cur_score > prev_score:
			
 
				-            order_data[key] = r
			
 
				-
			
 
				-    for cm in sorted(set(r.get("contrast_method", "?") for r in scored)):
			
 
				-        b_score = (order_data.get(f"{cm}|before_upscale") or {}).get("score") or 0
			
 
				-        a_score = (order_data.get(f"{cm}|after_upscale") or {}).get("score") or 0
			
 
				-        better = "放大前" if b_score > a_score else ("放大后" if a_score > b_score else "持平")
			
 
				-        if b_score or a_score:
			
 
				-            print(f"    [{cm}] 放大前={b_score:.4f}  放大后={a_score:.4f}  更优: {better}")
			
 
				-
			
 
				-    # ── 5. HIT 命中率统计 ──
			
 
				-    if target:
			
 
				-        hit_count = sum(1 for r in results if r.get("match"))
			
 
				-        hit_by_cm: Dict[str, int] = {}
			
 
				-        for r in results:
			
 
				-            if r.get("match"):
			
 
				-                cm = r.get("contrast_method", "?")
			
 
				-                hit_by_cm[cm] = hit_by_cm.get(cm, 0) + 1
			
 
				-        print(f"\n  HIT 命中率 (target={target}): {hit_count}/{len(results)}")
			
 
				-        for cm in sorted(hit_by_cm.keys()):
			
 
				-            print(f"    [{cm}] HIT={hit_by_cm[cm]}")
			
 
				+    scored = sorted(dr_results, key=lambda r: -(float(r.get("score") or 0)))
			
 
				+    qualified = _collect_qualified_hits(
			
 
				+        results, target, min_score=min_hit_score, ocr_mode="det_rec"
			
 
				+    )
			
 
				+
			
 
				+    # ── 1. 命中 target 且 score > 阈值 的全部参数组合 ──
			
 
				+    print(f"\n  【命中列表】共 {len(qualified)} 组 (target 匹配 + score > {min_hit_score}):")
			
 
				+    if not target:
			
 
				+        print("    (未指定 -t/--target，跳过命中列表)")
			
 
				+    elif not qualified:
			
 
				+        print("    (无满足条件的组合)")
			
 
				+        # 仍展示最接近的 HIT
			
 
				+        near = [
			
 
				+            r for r in scored
			
 
				+            if _match_hit(r.get("text", "") or "", target)
			
 
				+        ]
			
 
				+        if near:
			
 
				+            print(f"    提示: 有 {len(near)} 组命中 target 但 score <= {min_hit_score}，最高分:")
			
 
				+            for r in near[:5]:
			
 
				+                print(
			
 
				+                    f"      score={float(r.get('score', 0)):.4f}  text={r.get('text', '')!r}"
			
 
				+                )
			
 
				+                print(f"      tag={r.get('tag', '')}")
			
 
				+    else:
			
 
				+        for i, r in enumerate(qualified, 1):
			
 
				+            print(
			
 
				+                f"    {i}. score={float(r.get('score', 0)):.4f}  "
			
 
				+                f"match={r.get('match')}  text={r.get('text', '')!r}"
			
 
				+            )
			
 
				+            print(f"       tag={r.get('tag', '')}")
			
 
				+            print(f"       {_format_param_row(r)}")
			
 
				+
			
 
				+    # ── 2. 结论 ──
			
 
				+    print("\n  【结论】")
			
 
				+    if qualified:
			
 
				+        best = qualified[0]
			
 
				+        print(
			
 
				+            f"    推荐参数组合: {best.get('tag')} "
			
 
				+            f"(score={float(best.get('score', 0)):.4f}, text={best.get('text', '')!r})"
			
 
				+        )
			
 
				+        print(f"    {_format_param_row(best)}")
			
 
				+
			
 
				+        # 在合格集合内做简要对比
			
 
				+        cm_best: Dict[str, Dict[str, Any]] = {}
			
 
				+        for r in qualified:
			
 
				+            cm = r.get("contrast_method") or "baseline"
			
 
				+            if cm not in cm_best or float(r.get("score") or 0) > float(
			
 
				+                cm_best[cm].get("score") or 0
			
 
				+            ):
			
 
				+                cm_best[cm] = r
			
 
				+        print("    合格组合内各 contrast 最优:")
			
 
				+        for cm in sorted(cm_best.keys(), key=str):
			
 
				+            r = cm_best[cm]
			
 
				+            print(
			
 
				+                f"      [{cm}] score={float(r.get('score', 0)):.4f}  tag={r.get('tag', '')}"
			
 
				+            )
			
 
				+
			
 
				+        wm_set = {r.get("method") for r in qualified}
			
 
				+        order_set = {r.get("contrast_order") for r in qualified}
			
 
				+        upscale_vals = {r.get("upscale") for r in qualified}
			
 
				+        upscale_set = _sorted_summary_labels(
			
 
				+            {str(v) if v is not None else "baseline" for v in upscale_vals}
			
 
				+        )
			
 
				+        print(
			
 
				+            f"    合格组合涉及: 去水印={_sorted_summary_labels(wm_set)}  "
			
 
				+            f"放大顺序={_sorted_summary_labels(order_set)}  upscale={upscale_set}"
			
 
				+        )
			
 
				+        print(f"    共 {len(qualified)} 组参数可用于生产配置参考")
			
 
				+    else:
			
 
				+        top = scored[0] if scored else None
			
 
				+        if top and target and _match_hit(top.get("text", "") or "", target):
			
 
				+            print(
			
 
				+                f"    无 score>{min_hit_score} 的命中组合；最高分命中: "
			
 
				+                f"{top.get('tag')} score={float(top.get('score', 0)):.4f}"
			
 
				+            )
			
 
				+        elif top:
			
 
				+            print(
			
 
				+                f"    无命中 target 的组合；全局最高 det_rec: "
			
 
				+                f"{top.get('tag')} score={float(top.get('score', 0)):.4f} text={top.get('text', '')!r}"
			
 
				+            )
			
 
				+        else:
			
 
				+            print("    无可用结论")
			
 
				 
			
 
				     print(f"{'='*70}\n")
			
 
				 
			
@@ -659,6 +751,221 @@ def _parse_best_config(tag: str) -> Dict[str, Any]:
 
				     return cfg
			
 
				 
			
 
				 
			
 
				def _tag_to_cell_preprocess_yaml(tag: str) -> Dict[str, Any]:
				    """Convert a sweep tag into a ``second_pass_ocr.cell_preprocess`` fragment.

				    The tag is parsed with ``_parse_best_config``.  The returned dict holds the
				    Pass1 settings (``watermark``, ``upscale_min_side``, ``contrast``) plus an
				    ``enhance_retry`` entry for Pass2.  The Pass2 contrast is a copy of the
				    Pass1 contrast, with ``tile_grid_size`` forced to 4 when CLAHE is enabled.
				    """
				    parsed = _parse_best_config(tag)
				    contrast_src = parsed["contrast_cfg"]
				    contrast_method = contrast_src.get("method", "none")
				    wm_method = parsed["method"]
				    min_side = parsed["upscale"]

				    watermark: Dict[str, Any] = {
				        "enabled": wm_method != "none",
				        "method": wm_method,
				    }
				    if wm_method == "threshold" and parsed.get("threshold") is not None:
				        watermark["threshold"] = parsed["threshold"]

				    if contrast_method == "none":
				        pass1_contrast: Dict[str, Any] = {"enabled": False}
				    else:
				        pass1_contrast = {"enabled": True, "method": contrast_method}
				        # Carry over every remaining contrast parameter from the parsed tag.
				        pass1_contrast.update(
				            (key, value) for key, value in contrast_src.items() if key != "method"
				        )

				    # Pass2 starts from the Pass1 contrast; only the CLAHE tile size differs.
				    pass2_contrast: Dict[str, Any] = dict(pass1_contrast)
				    if pass2_contrast.get("enabled") and pass2_contrast.get("method") == "clahe":
				        pass2_contrast["tile_grid_size"] = 4

				    return {
				        "watermark": watermark,
				        "upscale_min_side": min_side,
				        "contrast": pass1_contrast,
				        "enhance_retry": {
				            "enabled": True,
				            "upscale_min_side": min_side,
				            "contrast": pass2_contrast,
				        },
				    }
			
 
				+
			
 
				+
			
 
				+def _qualified_from_report(report: Dict[str, Any], min_score: float) -> List[Dict[str, Any]]:
			
 
				+    qh = report.get("hits_target_score_above")
			
 
				+    if qh is not None:
			
 
				+        return list(qh)
			
 
				+    return _collect_qualified_hits(
			
 
				+        report.get("all_results") or [],
			
 
				+        report.get("target"),
			
 
				+        min_score=min_score,
			
 
				+        ocr_mode="det_rec",
			
 
				+    )
			
 
				+
			
 
				+
			
 
				+def _majority_key(items: Sequence[Any]) -> Any:
			
 
				+    from collections import Counter
			
 
				+
			
 
				+    if not items:
			
 
				+        return None
			
 
				+    return Counter(items).most_common(1)[0][0]
			
 
				+
			
 
				+
			
 
				def aggregate_sweep_reports(
				    report_paths: Sequence[Path],
				    *,
				    min_hit_score: float = 0.9,
				) -> Dict[str, Any]:
				    """Aggregate several ``sweep_report.json`` files into a Pass1/Pass2 recommendation.

				    Selection strategy:
				      1. If some tags are qualified in every loaded report, recommend the one
				         with the highest score (ties broken by tag name).
				      2. Otherwise take each case's top tag, skip tags starting with
				         ``baseline`` or failing to parse, and build a synthetic tag from a
				         per-field majority vote.
				      3. If nothing could be parsed, fall back to a majority vote over the raw
				         top tags (baseline included).

				    Args:
				        report_paths: Paths of the reports to read.  Paths that are not files
				            are recorded in ``per_case`` with ``"error": "missing"`` and
				            otherwise ignored.
				        min_hit_score: Score threshold passed to ``_qualified_from_report``.

				    Returns:
				        A dict with the keys ``min_hit_score``, ``per_case``,
				        ``intersection_tags`` (at most 20), ``intersection_count``,
				        ``recommended_tag``, ``pick_reason``, ``majority_fields``,
				        ``pass1_cell_preprocess``, ``pass2_enhance_retry`` and ``pass2_tag``.
				    """
				    import re

				    per_case: List[Dict[str, Any]] = []
				    all_qualified_tags: List[set] = []
				    # Best score seen for each tag across all loaded reports.  Collected while
				    # loading so that sorting never has to re-read the report files.
				    best_score_by_tag: Dict[str, float] = {}

				    for rp in report_paths:
				        if not rp.is_file():
				            per_case.append({"report": str(rp), "error": "missing"})
				            continue
				        report = json.loads(rp.read_text(encoding="utf-8"))
				        qualified = _qualified_from_report(report, min_hit_score)
				        case_tags: set = set()
				        for r in qualified:
				            if not r.get("tag"):
				                continue
				            tag = str(r["tag"])
				            case_tags.add(tag)
				            score = float(r.get("score") or 0)
				            if score > best_score_by_tag.get(tag, float("-inf")):
				                best_score_by_tag[tag] = score
				        all_qualified_tags.append(case_tags)
				        top = qualified[0] if qualified else None
				        per_case.append(
				            {
				                "report": str(rp),
				                "input": report.get("input"),
				                "target": report.get("target"),
				                "qualified_count": len(qualified),
				                "top_tag": top.get("tag") if top else None,
				                "top_score": top.get("score") if top else None,
				                "top_text": top.get("text") if top else None,
				            }
				        )

				    ok_cases = [c for c in per_case if c.get("top_tag")]
				    intersection: set = set.intersection(*all_qualified_tags) if all_qualified_tags else set()
				    # Highest score first; the tag name makes the order deterministic on ties.
				    intersection_sorted = sorted(
				        intersection, key=lambda t: (-best_score_by_tag[t], t)
				    )

				    pick_tag: Optional[str] = None
				    pick_reason = ""
				    majority_fields: Dict[str, Any] = {}
				    if intersection_sorted:
				        pick_tag = intersection_sorted[0]
				        # Count only the reports that were actually loaded; missing ones do not
				        # take part in the intersection.
				        pick_reason = f"全部 {len(all_qualified_tags)} 个 case 的合格集合交集，取最高分 tag"
				    elif ok_cases:
				        parsed: List[Dict[str, Any]] = []
				        for c in ok_cases:
				            tag = c["top_tag"]
				            if tag and str(tag).startswith("baseline"):
				                continue
				            try:
				                parsed.append(_parse_best_config(str(tag)))
				            except ValueError:
				                continue
				        if parsed:
				            pick_reason = "无全局 tag 交集，按各 case 榜首做分字段多数票（跳过 baseline）"
				            method = _majority_key([p["method"] for p in parsed])
				            thresh = _majority_key([p.get("threshold") for p in parsed])
				            upscale = _majority_key([p["upscale"] for p in parsed])
				            cm = _majority_key([p["contrast_cfg"].get("method") for p in parsed])
				            c_cfgs = [p["contrast_cfg"] for p in parsed if p["contrast_cfg"].get("method") == cm]
				            contrast_cfg: Dict[str, Any] = {"method": cm or "none"}
				            if cm == "clahe" and c_cfgs:
				                contrast_cfg["clip_limit"] = _majority_key([c.get("clip_limit") for c in c_cfgs])
				                contrast_cfg["tile_grid_size"] = _majority_key(
				                    [c.get("tile_grid_size") for c in c_cfgs]
				                )
				            synthetic = {
				                "method": method,
				                "threshold": thresh,
				                "contrast_cfg": contrast_cfg,
				                "contrast_order": _majority_key([p["contrast_order"] for p in parsed]),
				                "upscale": upscale,
				                "det_db_box_thresh": _majority_key([p["det_db_box_thresh"] for p in parsed]),
				            }
				            # Rebuild a tag from the voted fields.  NOTE(review): this combination
				            # may never have been run as-is in any single case.
				            c_tag = _contrast_tag(contrast_cfg)
				            o_tag = "b" if synthetic["contrast_order"] == "before_upscale" else "a"
				            t_s = str(synthetic["threshold"] or "d")
				            pick_tag = (
				                f"{method}_t{t_s}_{c_tag}_o{o_tag}_u{synthetic['upscale']}"
				                f"_det{synthetic['det_db_box_thresh']}"
				            )
				            majority_fields = synthetic
				        else:
				            pick_tag = _majority_key([c["top_tag"] for c in ok_cases])
				            pick_reason = "无全局交集，按各 case 榜首 tag 多数票（含 baseline）"

				    def _to_cell_preprocess(tag: Optional[str]) -> Optional[Dict[str, Any]]:
				        # The fallback branch can pick a baseline tag.  Tag parsing is treated
				        # as raising ValueError for unparsable tags (see the try/except above),
				        # so report "no config" instead of aborting the whole aggregation.
				        if not tag:
				            return None
				        try:
				            return _tag_to_cell_preprocess_yaml(tag)
				        except ValueError:
				            return None

				    pass1_cpp = _to_cell_preprocess(pick_tag)

				    # Pass2 prefers an intersection tag whose CLAHE tile size is 4.
				    pass2_tile_pattern = re.compile(r"cl_[\d.]+_4_")
				    pass2_candidates = [t for t in intersection_sorted if pass2_tile_pattern.search(t)]
				    pass2_tag = pass2_candidates[0] if pass2_candidates else pick_tag
				    pass2_cpp = _to_cell_preprocess(pass2_tag)

				    return {
				        "min_hit_score": min_hit_score,
				        "per_case": per_case,
				        "intersection_tags": intersection_sorted[:20],
				        "intersection_count": len(intersection),
				        "recommended_tag": pick_tag,
				        "pick_reason": pick_reason,
				        "majority_fields": majority_fields,
				        "pass1_cell_preprocess": pass1_cpp,
				        "pass2_enhance_retry": pass2_cpp.get("enhance_retry") if pass2_cpp else None,
				        "pass2_tag": pass2_tag,
				    }
			
 
				+
			
 
				+
			
 
				+_CASE_META_KEYS = frozenset({"name", "note", "description"})
			
 
				+
			
 
				+
			
 
				+def _config_to_argv(cfg: Dict[str, Any]) -> List[str]:
			
 
				+    argv = [str(cfg["input"])]
			
 
				+    for key, value in cfg.items():
			
 
				+        if key == "input" or key in _CASE_META_KEYS:
			
 
				+            continue
			
 
				+        flag = f"--{key.replace('_', '-')}"
			
 
				+        if isinstance(value, bool) and value:
			
 
				+            argv.append(flag)
			
 
				+        elif not isinstance(value, bool):
			
 
				+            argv.extend([flag, str(value)])
			
 
				+    return argv
			
 
				+
			
 
				+
			
 
				+def _load_cases_json(path: Path) -> List[Dict[str, Any]]:
			
 
				+    data = json.loads(path.read_text(encoding="utf-8"))
			
 
				+    shared = data.get("shared") or {}
			
 
				+    cases = data.get("cases") or []
			
 
				+    out: List[Dict[str, Any]] = []
			
 
				+    for c in cases:
			
 
				+        merged = {**shared, **c}
			
 
				+        out.append(merged)
			
 
				+    return out
			
 
				+
			
 
				+
			
 
				+def _find_sweep_report(case_output: Path, input_path: Path) -> Optional[Path]:
			
 
				+    stem = Path(str(input_path)).stem.removesuffix("_raw")
			
 
				+    direct = case_output / stem / "sweep_report.json"
			
 
				+    if direct.is_file():
			
 
				+        return direct
			
 
				+    hits = sorted(case_output.rglob("sweep_report.json"))
			
 
				+    return hits[0] if hits else None
			
 
				+
			
 
				+
			
 
				def run_cases_batch(cases: Sequence[Dict[str, Any]]) -> List[Dict[str, Any]]:
				    """Run every case in order, each with its own output directory.

				    For each case a banner is printed, ``main`` is invoked with the argv built
				    from the case config, and the resulting report is looked up.  Returns one
				    summary dict per case with the keys ``name``, ``output`` and ``report``
				    (``None`` when no report was found).
				    """
				    total = len(cases)
				    summaries: List[Dict[str, Any]] = []
				    for index, case in enumerate(cases, 1):
				        label = case.get("name") or case.get("input")
				        print(f"\n{'#'*70}\n  批量 case {index}/{total}: {label}\n{'#'*70}")
				        main(_config_to_argv(case))
				        out_dir = Path(case["output"])
				        report_path = _find_sweep_report(out_dir, Path(case["input"]))
				        summaries.append(
				            {
				                "name": label,
				                "output": str(out_dir),
				                "report": str(report_path) if report_path else None,
				            }
				        )
				    return summaries
			
 
				+
			
 
				+
			
 
				 def run_best_config(
			
 
				     input_path: Path,
			
 
				     out_dir: Path,
			
@@ -723,6 +1030,8 @@ def _build_arg_parser() -> argparse.ArgumentParser:
 
				     p.add_argument(
			
 
				         "input",
			
 
				         type=Path,
			
 
				+        nargs="?",
			
 
				+        default=None,
			
 
				         help="单元格裁剪图路径，或 tablecell_ocr 目录（批量扫描）",
			
 
				     )
			
 
				     p.add_argument(
			
@@ -739,6 +1048,12 @@ def _build_arg_parser() -> argparse.ArgumentParser:
 
				         help="期望 OCR 文本；用于标记 HIT（子串匹配）。省略则任意非空为 HIT",
			
 
				     )
			
 
				     p.add_argument(
			
 
				+        "--min-hit-score",
			
 
				+        type=float,
			
 
				+        default=0.9,
			
 
				+        help="结论中「命中列表」的最低 score 阈值（默认 0.9，仅 det_rec）",
			
 
				+    )
			
 
				+    p.add_argument(
			
 
				         "--model-dir",
			
 
				         type=Path,
			
 
				         default=None,
			
@@ -806,11 +1121,80 @@ def _build_arg_parser() -> argparse.ArgumentParser:
 
				         default="threshold_t150_cl_1.0_8_ob_u128_det0.5",
			
 
				         help="最优参数 tag，如 threshold_t150_cl_1.0_8_ob_u128_det0.5",
			
 
				     )
			
 
				+    p.add_argument(
			
 
				+        "--cases",
			
 
				+        type=Path,
			
 
				+        default=None,
			
 
				+        help="批量 case JSON（见 sweep_cases.json），顺序跑网格扫描",
			
 
				+    )
			
 
				+    p.add_argument(
			
 
				+        "--aggregate-only",
			
 
				+        action="store_true",
			
 
				+        help="不扫描，仅根据已有 sweep_report.json 汇总 Pass1/Pass2 建议",
			
 
				+    )
			
 
				+    p.add_argument(
			
 
				+        "--aggregate-out",
			
 
				+        type=Path,
			
 
				+        default=None,
			
 
				+        help="汇总输出路径（默认 <cases 父目录>/aggregate_recommendation.json）",
			
 
				+    )
			
 
				     return p
			
 
				 
			
 
				 
			
 
				 def main(argv: Optional[Sequence[str]] = None) -> None:
			
 
				     args = _build_arg_parser().parse_args(argv)
			
 
				+
			
 
				+    if args.aggregate_only:
			
 
				+        if not args.cases or not args.cases.is_file():
			
 
				+            raise SystemExit("--aggregate-only 需要 --cases <sweep_cases.json>")
			
 
				+        cases = _load_cases_json(args.cases)
			
 
				+        report_paths: List[Path] = []
			
 
				+        for case in cases:
			
 
				+            out = Path(case["output"])
			
 
				+            rp = _find_sweep_report(out, Path(case["input"]))
			
 
				+            if rp:
			
 
				+                report_paths.append(rp)
			
 
				+            else:
			
 
				+                print(f"  跳过（无报告）: {case.get('name') or case['input']}")
			
 
				+        agg = aggregate_sweep_reports(
			
 
				+            report_paths, min_hit_score=args.min_hit_score
			
 
				+        )
			
 
				+        agg_out = args.aggregate_out or args.cases.parent / "aggregate_recommendation.json"
			
 
				+        agg_out.parent.mkdir(parents=True, exist_ok=True)
			
 
				+        agg_out.write_text(json.dumps(agg, ensure_ascii=False, indent=2), encoding="utf-8")
			
 
				+        print(f"\n汇总完成 -> {agg_out}")
			
 
				+        print(f"  推荐 tag: {agg.get('recommended_tag')}")
			
 
				+        print(f"  交集合格 tag 数: {agg.get('intersection_count')}")
			
 
				+        if agg.get("pass1_cell_preprocess"):
			
 
				+            print("\n  Pass1 cell_preprocess 片段:")
			
 
				+            print(json.dumps(agg["pass1_cell_preprocess"], ensure_ascii=False, indent=2))
			
 
				+        if agg.get("pass2_enhance_retry"):
			
 
				+            print("\n  Pass2 enhance_retry 片段:")
			
 
				+            print(json.dumps(agg["pass2_enhance_retry"], ensure_ascii=False, indent=2))
			
 
				+        return
			
 
				+
			
 
				+    if args.cases and args.cases.is_file():
			
 
				+        if args.input is not None:
			
 
				+            print("  提示: 已指定 --cases，忽略 positional input")
			
 
				+        cases = _load_cases_json(args.cases)
			
 
				+        run_cases_batch(cases)
			
 
				+        report_paths = []
			
 
				+        for case in cases:
			
 
				+            rp = _find_sweep_report(Path(case["output"]), Path(case["input"]))
			
 
				+            if rp:
			
 
				+                report_paths.append(rp)
			
 
				+        if report_paths:
			
 
				+            agg = aggregate_sweep_reports(
			
 
				+                report_paths, min_hit_score=args.min_hit_score
			
 
				+            )
			
 
				+            agg_out = args.aggregate_out or args.cases.parent / "aggregate_recommendation.json"
			
 
				+            agg_out.write_text(json.dumps(agg, ensure_ascii=False, indent=2), encoding="utf-8")
			
 
				+            print(f"\n批量汇总 -> {agg_out}")
			
 
				+            print(f"  推荐 tag: {agg.get('recommended_tag')} ({agg.get('pick_reason')})")
			
 
				+        return
			
 
				+
			
 
				+    if args.input is None:
			
 
				+        raise SystemExit("需要 input 路径，或使用 --cases / --aggregate-only")
			
 
				     inputs = collect_inputs(args.input, prefer_raw=not args.no_prefer_raw)
			
 
				     if not inputs:
			
 
				         raise SystemExit("未找到可扫描的图像")
			
@@ -878,7 +1262,7 @@ def main(argv: Optional[Sequence[str]] = None) -> None:
 
				 
			
 
				     if args.quick:
			
 
				         thresholds = [150, 155]
			
 
				-        upscales = [128, 192]
			
 
				+        upscales = [96, 128, 192]
			
 
				         det_threshs = [0.5]
			
 
				     else:
			
 
				         thresholds = _parse_csv_ints(args.thresholds)
			
@@ -911,11 +1295,16 @@ def main(argv: Optional[Sequence[str]] = None) -> None:
 
				             save_images=not args.no_save_images,
			
 
				             run_baseline=not args.no_baseline,
			
 
				             baseline_upscale=args.baseline_upscale,
			
 
				+            min_hit_score=args.min_hit_score,
			
 
				         )
			
 
				+        qh = report.get("hits_target_score_above") or []
			
 
				         summary.append(
			
 
				             {
			
 
				                 "input": report["input"],
			
 
				                 "hits": len(report["hits"]),
			
 
				+                "hits_target_score_above": len(qh),
			
 
				+                "top_qualified_tag": qh[0]["tag"] if qh else None,
			
 
				+                "top_qualified_score": qh[0]["score"] if qh else None,
			
 
				                 "report": str(Path(report["output_dir"]) / "sweep_report.json"),
			
 
				             }
			
 
				         )
			
@@ -926,46 +1315,20 @@ def main(argv: Optional[Sequence[str]] = None) -> None:
 
				     )
			
 
				     print(f"\n全部完成，索引: {index_path}")
			
 
				     for s in summary:
			
 
				-        print(f"  {s['input']}: {s['hits']} hits -> {s['report']}")
			
 
				+        qn = s.get("hits_target_score_above", 0)
			
 
				+        top = s.get("top_qualified_tag")
			
 
				+        print(
			
 
				+            f"  {s['input']}: hits={s['hits']}  "
			
 
				+            f"qualified(score>{args.min_hit_score})={qn}"
			
 
				+            + (f"  top={top}" if top else "")
			
 
				+            + f" -> {s['report']}"
			
 
				+        )
			
 
				 
			
 
				 
			
 
				 if __name__ == "__main__":
			
 
				     if len(sys.argv) == 1:
			
 
				-        print("ℹ️  未提供命令行参数，使用默认配置运行...")
			
 
				-        default_config = {
			
 
				-            # "input": "/Users/zhch158/workspace/data/流水分析/彭_广东兴宁农村商业银行/bank_statement_yusys_local/debug/table_recognition_wired/tablecell_ocr/彭_广东兴宁农村商业银行_page_002_0/cell219_empty_empty_raw.png",
			
 
				-            # "output": "./output/彭_广东兴宁农村商业银行/cell219_sweep",
			
 
				-            # "target": "ATM存折取款",
			
 
				-
			
 
				-            # "input": "/Users/zhch158/workspace/data/流水分析/彭_广东兴宁农村商业银行/bank_statement_yusys_local/debug/table_recognition_wired/tablecell_ocr/彭_广东兴宁农村商业银行_page_002_0/cell007_whole_longer_易型交类_raw.png",
			
 
				-            # "output": "./output/彭_广东兴宁农村商业银行/cell007_sweep",
			
 
				-            # "target": "交易类型",
			
 
				-            # "quick": True,
			
 
				-
			
 
				-            # "input": "/Users/zhch158/workspace/data/流水分析/钟_广东陆丰农村商业银行/bank_statement_yusys_local/debug/table_recognition_wired/tablecell_ocr/钟_广东陆丰农村商业银行_page_001_0/cell217_empty_empty_raw.png",
			
 
				-            # "output": "./output/钟_广东陆丰农村商业银行/cell217_sweep",
			
 
				-            # "target": "专项资金",
			
 
				-            # "quick": True,
			
 
				-
			
 
				-            # "input": "/Users/zhch158/workspace/data/流水分析/彭_广东兴宁农村商业银行/bank_statement_yusys_local/debug/table_recognition_wired/tablecell_ocr/彭_广东兴宁农村商业银行_page_002_0",
			
 
				-            # "output": "./output/彭_广东兴宁农村商业银行",
			
 
				-            # "best-config": "threshold_t150_cl_1.0_8_ob_u128_det0.5",
			
 
				-            # "best-only": True,
			
 
				-
			
 
				-            "input": "/Users/zhch158/workspace/data/流水分析/钟_广东陆丰农村商业银行/bank_statement_yusys_local/debug/table_recognition_wired/tablecell_ocr/钟_广东陆丰农村商业银行_page_001_0",
			
 
				-            "output": "./output/钟_广东陆丰农村商业银行",
			
 
				-            # "best-config": "threshold_t150_cl_1.0_8_ob_u128_det0.5",
			
 
				-            "best-config": "threshold_t150_cl_1.0_4_ob_u128_det0.5",
			
 
				-            "best-only": True,
			
 
				-        }
			
 
				-        sys.argv = [sys.argv[0], default_config["input"]]
			
 
				-        for key, value in default_config.items():
			
 
				-            if key == "input":
			
 
				-                continue
			
 
				-            flag = f"--{key.replace('_', '-')}"
			
 
				-            if isinstance(value, bool) and value:
			
 
				-                sys.argv.append(flag)
			
 
				-            elif not isinstance(value, bool):
			
 
				-                sys.argv.extend([flag, str(value)])
			
 
				+        cases_path = Path(__file__).resolve().parent / "sweep_cases.json"
			
 
				+        print(f"ℹ️  未提供命令行参数，使用批量 cases: {cases_path.name}")
			
 
				+        sys.argv = [sys.argv[0], "--cases", str(cases_path)]
			
 
				 
			
 
				     sys.exit(main())
			
--- a/ocr_tools/lab/cell_preprocess_lab/sweep_cases.json
+++ b/ocr_tools/lab/cell_preprocess_lab/sweep_cases.json
@@ -0,0 +1,50 @@
 
				+{
			
 
				+  "shared": {
			
 
				+    "quick": true,
			
 
				+    "min-hit-score": 0.9
			
 
				+  },
			
 
				+  "cases": [
			
 
				+    {
			
 
				+      "name": "彭_cell219",
			
 
				+      "input": "./input/cell219_lines_AT存折取款_raw.png",
			
 
				+      "output": "./output/彭_广东兴宁农村商业银行/cell219_sweep",
			
 
				+      "target": "ATM存折取款"
			
 
				+    },
			
 
				+    {
			
 
				+      "name": "彭_cell071",
			
 
				+      "input": "./input/cell071_empty_empty_raw.png",
			
 
				+      "output": "./output/彭_广东兴宁农村商业银行/cell071_sweep",
			
 
				+      "target": "20241224"
			
 
				+    },
			
 
				+    {
			
 
				+      "name": "彭_cell007_p002_易型交类",
			
 
				+      "input": "./input/cell007_whole_longer_易型交类_raw.png",
			
 
				+      "output": "./output/彭_广东兴宁农村商业银行/cell007_sweep",
			
 
				+      "target": "交易类型"
			
 
				+    },
			
 
				+    {
			
 
				+      "name": "彭_cell007_p005",
			
 
				+      "input": "./input/cell007_empty_empty_raw.png",
			
 
				+      "output": "./output/彭_广东兴宁农村商业银行/cell007_p005_sweep",
			
 
				+      "target": "交易类型"
			
 
				+    },
			
 
				+    {
			
 
				+      "name": "钟_cell077",
			
 
				+      "input": "./input/cell077_empty_empty_raw.png",
			
 
				+      "output": "./output/钟_广东陆丰农村商业银行/cell077_sweep",
			
 
				+      "target": "专项资金"
			
 
				+    },
			
 
				+    {
			
 
				+      "name": "钟_cell217",
			
 
				+      "input": "./input/cell217_empty_empty_raw.png",
			
 
				+      "output": "./output/钟_广东陆丰农村商业银行/cell217_sweep",
			
 
				+      "target": "专项资金"
			
 
				+    },
			
 
				+    {
			
 
				+      "name": "钟_cell017",
			
 
				+      "input": "./input/cell017_empty_empty_raw.png",
			
 
				+      "output": "./output/钟_广东陆丰农村商业银行/cell017_sweep",
			
 
				+      "target": "专项资金"
			
 
				+    }
			
 
				+  ]
			
 
				+}