Browse Source

fix: refine confidence handling in predictions and update hash utility for image processing

myhloli 3 tháng trước
mục cha
commit
d58a440ffc

+ 2 - 3
mineru/backend/pipeline/model_json_to_middle_json.py

@@ -17,19 +17,18 @@ from mineru.utils.llm_aided import llm_aided_title
 from mineru.utils.model_utils import clean_memory
 from mineru.backend.pipeline.pipeline_magic_model import MagicModel
 from mineru.utils.ocr_utils import OcrConfidence
-from mineru.utils.pdf_reader import image_to_b64str
 from mineru.utils.span_block_fix import fill_spans_in_blocks, fix_discarded_block, fix_block_spans
 from mineru.utils.span_pre_proc import remove_outside_spans, remove_overlaps_low_confidence_spans, \
     remove_overlaps_min_spans, txt_spans_extract
 from mineru.version import __version__
-from mineru.utils.hash_utils import str_md5
+from mineru.utils.hash_utils import bytes_md5
 
 
 def page_model_info_to_page_info(page_model_info, image_dict, page, image_writer, page_index, ocr_enable=False, formula_enabled=True):
     scale = image_dict["scale"]
     page_pil_img = image_dict["img_pil"]
     # page_img_md5 = str_md5(image_dict["img_base64"])
-    page_img_md5 = str_md5(image_to_b64str(page_pil_img))
+    page_img_md5 = bytes_md5(page_pil_img.tobytes())
     page_w, page_h = map(int, page.get_size())
     magic_model = MagicModel(page_model_info, scale)
 

+ 2 - 0
mineru/model/layout/doclayout_yolo.py

@@ -62,6 +62,8 @@ class DocLayoutYOLOModel:
                 batch = images[idx: idx + batch_size]
                 if batch_size == 1:
                     conf = 0.9 * self.conf
+                else:
+                    conf = self.conf
                 predictions = self.model.predict(
                     batch,
                     imgsz=self.imgsz,