Эх сурвалжийг харах

add pdf compatibility for ppchatocrv3

liuhongen1234567 1 жил өмнө
parent
commit
6dd4108633

+ 3 - 2
paddlex/inference/pipelines/ppchatocrv3/ppchatocrv3.py

@@ -252,6 +252,7 @@ class PPChatOCRPipeline(_TableRecPipeline):
         for idx, (img_info, layout_pred) in enumerate(
             zip(img_info_list, self.layout_predictor(img_list))
         ):
+            page_id = idx
             single_img_res = {
                 "input_path": "",
                 "layout_result": DetResult({}),
@@ -373,8 +374,8 @@ class PPChatOCRPipeline(_TableRecPipeline):
             single_img_res["ocr_result"] = ocr_res
             single_img_res["table_ocr_result"] = all_table_ocr_res
             single_img_res["layout_parsing_result"] = structure_res
-
-            yield VisualResult(single_img_res)
+            single_img_res["layout_parsing_result"]["page_id"] = page_id + 1
+            yield VisualResult(single_img_res, page_id, inputs)
 
     def decode_visual_result(self, visual_result):
         ocr_text = []