| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143 |
- # Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- from typing import Any, Dict, List
- from .....utils.deps import function_requires_deps, is_dep_available
- from ...infra import utils as serving_utils
- from ...infra.config import AppConfig
- from ...infra.models import AIStudioResultResponse
- from ...schemas.pp_structurev3 import INFER_ENDPOINT, InferRequest, InferResult
- from .._app import create_app, primary_operation
- from ._common import common
- from ._common import ocr as ocr_common
- if is_dep_available("fastapi"):
- from fastapi import FastAPI
@function_requires_deps("fastapi")
def create_pipeline_app(pipeline: Any, app_config: AppConfig) -> "FastAPI":
    """Assemble the serving app that exposes the PP-StructureV3 pipeline.

    The app and its context come from ``create_app`` (called with
    ``app_aiohttp_session=True``); the shared OCR helpers then get a chance
    to update the context, and a single primary operation named ``"infer"``
    is registered at ``INFER_ENDPOINT``.

    Args:
        pipeline: Pipeline object forwarded to ``create_app``. The handler
            reaches it through ``ctx.pipeline`` and awaits its ``infer``.
        app_config: Serving configuration forwarded to ``create_app``.

    Returns:
        The app object produced by ``create_app``.
    """
    app, ctx = create_app(
        pipeline=pipeline, app_config=app_config, app_aiohttp_session=True
    )
    ocr_common.update_app_context(ctx)

    async def _store_images(named_images: Any, log_id: Any, template: str) -> Any:
        # Single entry point for both image exports below. The ctx.extra
        # settings are looked up on every call, exactly when an export is
        # actually requested.
        return await serving_utils.call_async(
            common.postprocess_images,
            named_images,
            log_id,
            filename_template=template,
            file_storage=ctx.extra["file_storage"],
            return_urls=ctx.extra["return_img_urls"],
            max_img_size=ctx.extra["max_output_img_size"],
        )

    @primary_operation(app, INFER_ENDPOINT, "infer")
    async def _infer(
        request: InferRequest,
    ) -> AIStudioResultResponse[InferResult]:
        """Run the pipeline on the request's images and package the results.

        Each (input image, pipeline result) pair yields one entry in
        ``layoutParsingResults`` holding the pruned JSON result, the
        markdown payload and, when ``ctx.config.visualize`` is truthy, the
        post-processed input and output images.
        """
        runner = ctx.pipeline
        log_id = serving_utils.generate_log_id()
        images, data_info = await ocr_common.get_images(request, ctx)

        # camelCase request fields mapped onto the pipeline's snake_case
        # keyword arguments.
        infer_options = {
            "use_doc_orientation_classify": request.useDocOrientationClassify,
            "use_doc_unwarping": request.useDocUnwarping,
            "use_textline_orientation": request.useTextlineOrientation,
            "use_seal_recognition": request.useSealRecognition,
            "use_table_recognition": request.useTableRecognition,
            "use_formula_recognition": request.useFormulaRecognition,
            "use_chart_recognition": request.useChartRecognition,
            "use_region_detection": request.useRegionDetection,
            "layout_threshold": request.layoutThreshold,
            "layout_nms": request.layoutNms,
            "layout_unclip_ratio": request.layoutUnclipRatio,
            "layout_merge_bboxes_mode": request.layoutMergeBboxesMode,
            "text_det_limit_side_len": request.textDetLimitSideLen,
            "text_det_limit_type": request.textDetLimitType,
            "text_det_thresh": request.textDetThresh,
            "text_det_box_thresh": request.textDetBoxThresh,
            "text_det_unclip_ratio": request.textDetUnclipRatio,
            "text_rec_score_thresh": request.textRecScoreThresh,
            "seal_det_limit_side_len": request.sealDetLimitSideLen,
            "seal_det_limit_type": request.sealDetLimitType,
            "seal_det_thresh": request.sealDetThresh,
            "seal_det_box_thresh": request.sealDetBoxThresh,
            "seal_det_unclip_ratio": request.sealDetUnclipRatio,
            "seal_rec_score_thresh": request.sealRecScoreThresh,
            "use_wired_table_cells_trans_to_html": request.useWiredTableCellsTransToHtml,
            "use_wireless_table_cells_trans_to_html": request.useWirelessTableCellsTransToHtml,
            "use_table_orientation_classify": request.useTableOrientationClassify,
            "use_ocr_results_with_table_cells": request.useOcrResultsWithTableCells,
            "use_e2e_wired_table_rec_model": request.useE2eWiredTableRecModel,
            "use_e2e_wireless_table_rec_model": request.useE2eWirelessTableRecModel,
        }
        predictions = await runner.infer(images, **infer_options)

        layout_parsing_results: List[Dict[str, Any]] = []
        for i, (source_img, prediction) in enumerate(zip(images, predictions)):
            pruned = common.prune_result(prediction.json["res"])

            markdown = prediction.markdown
            markdown_text = markdown["markdown_texts"]
            markdown_images = await _store_images(
                markdown["markdown_images"],
                log_id,
                f"markdown_{i}/{{key}}",
            )
            continuation_flags = markdown["page_continuation_flags"]

            # Visual outputs are produced only when visualization is on;
            # otherwise the entry carries no input or output images.
            exported: Dict[str, Any] = {}
            if ctx.config.visualize:
                exported = await _store_images(
                    {"input_img": source_img, **prediction.img},
                    log_id,
                    f"{{key}}_{i}.jpg",
                )

            if exported:
                # The input image is reported in its own field, so it is
                # excluded from the output image mapping.
                output_images = {
                    name: payload
                    for name, payload in exported.items()
                    if name != "input_img"
                }
            else:
                output_images = None

            layout_parsing_results.append(
                {
                    "prunedResult": pruned,
                    "markdown": {
                        "text": markdown_text,
                        "images": markdown_images,
                        "isStart": continuation_flags[0],
                        "isEnd": continuation_flags[1],
                    },
                    "outputImages": output_images,
                    "inputImage": exported.get("input_img"),
                }
            )

        infer_result = InferResult(
            layoutParsingResults=layout_parsing_results,
            dataInfo=data_info,
        )
        return AIStudioResultResponse[InferResult](
            logId=log_id,
            result=infer_result,
        )

    return app
|