# paddleocr_vl.py (2.2 KB)
  1. # Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved.
  2. #
  3. # Licensed under the Apache License, Version 2.0 (the "License");
  4. # you may not use this file except in compliance with the License.
  5. # You may obtain a copy of the License at
  6. #
  7. # http://www.apache.org/licenses/LICENSE-2.0
  8. #
  9. # Unless required by applicable law or agreed to in writing, software
  10. # distributed under the License is distributed on an "AS IS" BASIS,
  11. # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  12. # See the License for the specific language governing permissions and
  13. # limitations under the License.
  14. from typing import Dict, Final, List, Optional, Tuple, Union
  15. from pydantic import BaseModel
  16. from ..infra.models import DataInfo, PrimaryOperations
  17. from .shared import ocr
  18. __all__ = [
  19. "INFER_ENDPOINT",
  20. "InferRequest",
  21. "LayoutParsingResult",
  22. "InferResult",
  23. "PRIMARY_OPERATIONS",
  24. ]
  25. INFER_ENDPOINT: Final[str] = "/layout-parsing"
  26. class InferRequest(ocr.BaseInferRequest):
  27. useDocOrientationClassify: Optional[bool] = None
  28. useDocUnwarping: Optional[bool] = None
  29. useLayoutDetection: Optional[bool] = None
  30. useChartRecognition: Optional[bool] = None
  31. layoutThreshold: Optional[Union[float, dict]] = None
  32. layoutNms: Optional[bool] = None
  33. layoutUnclipRatio: Optional[Union[float, Tuple[float, float], dict]] = None
  34. layoutMergeBboxesMode: Optional[Union[str, dict]] = None
  35. promptLabel: Optional[str] = None
  36. formatBlockContent: Optional[bool] = None
  37. repetitionPenalty: Optional[float] = None
  38. temperature: Optional[float] = None
  39. topP: Optional[float] = None
  40. minPixels: Optional[int] = None
  41. maxPixels: Optional[int] = None
  42. prettifyMarkdown: bool = True
  43. showFormulaNumber: bool = False
  44. visualize: Optional[bool] = None
  45. class MarkdownData(BaseModel):
  46. text: str
  47. images: Optional[Dict[str, str]] = None
  48. class LayoutParsingResult(BaseModel):
  49. prunedResult: dict
  50. markdown: MarkdownData
  51. outputImages: Optional[Dict[str, str]] = None
  52. inputImage: Optional[str] = None
  53. class InferResult(BaseModel):
  54. layoutParsingResults: List[LayoutParsingResult]
  55. dataInfo: DataInfo
  56. PRIMARY_OPERATIONS: Final[PrimaryOperations] = {
  57. "infer": (INFER_ENDPOINT, InferRequest, InferResult),
  58. }