| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115 |
- # Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- from typing import Dict, Final, List, Optional, Tuple, Union
- from pydantic import BaseModel
- from ..infra.models import DataInfo, PrimaryOperations
- from .shared import ocr
- __all__ = [
- "ANALYZE_IMAGES_ENDPOINT",
- "AnalyzeImagesRequest",
- "LayoutParsingResult",
- "AnalyzeImagesResult",
- "TRANSLATE_ENDPOINT",
- "TranslateRequest",
- "TranslationResult",
- "TranslateResult",
- "PRIMARY_OPERATIONS",
- ]
- ANALYZE_IMAGES_ENDPOINT: Final[str] = "/doctrans-visual"
- class AnalyzeImagesRequest(ocr.BaseInferRequest):
- useDocOrientationClassify: Optional[bool] = False
- useDocUnwarping: Optional[bool] = False
- useTextlineOrientation: Optional[bool] = None
- useSealRecognition: Optional[bool] = None
- useTableRecognition: Optional[bool] = None
- useFormulaRecognition: Optional[bool] = None
- useChartRecognition: Optional[bool] = False
- useRegionDetection: Optional[bool] = None
- layoutThreshold: Optional[Union[float, dict]] = None
- layoutNms: Optional[bool] = None
- layoutUnclipRatio: Optional[Union[float, Tuple[float, float], dict]] = None
- layoutMergeBboxesMode: Optional[Union[str, dict]] = None
- textDetLimitSideLen: Optional[int] = None
- textDetLimitType: Optional[str] = None
- textDetThresh: Optional[float] = None
- textDetBoxThresh: Optional[float] = None
- textDetUnclipRatio: Optional[float] = None
- textRecScoreThresh: Optional[float] = None
- sealDetLimitSideLen: Optional[int] = None
- sealDetLimitType: Optional[str] = None
- sealDetThresh: Optional[float] = None
- sealDetBoxThresh: Optional[float] = None
- sealDetUnclipRatio: Optional[float] = None
- sealRecScoreThresh: Optional[float] = None
- useWiredTableCellsTransToHtml: bool = False
- useWirelessTableCellsTransToHtml: bool = False
- useTableOrientationClassify: bool = True
- useOcrResultsWithTableCells: bool = True
- useE2eWiredTableRecModel: bool = False
- useE2eWirelessTableRecModel: bool = True
- visualize: Optional[bool] = None
- class LayoutParsingResult(BaseModel):
- prunedResult: dict
- markdown: ocr.MarkdownData
- outputImages: Optional[Dict[str, str]] = None
- inputImage: Optional[str] = None
- class AnalyzeImagesResult(BaseModel):
- layoutParsingResults: List[LayoutParsingResult]
- dataInfo: DataInfo
- TRANSLATE_ENDPOINT: Final[str] = "/doctrans-translate"
- class TranslateRequest(BaseModel):
- markdownList: List[ocr.MarkdownData]
- targetLanguage: str = "zh"
- chunkSize: int = 5000
- taskDescription: Optional[str] = None
- outputFormat: Optional[str] = None
- rulesStr: Optional[str] = None
- fewShotDemoTextContent: Optional[str] = None
- fewShotDemoKeyValueList: Optional[str] = None
- chatBotConfig: Optional[dict] = None
- sleepInterval: float = 0
- class TranslationResult(BaseModel):
- language: str
- markdown: ocr.MarkdownData
- class TranslateResult(BaseModel):
- translationResults: List[TranslationResult]
- PRIMARY_OPERATIONS: Final[PrimaryOperations] = {
- "analyzeImages": (
- ANALYZE_IMAGES_ENDPOINT,
- AnalyzeImagesRequest,
- AnalyzeImagesResult,
- ),
- "translate": (TRANSLATE_ENDPOINT, TranslateRequest, TranslateResult),
- }
|