| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778 |
- # Copyright (c) 2024 PaddlePaddle Authors. All Rights Reserved.
- #
- # Licensed under the Apache License, Version 2.0 (the "License");
- # you may not use this file except in compliance with the License.
- # You may obtain a copy of the License at
- #
- # http://www.apache.org/licenses/LICENSE-2.0
- #
- # Unless required by applicable law or agreed to in writing, software
- # distributed under the License is distributed on an "AS IS" BASIS,
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
- # See the License for the specific language governing permissions and
- # limitations under the License.
- from enum import Enum
- from typing import Final, List, Literal, Optional, Union
- from pydantic import BaseModel, HttpUrl
- from ....utils.deps import is_dep_available
- from ..infra.models import PrimaryOperations
- if is_dep_available("openai"):
- from openai.types.chat import ChatCompletion
# Names exported by a star-import of this module.
__all__ = ["INFER_ENDPOINT", "InferRequest", "PRIMARY_OPERATIONS"]
# Endpoint path string used for the "infer" entry of PRIMARY_OPERATIONS.
INFER_ENDPOINT: Final[str] = "/document-understanding"
class ContentType(str, Enum):
    """Tag values that identify the kind of a message content part.

    Each member is also a ``str`` instance, so it compares equal to its raw
    string value.
    """

    TEXT = "text"
    IMAGE_URL = "image_url"
class RoleType(str, Enum):
    """String-valued role names.

    Each member is also a ``str`` instance, so it compares equal to its raw
    string value.
    """

    USER = "user"
    ASSISTANT = "assistant"
    SYSTEM = "system"
class ImageUrl(BaseModel):
    """Image reference paired with a detail setting."""

    # Accepts either a pydantic ``HttpUrl`` or any plain string.
    # NOTE(review): the ``str`` arm presumably exists to admit non-HTTP
    # references (e.g. data URIs) -- confirm against callers.
    url: Union[HttpUrl, str]

    # One of "low", "high", "auto", or None; "auto" when omitted.
    detail: Optional[Literal["low", "high", "auto"]] = "auto"
class TextContent(BaseModel):
    """Content part that carries plain text."""

    # Fixed tag: only ContentType.TEXT is accepted, and it is the default.
    type: Literal[ContentType.TEXT] = ContentType.TEXT

    # Required text payload.
    text: str
class ImageContent(BaseModel):
    """Content part that carries an image reference."""

    # Fixed tag: only ContentType.IMAGE_URL is accepted, and it is the default.
    type: Literal[ContentType.IMAGE_URL] = ContentType.IMAGE_URL

    # Required; either a bare ``HttpUrl`` or a full ``ImageUrl`` object.
    image_url: Union[HttpUrl, ImageUrl]
class Message(BaseModel):
    """A single message: a role plus its content."""

    # Declared as a plain string, so values are not restricted to the
    # members of RoleType.
    role: str

    # Either one string, or a list mixing TextContent and ImageContent parts.
    content: Union[
        str,
        List[Union[TextContent, ImageContent]],
    ]
class InferRequest(BaseModel):
    """Request model registered for the "infer" operation.

    Only ``model`` and ``messages`` are required; every other field is
    optional and falls back to the default shown next to it.
    """

    # Required model identifier string.
    model: str

    # Required list of Message objects.
    messages: List[Message]

    # Defaults to 1024.
    max_tokens: Optional[int] = 1024

    # Defaults to 0.1.
    temperature: Optional[float] = 0.1

    # Defaults to 0.95.
    top_p: Optional[float] = 0.95

    # Defaults to False.
    stream: Optional[bool] = False

    # Defaults to None.
    # NOTE(review): how this limit is applied is not visible in this module --
    # confirm against the consumer of this request.
    max_image_tokens: Optional[int] = None
# Maps an operation name to a tuple of (endpoint path, request model, and
# presumably the response type -- confirm against PrimaryOperations).
# NOTE(review): ``ChatCompletion`` is imported only when the "openai"
# dependency is available, so this assignment presumably raises NameError
# without it -- confirm whether that is intended.
PRIMARY_OPERATIONS: Final[PrimaryOperations] = {
    "infer": (
        INFER_ENDPOINT,
        InferRequest,
        ChatCompletion,
    ),
}
|