Dockerfile 593 B

123456789101112131415161718
  # Image that serves the PaddleOCR-VL-0.9B model through PaddleX's GenAI
  # server using the vLLM backend, listening on port 8080.
  #
  # The base image must stay on CPython 3.10 / linux x86_64: the flash-attn
  # wheel installed below is a prebuilt cp310 linux_x86_64 binary.
  FROM python:3.10

  # libgl1 provides libGL.so.1; presumably needed by an imaging dependency of
  # PaddleX (e.g. OpenCV) -- confirm before removing.
  # update + install + list cleanup share one layer so the apt index is never
  # stale and never persisted in the image.
  RUN apt-get update \
      && apt-get install -y --no-install-recommends \
        libgl1 \
      && rm -rf /var/lib/apt/lists/*

  # PIP_NO_CACHE_DIR=1          do not keep pip's download/wheel cache in layers.
  #                             (pip disables the cache for any valid value of
  #                             this variable, including the former "0"; "1"
  #                             states the intent unambiguously.)
  # PYTHONUNBUFFERED=1          unbuffered stdout/stderr so logs appear at once.
  # PYTHONDONTWRITEBYTECODE=1   do not write .pyc files.
  ENV PIP_NO_CACHE_DIR=1 \
      PYTHONUNBUFFERED=1 \
      PYTHONDONTWRITEBYTECODE=1

  # PaddleX provides the `paddlex` CLI used in the next step; pinned to 3.3.x.
  RUN python -m pip install 'paddlex>=3.3.5,<3.4'

  # Install a prebuilt flash-attn 2.8.2 wheel (built for CUDA 12.8 / torch 2.8,
  # cp310, linux_x86_64), then let PaddleX install its genai-vllm-server plugin.
  # Kept in one layer and in this order, as in the original recipe.
  RUN python -m pip install \
        https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.14/flash_attn-2.8.2+cu128torch2.8-cp310-cp310-linux_x86_64.whl \
      && paddlex --install genai-vllm-server

  # NOTE(review): no USER is set, so the server runs as root. Switching to a
  # non-root user would be preferable but may affect existing volume mounts
  # for model/cache directories -- evaluate before changing.

  # Documentation only; the port still has to be published at `docker run`.
  EXPOSE 8080

  # Exec form so the server is PID 1 and receives SIGTERM from `docker stop`.
  CMD ["paddlex_genai_server", "--model_name", "PaddleOCR-VL-0.9B", "--host", "0.0.0.0", "--port", "8080", "--backend", "vllm"]