Dockerfile 5.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163
  1. # 1. Should I use `syntax` parser directive?
  2. # 2. Can I use `COPY --link` to optimize caching?
  3. # 3. Create a non-root user for deployment?
  4. # 4. Should I use APT repository mirrors?
  5. # 5. Use cache mounts for `pip`?
  6. ARG DEVICE_TYPE=gpu
  7. ARG ENV_TYPE=prod
  8. ARG PIP_INDEX_URL=https://pypi.org/simple
  9. # GPU base
  10. # nvcr.io/nvidia/cuda:11.8.0-devel-ubuntu20.04
  11. # We use the `devel` version because the CUDA toolchain is needed for JIT.
  12. # However, can we use a smaller base image by not including tools and
  13. # libraries that are not required?
  14. FROM nvcr.io/nvidia/cuda@sha256:03681bbd11fea044ff3e3a5d65e190a6f935af30c56e03e740b27e4563f61e0f AS gpu-base
  15. # CPU base
  16. # ubuntu:20.04
  17. FROM ubuntu:20.04@sha256:8feb4d8ca5354def3d8fce243717141ce31e2c428701f6682bd2fafe15388214 AS cpu-base
  18. # Base
  19. FROM ${DEVICE_TYPE}-base AS base
  20. ARG PIP_INDEX_URL
  21. # Should I add `SHELL ["/bin/bash", "-c"]`?
  22. ENV DEBIAN_FRONTEND=noninteractive
  23. RUN mkdir /paddlex
  24. RUN echo 'deb http://archive.ubuntu.com/ubuntu jammy main universe' > /etc/apt/sources.list.d/jammy-temp.list \
  25. && apt-get update \
  26. && apt-get install -y --no-install-recommends python3.10 python3.10-venv \
  27. && python3.10 -m venv /paddlex/py310 \
  28. && rm -rf /var/lib/apt/lists/*
  29. ENV PATH="/paddlex/py310/bin:${PATH}"
  30. ENV PIP_DISABLE_PIP_VERSION_CHECK=1
  31. ENV PIP_NO_CACHE_DIR=0
  32. ENV PYTHONUNBUFFERED=1
  33. ENV PYTHONDONTWRITEBYTECODE=1
  34. ENV PIP_INDEX_URL=${PIP_INDEX_URL}
  35. # Requirement collection
  36. FROM base AS rc
  37. RUN python -m pip install pip-tools==7.4.1
  38. # `ENTRYPOINT` and `CMD`?
  39. # Build stage 1
  40. FROM base AS build1
  41. RUN apt-get update \
  42. && apt-get install -y --no-install-recommends wget unzip \
  43. && rm -rf /var/lib/apt/lists/*
  44. RUN mkdir -p /paddlex/libs
  45. # Build stage 2 for GPU
  46. FROM build1 AS gpu-build2
  47. RUN mkdir -p /paddlex/tensorrt
  48. RUN --mount=type=bind,source=deploy/hps/server_env/cudnn-linux-x86_64-8.9.7.29_cuda11-archive.tar.xz,target=/tmp/cudnn-linux-x86_64-8.9.7.29_cuda11-archive.tar.xz \
  49. tar -xf /tmp/cudnn-linux-x86_64-8.9.7.29_cuda11-archive.tar.xz -C /paddlex \
  50. && mv /paddlex/cudnn-linux-x86_64-8.9.7.29_cuda11-archive/lib/* /paddlex/libs/
  51. RUN --mount=type=bind,source=deploy/hps/server_env/TensorRT-8.6.1.6.Linux.x86_64-gnu.cuda-11.8.tar.gz,target=/tmp/TensorRT-8.6.1.6.Linux.x86_64-gnu.cuda-11.8.tar.gz \
  52. tar -xf /tmp/TensorRT-8.6.1.6.Linux.x86_64-gnu.cuda-11.8.tar.gz -C /paddlex \
  53. && mv /paddlex/TensorRT-8.6.1.6 /paddlex/tensorrt \
  54. && rm -rf /paddlex/tensorrt/data /paddlex/tensorrt/doc /paddlex/tensorrt/python /paddlex/tensorrt/samples
  55. # Build Stage 2 for CPU
  56. FROM build1 AS cpu-build2
  57. # Build Stage 3
  58. FROM ${DEVICE_TYPE}-build2 AS build3
  59. ARG DEVICE_TYPE
  60. ARG ENV_TYPE
  61. RUN wget -P /paddlex "https://paddle-model-ecology.bj.bcebos.com/paddlex/PaddleX3.0/deploy/deps/tritonserver/tritonserver-2.15.0-${DEVICE_TYPE}.zip" \
  62. && unzip "/paddlex/tritonserver-2.15.0-${DEVICE_TYPE}.zip" -d /paddlex \
  63. && mv "/paddlex/tritonserver-2.15.0-${DEVICE_TYPE}" /paddlex/tritonserver \
  64. && rm "/paddlex/tritonserver-2.15.0-${DEVICE_TYPE}.zip"
  65. RUN --mount=type=bind,source=deploy/hps/server_env/requirements/${DEVICE_TYPE}.txt,target=/tmp/requirements.txt \
  66. --mount=type=bind,source=deploy/hps/server_env/requirements/${DEVICE_TYPE}_hpi.txt,target=/tmp/hpi_requirements.txt \
  67. --mount=type=bind,source=deploy/hps/server_env/requirements/${DEVICE_TYPE}_dev.txt,target=/tmp/dev_requirements.txt \
  68. python -m pip install --requirement /tmp/requirements.txt --requirement /tmp/hpi_requirements.txt \
  69. && if [ "${ENV_TYPE}" = 'dev' ]; then \
  70. python -m pip install --requirement /tmp/dev_requirements.txt; \
  71. fi \
  72. && python -m pip install https://paddle-whl.bj.bcebos.com/nightly/cu126/safetensors/safetensors-0.6.2.dev0-cp38-abi3-linux_x86_64.whl
  73. RUN --mount=type=bind,source=.,target=/tmp/PaddleX,rw \
  74. python -m pip install --no-deps /tmp/PaddleX
  75. RUN --mount=type=bind,source=deploy/hps/server_env/paddlex-hps-server,target=/tmp/paddlex-hps-server,rw \
  76. python -m pip install --no-deps /tmp/paddlex-hps-server
  77. # GPU Deployment
  78. FROM base AS gpu-deployment
  79. RUN apt-get update \
  80. && apt-get install -y --no-install-recommends datacenter-gpu-manager \
  81. && rm -rf /var/lib/apt/lists/*
  82. COPY --from=build3 --chown=paddlex:paddlex /paddlex/tensorrt /paddlex/tensorrt
  83. ENV LD_LIBRARY_PATH="/paddlex/tensorrt/lib:${LD_LIBRARY_PATH}"
  84. RUN mkdir /paddlex/libs
  85. RUN ln -s /usr/local/cuda-11.8/targets/x86_64-linux/lib/libcublas.so.11 /paddlex/libs/libcublas.so \
  86. && ln -s /usr/local/cuda-11.8/targets/x86_64-linux/lib/libcufft.so.10 /paddlex/libs/libcufft.so \
  87. && ln -s /usr/local/cuda-11.8/targets/x86_64-linux/lib/libcurand.so.10 /paddlex/libs/libcurand.so \
  88. && ln -s /usr/local/cuda-11.8/targets/x86_64-linux/lib/libcusolver.so.11 /paddlex/libs/libcusolver.so \
  89. && ln -s /usr/local/cuda-11.8/targets/x86_64-linux/lib/libcusparse.so.11 /paddlex/libs/libcusparse.so
  90. # CPU Deployment
  91. FROM base AS cpu-deployment
  92. # Deployment
  93. FROM ${DEVICE_TYPE}-deployment AS deployment
  94. # Should we use an environment variable to store the version?
  95. RUN groupadd -g 1000 paddlex \
  96. && useradd -m -s /bin/bash -u 1000 -g 1000 paddlex
  97. # Not sure if all these deps are necessary
  98. RUN apt-get update \
  99. && apt-get install -y --no-install-recommends libre2-5 libssl1.1 libb64-0d libnuma1 libarchive13 python3.10-dev libgl1-mesa-glx libglib2.0-0 libgomp1 ccache binutils build-essential texlive texlive-latex-base texlive-latex-extra \
  100. && rm -rf /var/lib/apt/lists/*
  101. COPY --from=build3 --chown=paddlex:paddlex /paddlex/libs /paddlex/libs
  102. # Should I use `ldconfig`?
  103. ENV LD_LIBRARY_PATH="/paddlex/libs:${LD_LIBRARY_PATH}"
  104. COPY --from=build3 --chown=paddlex:paddlex /paddlex/tritonserver /opt/tritonserver
  105. ENV PATH="/opt/tritonserver/bin:${PATH}"
  106. # Is the merging safe?
  107. COPY --from=build3 --chown=paddlex:paddlex /paddlex/py310 /paddlex/py310
  108. RUN mkdir /paddlex/var \
  109. && chown paddlex:paddlex /paddlex/var
  110. USER paddlex
  111. USER root
  112. CMD ["/bin/bash"]