willow-inference-server (latest)

Published 2025-08-26 22:19:26 +02:00 by cs

Installation

docker pull git.stop.pe/cs/willow-inference-server:latest
sha256:65eb1e596cc083122b96a987375fb28b214d472cb130b0c4d57e14102a935a27

Image layers

ARG RELEASE
ARG LAUNCHPAD_BUILD_ARCH
LABEL org.opencontainers.image.ref.name=ubuntu
LABEL org.opencontainers.image.version=22.04
ADD file:140fb5108b4a2861b5718ad03b4a5174bba03589ea8d4c053e6a0b282f439ff3 in /
CMD ["/bin/bash"]
RUN /bin/sh -c export DEBIAN_FRONTEND=noninteractive && apt-get update && apt-get install -y --no-install-recommends apt-utils build-essential ca-certificates curl libncurses5 libncursesw5 patch wget rsync unzip jq gnupg libtcmalloc-minimal4 # buildkit
ARG CUDA_VERSION
ARG CUDA_DRIVER_VERSION
ARG JETPACK_HOST_MOUNTS
ENV CUDA_VERSION=12.2.1.020 CUDA_DRIVER_VERSION=535.86.10 CUDA_CACHE_DISABLE=1 NVIDIA_REQUIRE_JETPACK_HOST_MOUNTS=
RUN |3 CUDA_VERSION=12.2.1.020 CUDA_DRIVER_VERSION=535.86.10 JETPACK_HOST_MOUNTS= /bin/sh -c /nvidia/build-scripts/installCUDA.sh # buildkit
RUN |3 CUDA_VERSION=12.2.1.020 CUDA_DRIVER_VERSION=535.86.10 JETPACK_HOST_MOUNTS= /bin/sh -c cp -vprd /nvidia/. / && patch -p0 < /etc/startup_scripts.patch && rm -f /etc/startup_scripts.patch # buildkit
ENV _CUDA_COMPAT_PATH=/usr/local/cuda/compat ENV=/etc/shinit_v2 BASH_ENV=/etc/bash.bashrc SHELL=/bin/bash NVIDIA_REQUIRE_CUDA=cuda>=9.0
LABEL com.nvidia.volumes.needed=nvidia_driver com.nvidia.cuda.version=9.0
ARG NCCL_VERSION
ARG CUBLAS_VERSION
ARG CUFFT_VERSION
ARG CURAND_VERSION
ARG CUSPARSE_VERSION
ARG CUSOLVER_VERSION
ARG CUTENSOR_VERSION
ARG NPP_VERSION
ARG NVJPEG_VERSION
ARG CUDNN_VERSION
ARG TRT_VERSION
ARG TRTOSS_VERSION
ARG NSIGHT_SYSTEMS_VERSION
ARG NSIGHT_COMPUTE_VERSION
ENV NCCL_VERSION=2.18.3 CUBLAS_VERSION=12.2.5.1 CUFFT_VERSION=11.0.8.91 CURAND_VERSION=10.3.3.129 CUSPARSE_VERSION=12.1.2.129 CUSOLVER_VERSION=11.5.1.129 CUTENSOR_VERSION=1.7.0.1 NPP_VERSION=12.2.0.5 NVJPEG_VERSION=12.2.1.2 CUDNN_VERSION=8.9.4.25 TRT_VERSION=8.6.1.6+cuda12.0.1.011 TRTOSS_VERSION=23.08 NSIGHT_SYSTEMS_VERSION=2023.2.3.1001 NSIGHT_COMPUTE_VERSION=2023.2.1.3
RUN |17 CUDA_VERSION=12.2.1.020 CUDA_DRIVER_VERSION=535.86.10 JETPACK_HOST_MOUNTS= NCCL_VERSION=2.18.3 CUBLAS_VERSION=12.2.5.1 CUFFT_VERSION=11.0.8.91 CURAND_VERSION=10.3.3.129 CUSPARSE_VERSION=12.1.2.129 CUSOLVER_VERSION=11.5.1.129 CUTENSOR_VERSION=1.7.0.1 NPP_VERSION=12.2.0.5 NVJPEG_VERSION=12.2.1.2 CUDNN_VERSION=8.9.4.25 TRT_VERSION=8.6.1.6+cuda12.0.1.011 TRTOSS_VERSION=23.08 NSIGHT_SYSTEMS_VERSION=2023.2.3.1001 NSIGHT_COMPUTE_VERSION=2023.2.1.3 /bin/sh -c /nvidia/build-scripts/installNCCL.sh && /nvidia/build-scripts/installLIBS.sh && /nvidia/build-scripts/installCUDNN.sh && /nvidia/build-scripts/installTRT.sh && /nvidia/build-scripts/installNSYS.sh && /nvidia/build-scripts/installNCU.sh && /nvidia/build-scripts/installCUTENSOR.sh # buildkit
LABEL com.nvidia.nccl.version=2.18.3 com.nvidia.cublas.version=12.2.5.1 com.nvidia.cufft.version=11.0.8.91 com.nvidia.curand.version=10.3.3.129 com.nvidia.cusparse.version=12.1.2.129 com.nvidia.cusolver.version=11.5.1.129 com.nvidia.cutensor.version=1.7.0.1 com.nvidia.npp.version=12.2.0.5 com.nvidia.nvjpeg.version=12.2.1.2 com.nvidia.cudnn.version=8.9.4.25 com.nvidia.tensorrt.version=8.6.1.6+cuda12.0.1.011 com.nvidia.tensorrtoss.version=23.08 com.nvidia.nsightsystems.version=2023.2.3.1001 com.nvidia.nsightcompute.version=2023.2.1.3
ARG DALI_VERSION
ARG DALI_BUILD
ARG POLYGRAPHY_VERSION
ARG TRANSFORMER_ENGINE_VERSION
ENV DALI_VERSION=1.28.0 DALI_BUILD=8915302 POLYGRAPHY_VERSION=0.47.1 TRANSFORMER_ENGINE_VERSION=0.11
ADD docs.tgz / # buildkit
RUN |21 CUDA_VERSION=12.2.1.020 CUDA_DRIVER_VERSION=535.86.10 JETPACK_HOST_MOUNTS= NCCL_VERSION=2.18.3 CUBLAS_VERSION=12.2.5.1 CUFFT_VERSION=11.0.8.91 CURAND_VERSION=10.3.3.129 CUSPARSE_VERSION=12.1.2.129 CUSOLVER_VERSION=11.5.1.129 CUTENSOR_VERSION=1.7.0.1 NPP_VERSION=12.2.0.5 NVJPEG_VERSION=12.2.1.2 CUDNN_VERSION=8.9.4.25 TRT_VERSION=8.6.1.6+cuda12.0.1.011 TRTOSS_VERSION=23.08 NSIGHT_SYSTEMS_VERSION=2023.2.3.1001 NSIGHT_COMPUTE_VERSION=2023.2.1.3 DALI_VERSION=1.28.0 DALI_BUILD=8915302 POLYGRAPHY_VERSION=0.47.1 TRANSFORMER_ENGINE_VERSION=0.11 /bin/sh -c echo "/usr/local/nvidia/lib" >> /etc/ld.so.conf.d/nvidia.conf && echo "/usr/local/nvidia/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit
ARG _LIBPATH_SUFFIX
ENV PATH=/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin LD_LIBRARY_PATH=/usr/local/cuda/compat/lib:/usr/local/nvidia/lib:/usr/local/nvidia/lib64 NVIDIA_VISIBLE_DEVICES=all NVIDIA_DRIVER_CAPABILITIES=compute,utility,video
COPY entrypoint/ /opt/nvidia/ # buildkit
ENV NVIDIA_PRODUCT_NAME=CUDA
ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"]
COPY NVIDIA_Deep_Learning_Container_License.pdf /workspace/ # buildkit
RUN /bin/sh -c export DEBIAN_FRONTEND=noninteractive && apt-get update && apt-get install -y --no-install-recommends build-essential git libglib2.0-0 less libnl-route-3-200 libnl-3-dev libnl-route-3-dev libnuma-dev libnuma1 libpmi2-0-dev nano numactl openssh-client vim wget && rm -rf /var/lib/apt/lists/* # buildkit
ARG GDRCOPY_VERSION
ARG HPCX_VERSION
ARG RDMACORE_VERSION
ARG MOFED_VERSION=5.4-rdmacore39.0
ARG OPENUCX_VERSION
ARG OPENMPI_VERSION
ENV GDRCOPY_VERSION=2.3 HPCX_VERSION=2.15 MOFED_VERSION=5.4-rdmacore39.0 OPENUCX_VERSION=1.15.0 OPENMPI_VERSION=4.1.5rc2 RDMACORE_VERSION=39.0
ARG TARGETARCH
RUN |7 GDRCOPY_VERSION=2.3 HPCX_VERSION=2.15 RDMACORE_VERSION=39.0 MOFED_VERSION=5.4-rdmacore39.0 OPENUCX_VERSION=1.15.0 OPENMPI_VERSION=4.1.5rc2 TARGETARCH=amd64 /bin/sh -c cd /nvidia && ( export DEBIAN_FRONTEND=noninteractive && apt-get update && apt-get install -y --no-install-recommends libibverbs1 libibverbs-dev librdmacm1 librdmacm-dev libibumad3 libibumad-dev ibverbs-utils ibverbs-providers && rm -rf /var/lib/apt/lists/* && rm $(dpkg-query -L libibverbs-dev librdmacm-dev libibumad-dev | grep "\(\.so\|\.a\)$") ) && ( cd opt/gdrcopy/ && dpkg -i libgdrapi_*.deb ) && ( cp -r opt/hpcx /opt/ && cp etc/ld.so.conf.d/hpcx.conf /etc/ld.so.conf.d/ && ln -sf /opt/hpcx/ompi /usr/local/mpi && ln -sf /opt/hpcx/ucx /usr/local/ucx && sed -i 's/^\(hwloc_base_binding_policy\) = core$/\1 = none/' /opt/hpcx/ompi/etc/openmpi-mca-params.conf && sed -i 's/^\(btl = self\)$/#\1/' /opt/hpcx/ompi/etc/openmpi-mca-params.conf ) && ldconfig # buildkit
ENV OPAL_PREFIX=/opt/hpcx/ompi PATH=/usr/local/mpi/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/local/ucx/bin
ENV OMPI_MCA_coll_hcoll_enable=0
COPY cuda-*.patch /tmp # buildkit
RUN |7 GDRCOPY_VERSION=2.3 HPCX_VERSION=2.15 RDMACORE_VERSION=39.0 MOFED_VERSION=5.4-rdmacore39.0 OPENUCX_VERSION=1.15.0 OPENMPI_VERSION=4.1.5rc2 TARGETARCH=amd64 /bin/sh -c export DEVEL=1 BASE=0 && /nvidia/build-scripts/installNCU.sh && /nvidia/build-scripts/installCUDA.sh && /nvidia/build-scripts/installLIBS.sh && /nvidia/build-scripts/installNCCL.sh && /nvidia/build-scripts/installCUDNN.sh && /nvidia/build-scripts/installCUTENSOR.sh && /nvidia/build-scripts/installTRT.sh && /nvidia/build-scripts/installNSYS.sh && if [ -f "/tmp/cuda-${_CUDA_VERSION_MAJMIN}.patch" ]; then patch -p0 < /tmp/cuda-${_CUDA_VERSION_MAJMIN}.patch; fi && rm -f /tmp/cuda-*.patch # buildkit
ENV LIBRARY_PATH=/usr/local/cuda/lib64/stubs:
ENV NVIDIA_PRODUCT_NAME=NVIDIA TensorRT
ENV TENSORRT_VERSION=8.6.1.6+cuda12.0.1.011
LABEL com.nvidia.tensorrt.version=8.6.1.6+cuda12.0.1.011
ARG NVIDIA_TENSORRT_VERSION
ENV NVIDIA_TENSORRT_VERSION=23.08
ARG TRTOSS_VERSION=master
ENV TENSORRT_OSS_VERSION=master
ARG PYVER=2.7
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c if [ "$PYVER" == "3.8" ]; then DISTUTILS="python3-distutils"; fi # buildkit
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c PYSFX=`[ "$PYVER" != "2.7" ] && echo "$PYVER" | cut -c1-1 || echo ""` && apt-get update && DEBIAN_FRONTEND="noninteractive" apt-get install -y --no-install-recommends tzdata && apt-get install -y --no-install-recommends python$PYSFX python$PYVER-dev $DISTUTILS python$PYSFX-pip libssl-dev unzip && rm -rf /var/lib/apt/lists/* # buildkit
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c CMAKE_VERSION=3.24 CMAKE_PATCH=0 CMAKE_DIR=cmake-${CMAKE_VERSION}.${CMAKE_PATCH} && cd /usr/local/src && wget https://cmake.org/files/v${CMAKE_VERSION}/${CMAKE_DIR}.tar.gz && tar -xvf ${CMAKE_DIR}.tar.gz && cd ${CMAKE_DIR} && ./bootstrap --parallel=$(nproc) && make -j$(nproc) install && cd .. && rm -rf ${CMAKE_DIR}* # buildkit
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c cd ${HOME} && git clone -b v2.2.3 https://github.com/pybind/pybind11.git # buildkit
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c rm -f /usr/bin/python && ln -s /usr/bin/python$PYVER /usr/bin/python # buildkit
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c MAJ=`echo "$PYVER" | cut -c1-1` && rm -f /usr/bin/python$MAJ && ln -s /usr/bin/python$PYVER /usr/bin/python$MAJ # buildkit
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c curl -O https://bootstrap.pypa.io/get-pip.py && python get-pip.py && rm get-pip.py # buildkit
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c pip install --upgrade --no-cache-dir 'numpy<1.24' && pip install --upgrade --no-cache-dir pycuda pillow # buildkit
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c rm -f /etc/dpkg/dpkg.cfg.d/excludes # buildkit
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c URL=$(VERIFY=1 BASE=0 DEVEL=0 SAMPLES=0 PYTHON=0 /nvidia/build-scripts/installTRT.sh 2>/dev/null | sed -n "s/^.*\(http.*\)tar.*$/\1/p")tar && FILE=$(wget -O - $URL 2>/dev/null | sed -n 's/^.*href="\(TensorRT[^"]*\)".*$/\1/p' | grep -v internal) && wget --quiet $URL/$FILE -O - | tar -xz && PY=$(python -c 'import sys; print(str(sys.version_info[0])+str(sys.version_info[1]))') && pip install TensorRT-*/python/tensorrt-*-cp$PY*.whl && pip install TensorRT-*/graphsurgeon/graphsurgeon-*.whl && pip install TensorRT-*/uff/uff-*.whl && mv /usr/src/tensorrt /opt/ && mv TensorRT-*/samples /opt/tensorrt/ && mv TensorRT-*/data /opt/tensorrt/ && ln -s /opt/tensorrt /usr/src/tensorrt && rm -r TensorRT-* && UFF_PATH=$(pip show uff | sed -n 's/Location: \(.*\)$/\1/p')/uff && sed -i 's/from tensorflow import GraphDef/from tensorflow.python import GraphDef/' $UFF_PATH/converters/tensorflow/conversion_helpers.py && chmod +x ${UFF_PATH}/bin/convert_to_uff.py && ln -sf ${UFF_PATH}/bin/convert_to_uff.py /usr/local/bin/convert-to-uff # buildkit
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c pip install --no-cache-dir --extra-index-url https://pypi.ngc.nvidia.com --extra-index-url https://tensorrt-read-only:Tensorrt\@123@urm.nvidia.com/artifactory/api/pypi/sw-tensorrt-pypi/simple polygraphy # buildkit
COPY python_setup.sh /opt/tensorrt/python/python_setup.sh # buildkit
COPY install_opensource.sh /opt/tensorrt/ # buildkit
ENV PATH=/opt/tensorrt/bin:/usr/local/mpi/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/local/ucx/bin
COPY trt8.5-samples-cuda12.patch /tmp/ # buildkit
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c cd /opt/tensorrt/samples && patch -p2 < /tmp/trt8.5-samples-cuda12.patch && rm /tmp/trt8.5-samples-cuda12.patch # buildkit
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c mkdir -p /workspace/tensorrt && cp -r /opt/tensorrt/bin /workspace/tensorrt && cp -r /opt/tensorrt/samples /workspace/tensorrt && ln -s /opt/tensorrt/data /workspace/tensorrt && chmod -R a+w /workspace/tensorrt/bin && chmod -R a+w /workspace/tensorrt/samples # buildkit
ADD docs.tgz / # buildkit
WORKDIR /workspace
COPY README.md README.md # buildkit
RUN |3 NVIDIA_TENSORRT_VERSION=23.08 TRTOSS_VERSION=master PYVER=3.10 /bin/sh -c ln -sf ${_CUDA_COMPAT_PATH}/lib.real ${_CUDA_COMPAT_PATH}/lib && echo ${_CUDA_COMPAT_PATH}/lib > /etc/ld.so.conf.d/00-cuda-compat.conf && ldconfig && rm -f ${_CUDA_COMPAT_PATH}/lib # buildkit
COPY entrypoint.d/ /opt/nvidia/entrypoint.d/ # buildkit
ARG NVIDIA_BUILD_ID
ENV NVIDIA_BUILD_ID=66128967
LABEL com.nvidia.build.id=66128967
ARG NVIDIA_BUILD_REF
LABEL com.nvidia.build.ref=ba56432c7d5a2178d1e104da8d2e85edba7f8c23
WORKDIR /app
RUN /bin/sh -c apt-get update && apt-get install -y zstd git-lfs && rm -rf /var/lib/apt/lists/* # buildkit
COPY requirements.txt . # buildkit
RUN /bin/sh -c pip install -r requirements.txt # buildkit
RUN /bin/sh -c pip install -U torch==2.1.0 torchvision==0.16.0 torchaudio==2.1.0 # buildkit
ENV CTRANSLATE2_ROOT=/opt/ctranslate2
ENV LD_LIBRARY_PATH=/usr/local/cuda/compat/lib:/usr/local/nvidia/lib:/usr/local/nvidia/lib64:/opt/ctranslate2/lib
COPY /opt/ctranslate2 /opt/ctranslate2 # buildkit
RUN /bin/sh -c python3 -m pip --no-cache-dir install $CTRANSLATE2_ROOT/*.whl && rm $CTRANSLATE2_ROOT/*.whl # buildkit
RUN /bin/sh -c pip install auto-gptq --extra-index-url https://huggingface.github.io/autogptq-index/whl/cu118/ # buildkit
COPY . . # buildkit
CMD ["/bin/sh" "-c" "./entrypoint.sh"]
EXPOSE map[19000/tcp:{}]
EXPOSE map[19001/tcp:{}]

Labels

Key Value
com.nvidia.build.id 66128967
com.nvidia.build.ref ba56432c7d5a2178d1e104da8d2e85edba7f8c23
com.nvidia.cublas.version 12.2.5.1
com.nvidia.cuda.version 9.0
com.nvidia.cudnn.version 8.9.4.25
com.nvidia.cufft.version 11.0.8.91
com.nvidia.curand.version 10.3.3.129
com.nvidia.cusolver.version 11.5.1.129
com.nvidia.cusparse.version 12.1.2.129
com.nvidia.cutensor.version 1.7.0.1
com.nvidia.nccl.version 2.18.3
com.nvidia.npp.version 12.2.0.5
com.nvidia.nsightcompute.version 2023.2.1.3
com.nvidia.nsightsystems.version 2023.2.3.1001
com.nvidia.nvjpeg.version 12.2.1.2
com.nvidia.tensorrt.version 8.6.1.6+cuda12.0.1.011
com.nvidia.tensorrtoss.version 23.08
com.nvidia.volumes.needed nvidia_driver
org.opencontainers.image.ref.name ubuntu
org.opencontainers.image.version 22.04
Details
Container
2025-08-26 22:19:26 +02:00
7
OCI / Docker
linux/amd64
7.7 GiB
Versions (1) View all
latest 2025-08-26