Eric X. Liu eric

vllm (2025-06-08-3123ba)

Published 2025-06-08 17:55:09 +00:00 by eric

Installation

docker pull git.ericxliu.me/eric/vllm:2025-06-08-3123ba
Digest: sha256:3abf718133a2ff63c2ca18fdb3c07fb40e3230faadd78924f19d91563c884823

Image Layers

ARG RELEASE
ARG LAUNCHPAD_BUILD_ARCH
LABEL org.opencontainers.image.ref.name=ubuntu
LABEL org.opencontainers.image.version=22.04
ADD file:63d5ab3ef0aab308c0e71cb67292c5467f60deafa9b0418cbb220affcd078444 in /
CMD ["/bin/bash"]
ENV NVARCH=x86_64
ENV NVIDIA_REQUIRE_CUDA=cuda>=12.2 brand=tesla,driver>=470,driver<471 brand=unknown,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=geforce,driver>=470,driver<471 brand=geforcertx,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=titan,driver>=470,driver<471 brand=titanrtx,driver>=470,driver<471 brand=tesla,driver>=525,driver<526 brand=unknown,driver>=525,driver<526 brand=nvidia,driver>=525,driver<526 brand=nvidiartx,driver>=525,driver<526 brand=geforce,driver>=525,driver<526 brand=geforcertx,driver>=525,driver<526 brand=quadro,driver>=525,driver<526 brand=quadrortx,driver>=525,driver<526 brand=titan,driver>=525,driver<526 brand=titanrtx,driver>=525,driver<526
ENV NV_CUDA_CUDART_VERSION=12.2.140-1
ENV NV_CUDA_COMPAT_PACKAGE=cuda-compat-12-2
ARG TARGETARCH
LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.0-1_all.deb && dpkg -i cuda-keyring_1.0-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit
ENV CUDA_VERSION=12.2.2
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-2=${NV_CUDA_CUDART_VERSION} ${NV_CUDA_COMPAT_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit
RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/nvidia/lib" >> /etc/ld.so.conf.d/nvidia.conf && echo "/usr/local/nvidia/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit
ENV PATH=/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib:/usr/local/nvidia/lib64
COPY NGC-DL-CONTAINER-LICENSE / # buildkit
ENV NVIDIA_VISIBLE_DEVICES=all
ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility
ENV NV_CUDA_LIB_VERSION=12.2.2-1
ENV NV_NVTX_VERSION=12.2.140-1
ENV NV_LIBNPP_VERSION=12.2.1.4-1
ENV NV_LIBNPP_PACKAGE=libnpp-12-2=12.2.1.4-1
ENV NV_LIBCUSPARSE_VERSION=12.1.2.141-1
ENV NV_LIBCUBLAS_PACKAGE_NAME=libcublas-12-2
ENV NV_LIBCUBLAS_VERSION=12.2.5.6-1
ENV NV_LIBCUBLAS_PACKAGE=libcublas-12-2=12.2.5.6-1
ENV NV_LIBNCCL_PACKAGE_NAME=libnccl2
ENV NV_LIBNCCL_PACKAGE_VERSION=2.19.3-1
ENV NCCL_VERSION=2.19.3-1
ENV NV_LIBNCCL_PACKAGE=libnccl2=2.19.3-1+cuda12.2
ARG TARGETARCH
LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-libraries-12-2=${NV_CUDA_LIB_VERSION} ${NV_LIBNPP_PACKAGE} cuda-nvtx-12-2=${NV_NVTX_VERSION} libcusparse-12-2=${NV_LIBCUSPARSE_VERSION} ${NV_LIBCUBLAS_PACKAGE} ${NV_LIBNCCL_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_PACKAGE_NAME} ${NV_LIBNCCL_PACKAGE_NAME} # buildkit
COPY entrypoint.d/ /opt/nvidia/entrypoint.d/ # buildkit
COPY nvidia_entrypoint.sh /opt/nvidia/ # buildkit
ENV NVIDIA_PRODUCT_NAME=CUDA
ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"]
ENV NV_CUDA_LIB_VERSION=12.2.2-1
ENV NV_CUDA_CUDART_DEV_VERSION=12.2.140-1
ENV NV_NVML_DEV_VERSION=12.2.140-1
ENV NV_LIBCUSPARSE_DEV_VERSION=12.1.2.141-1
ENV NV_LIBNPP_DEV_VERSION=12.2.1.4-1
ENV NV_LIBNPP_DEV_PACKAGE=libnpp-dev-12-2=12.2.1.4-1
ENV NV_LIBCUBLAS_DEV_VERSION=12.2.5.6-1
ENV NV_LIBCUBLAS_DEV_PACKAGE_NAME=libcublas-dev-12-2
ENV NV_LIBCUBLAS_DEV_PACKAGE=libcublas-dev-12-2=12.2.5.6-1
ENV NV_CUDA_NSIGHT_COMPUTE_VERSION=12.2.2-1
ENV NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE=cuda-nsight-compute-12-2=12.2.2-1
ENV NV_NVPROF_VERSION=12.2.142-1
ENV NV_NVPROF_DEV_PACKAGE=cuda-nvprof-12-2=12.2.142-1
ENV NV_LIBNCCL_DEV_PACKAGE_NAME=libnccl-dev
ENV NV_LIBNCCL_DEV_PACKAGE_VERSION=2.19.3-1
ENV NCCL_VERSION=2.19.3-1
ENV NV_LIBNCCL_DEV_PACKAGE=libnccl-dev=2.19.3-1+cuda12.2
ARG TARGETARCH
LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-dev-12-2=${NV_CUDA_CUDART_DEV_VERSION} cuda-command-line-tools-12-2=${NV_CUDA_LIB_VERSION} cuda-minimal-build-12-2=${NV_CUDA_LIB_VERSION} cuda-libraries-dev-12-2=${NV_CUDA_LIB_VERSION} cuda-nvml-dev-12-2=${NV_NVML_DEV_VERSION} ${NV_NVPROF_DEV_PACKAGE} ${NV_LIBNPP_DEV_PACKAGE} libcusparse-dev-12-2=${NV_LIBCUSPARSE_DEV_VERSION} ${NV_LIBCUBLAS_DEV_PACKAGE} ${NV_LIBNCCL_DEV_PACKAGE} ${NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_DEV_PACKAGE_NAME} ${NV_LIBNCCL_DEV_PACKAGE_NAME} # buildkit
ENV LIBRARY_PATH=/usr/local/cuda/lib64/stubs
ARG CUDA_VERSION=12.2.2
ARG PYTHON_VERSION=3.12
WORKDIR /vllm-workspace
ENV DEBIAN_FRONTEND=noninteractive
ARG TARGETPLATFORM
SHELL [/bin/bash -c]
RUN |3 CUDA_VERSION=12.2.2 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/bash -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit
RUN |3 CUDA_VERSION=12.2.2 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/bash -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y ccache software-properties-common git curl wget sudo vim python3-pip && apt-get install -y ffmpeg libsm6 libxext6 libgl1 && for i in 1 2 3; do add-apt-repository -y ppa:deadsnakes/ppa && break || { echo "Attempt $i failed, retrying in 5s..."; sleep 5; }; done && apt-get update -y && apt-get install -y python${PYTHON_VERSION} python${PYTHON_VERSION}-dev python${PYTHON_VERSION}-venv libibverbs-dev && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PYTHON_VERSION} 1 && update-alternatives --set python3 /usr/bin/python${PYTHON_VERSION} && ln -sf /usr/bin/python${PYTHON_VERSION}-config /usr/bin/python3-config && curl -sS https://bootstrap.pypa.io/get-pip.py | python${PYTHON_VERSION} && python3 --version && python3 -m pip --version # buildkit
RUN |3 CUDA_VERSION=12.2.2 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/bash -c python3 -m pip install uv # buildkit
ENV UV_HTTP_TIMEOUT=500
ENV UV_INDEX_STRATEGY=unsafe-best-match
RUN |3 CUDA_VERSION=12.2.2 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/bash -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit
RUN |3 CUDA_VERSION=12.2.2 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/bash -c if [ "$TARGETPLATFORM" = "linux/arm64" ]; then uv pip install --system --index-url https://download.pytorch.org/whl/nightly/cu128 "torch==2.8.0.dev20250318+cu128" "torchvision==0.22.0.dev20250319"; uv pip install --system --index-url https://download.pytorch.org/whl/nightly/cu128 --pre pytorch_triton==3.3.0+gitab727c40; fi # buildkit
RUN |3 CUDA_VERSION=12.2.2 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/bash -c uv pip install --system dist/*.whl --verbose --extra-index-url https://download.pytorch.org/whl/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit
RUN |3 CUDA_VERSION=12.2.2 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/bash -c . /etc/environment && if [ "$TARGETPLATFORM" != "linux/arm64" ]; then if [[ "$CUDA_VERSION" == 12.8* ]]; then uv pip install --system https://download.pytorch.org/whl/cu128/flashinfer/flashinfer_python-0.2.5%2Bcu128torch2.7-cp38-abi3-linux_x86_64.whl; else export TORCH_CUDA_ARCH_LIST='7.5 8.0 8.9 9.0+PTX'; CUDA_MAJOR="${CUDA_VERSION%%.*}"; if [ "$CUDA_MAJOR" -lt 12 ]; then export FLASHINFER_ENABLE_SM90=0; fi; uv pip install --system --no-build-isolation "git+https://github.com/flashinfer-ai/flashinfer@21ea1d2545f74782b91eb8c08fd503ac4c0743fc" ; fi fi # buildkit
COPY examples examples # buildkit
COPY benchmarks benchmarks # buildkit
COPY ./vllm/collect_env.py . # buildkit
RUN |3 CUDA_VERSION=12.2.2 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/bash -c . /etc/environment && uv pip list # buildkit
COPY requirements/build.txt requirements/build.txt # buildkit
RUN |3 CUDA_VERSION=12.2.2 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/bash -c uv pip install --system -r requirements/build.txt --extra-index-url https://download.pytorch.org/whl/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit
ARG TARGETPLATFORM
ENV UV_HTTP_TIMEOUT=500
RUN |1 TARGETPLATFORM=linux/amd64 /bin/bash -c if [ "$TARGETPLATFORM" = "linux/arm64" ]; then uv pip install --system accelerate hf_transfer 'modelscope!=1.15.0' 'bitsandbytes>=0.42.0' 'timm==0.9.10' boto3 runai-model-streamer runai-model-streamer[s3]; else uv pip install --system accelerate hf_transfer 'modelscope!=1.15.0' 'bitsandbytes>=0.45.3' 'timm==0.9.10' boto3 runai-model-streamer runai-model-streamer[s3]; fi # buildkit
ENV VLLM_USAGE_SOURCE=production-docker-image
ENTRYPOINT ["python3" "-m" "vllm.entrypoints.openai.api_server"]

Labels

Key | Value
maintainer | NVIDIA CORPORATION <cudatools@nvidia.com>
org.opencontainers.image.ref.name | ubuntu
org.opencontainers.image.version | 22.04
Details
Container
2025-06-08 17:55:09 +00:00
1
OCI / Docker
linux/amd64
7.4 GiB
Versions (5) View all
latest 2025-08-08
2025-08-08-fc8b89 2025-08-08
2025-06-08-3123ba 2025-06-08
2025-06-08-0e7123 2025-06-08
nightly 2025-06-08