Namespace
vllm
Image / Tag
vllm-openai:nightly-a238cbd89d07b4b0ed8fb3dff3c219a3ee3a1651
Content Digest
sha256:e3fd8b512a65979c2f3477de8976bb98f477412e9f920344946ad488a93ed269
Details
Created

2025-12-06 06:45:54 UTC

Size

8.3 GB

Content Digest
Labels
  • maintainer
    NVIDIA CORPORATION <cudatools@nvidia.com>
  • org.opencontainers.image.ref.name
    ubuntu
  • org.opencontainers.image.version
    22.04

Environment
CUDA_VERSION

12.9.1

DEBIAN_FRONTEND

noninteractive

LD_LIBRARY_PATH

/usr/local/nvidia/lib64:/usr/local/cuda/lib64:/usr/local/cuda/lib64

NVARCH

x86_64

NVIDIA_DRIVER_CAPABILITIES

compute,utility

NVIDIA_REQUIRE_CUDA

cuda>=12.9 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566 brand=unknown,driver>=570,driver<571 brand=grid,driver>=570,driver<571 brand=tesla,driver>=570,driver<571 brand=nvidia,driver>=570,driver<571 brand=quadro,driver>=570,driver<571 brand=quadrortx,driver>=570,driver<571 brand=nvidiartx,driver>=570,driver<571 
brand=vapps,driver>=570,driver<571 brand=vpc,driver>=570,driver<571 brand=vcs,driver>=570,driver<571 brand=vws,driver>=570,driver<571 brand=cloudgaming,driver>=570,driver<571

NVIDIA_VISIBLE_DEVICES

all

NV_CUDA_CUDART_VERSION

12.9.79-1

PATH

/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

UV_HTTP_TIMEOUT

500

UV_INDEX_STRATEGY

unsafe-best-match

UV_LINK_MODE

copy

VLLM_USAGE_SOURCE

production-docker-image


Layers

[#000] sha256:66587c81b81a58d07e40c48d900a1517516bbf58c4378c687d89d645824f5e5f - 0.34% (29 MB)

[#001] sha256:f29b1d4013a93a17a4d4acbb760170b608e6707e85419f0e1a2973233f1c0080 - 0.05% (4.43 MB)

[#002] sha256:340d44d2921c44112afe4f535a1a3bcfdc4eed5093388d098937942f7f883739 - 1.16% (98.7 MB)

[#003] sha256:59a4bcbddda3c45ff4949d35d2321b6eca9eaff7daae2334c99226bb19f60c3a - 0.0% (184 Bytes)

[#004] sha256:6e8af4fd0a071982e528b634ba99dec2474c21147f99748be708f36e10e3f4c2 - 0.0% (6.72 KB)

[#005] sha256:1cb38f62db51af30b28de37e6dd075e0acfc2b4ef89046d16ebf56be70e5b2e9 - 0.0% (104 Bytes)

[#006] sha256:4f8bfc9b42556cf08825630c243f61c74fd37df0c1c1405b79420b7da166f0fc - 0.0% (229 Bytes)

[#007] sha256:7bc0c07ee56a635a3ad373c1a3037f85b8a27cf679776bda46485c14845a6d46 - 2.58% (219 MB)

[#008] sha256:c202bdc28f166b1e0f8f89c5fe72ecf67493dbf2de642f19672e3035700eaa6e - 15.56% (1.29 GB)

[#009] sha256:6a2139942f1baa1511335ae6374af835cc062b796330db7bb69800f9257a52a1 - 0.5% (42.4 MB)

[#010] sha256:2c1e830c82fedbaee77903c51e3ab2c184b6e12414f7bb5deb4340c75db59c54 - 0.0% (11.1 KB)

[#011] sha256:87771e5a516cb10f5ace5fbe98a4e1945a3834c7d43872f9b68f1259447f50f9 - 62.59% (5.2 GB)

[#012] sha256:c1c35da6533816b034ffe1cd664f4d2a3dc1ebad57bfd10d29a08d273bb1effd - 14.41% (1.2 GB)

[#013] sha256:08147c2d1dd4405d3c78799d3b2914c4e6912c12359e3b8e714c3df4efb7df3c - 0.0% (189 KB)

[#014] sha256:e3a019af594c0552be59a45644e0fb3915007d2ab9bf8c70a7c1937df260c911 - 0.0% (169 KB)

[#015] sha256:17184632aa4fa1cd2739e75b963344d63b7c4436a934dd59a50756b7770b3d30 - 0.0% (8.21 KB)

[#016] sha256:c70e86b7d130c2ed284675b2615aedba87095978baa2ac17eb90dfb4dbf417db - 0.0% (121 Bytes)

[#017] sha256:e9fdaa555352f4678f0e5e94a2428cc156d4ff4a2be96f54503d6bc8fcc171a0 - 0.09% (7.61 MB)

[#018] sha256:6fd16840b0d75fc8d4de4c9d9e6036d61022eab8a9874171eabee1acd830a75a - 1.06% (89.9 MB)

[#019] sha256:457aee086e49493c70ebb19dd9e28334255650c0918c91b50c07300d4a484319 - 0.01% (525 KB)

[#020] sha256:6a26fcd97f19791e15061d66d4150ee69431d932515bf41d8f9ab87462c076f4 - 1.65% (140 MB)


History
2025-07-14 16:33:29 UTC

/bin/sh -c #(nop) ARG RELEASE

2025-07-14 16:33:29 UTC

/bin/sh -c #(nop) ARG LAUNCHPAD_BUILD_ARCH

2025-07-14 16:33:29 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.ref.name=ubuntu

2025-07-14 16:33:29 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.version=22.04

2025-07-14 16:33:31 UTC

/bin/sh -c #(nop) ADD file:415bbc01dfb447d002e2d8173e113ef025d2bbfa20f1205823fa699dc87a2019 in /

2025-07-14 16:33:32 UTC

/bin/sh -c #(nop) CMD ["/bin/bash"]

2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)

ENV NVARCH=x86_64

2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_REQUIRE_CUDA=cuda>=12.9 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566 brand=unknown,driver>=570,driver<571 brand=grid,driver>=570,driver<571 brand=tesla,driver>=570,driver<571 brand=nvidia,driver>=570,driver<571 brand=quadro,driver>=570,driver<571 brand=quadrortx,driver>=570,driver<571 
brand=nvidiartx,driver>=570,driver<571 brand=vapps,driver>=570,driver<571 brand=vpc,driver>=570,driver<571 brand=vcs,driver>=570,driver<571 brand=vws,driver>=570,driver<571 brand=cloudgaming,driver>=570,driver<571

2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_CUDART_VERSION=12.9.79-1

2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.1-1_all.deb && dpkg -i cuda-keyring_1.1-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit

2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)

ENV CUDA_VERSION=12.9.1

2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-9=${NV_CUDA_CUDART_VERSION} cuda-compat-12-9 && rm -rf /var/lib/apt/lists/* # buildkit

2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/cuda/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit

2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)

ENV PATH=/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)

ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64

2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)

COPY NGC-DL-CONTAINER-LICENSE / # buildkit

2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_VISIBLE_DEVICES=all

2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility

2025-12-06 06:20:47 UTC (buildkit.dockerfile.v0)

ARG CUDA_VERSION

2025-12-06 06:20:47 UTC (buildkit.dockerfile.v0)

ARG PYTHON_VERSION

2025-12-06 06:20:47 UTC (buildkit.dockerfile.v0)

ARG INSTALL_KV_CONNECTORS=false

2025-12-06 06:20:47 UTC (buildkit.dockerfile.v0)

WORKDIR /vllm-workspace

2025-12-06 06:20:47 UTC (buildkit.dockerfile.v0)

ENV DEBIAN_FRONTEND=noninteractive

2025-12-06 06:20:47 UTC (buildkit.dockerfile.v0)

ARG TARGETPLATFORM

2025-12-06 06:20:47 UTC (buildkit.dockerfile.v0)

ARG GDRCOPY_CUDA_VERSION=12.8

2025-12-06 06:20:47 UTC (buildkit.dockerfile.v0)

ARG GDRCOPY_OS_VERSION=Ubuntu22_04

2025-12-06 06:20:47 UTC (buildkit.dockerfile.v0)

SHELL [/bin/bash -c]

2025-12-06 06:20:47 UTC (buildkit.dockerfile.v0)

ARG DEADSNAKES_MIRROR_URL

2025-12-06 06:20:47 UTC (buildkit.dockerfile.v0)

ARG DEADSNAKES_GPGKEY_URL

2025-12-06 06:20:47 UTC (buildkit.dockerfile.v0)

ARG GET_PIP_URL

2025-12-06 06:21:28 UTC (buildkit.dockerfile.v0)

RUN |9 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/bash -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit

2025-12-06 06:25:17 UTC (buildkit.dockerfile.v0)

RUN |9 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/bash -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y --no-install-recommends software-properties-common curl sudo python3-pip ffmpeg libsm6 libxext6 libgl1 && if [ ! -z ${DEADSNAKES_MIRROR_URL} ] ; then if [ ! -z "${DEADSNAKES_GPGKEY_URL}" ] ; then mkdir -p -m 0755 /etc/apt/keyrings ; curl -L ${DEADSNAKES_GPGKEY_URL} | gpg --dearmor > /etc/apt/keyrings/deadsnakes.gpg ; sudo chmod 644 /etc/apt/keyrings/deadsnakes.gpg ; echo "deb [signed-by=/etc/apt/keyrings/deadsnakes.gpg] ${DEADSNAKES_MIRROR_URL} $(lsb_release -cs) main" > /etc/apt/sources.list.d/deadsnakes.list ; fi ; else for i in 1 2 3; do add-apt-repository -y ppa:deadsnakes/ppa && break || { echo "Attempt $i failed, retrying in 5s..."; sleep 5; }; done ; fi && apt-get update -y && apt-get install -y --no-install-recommends python${PYTHON_VERSION} python${PYTHON_VERSION}-dev python${PYTHON_VERSION}-venv libibverbs-dev && rm -rf /var/lib/apt/lists/* && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PYTHON_VERSION} 1 && update-alternatives --set python3 /usr/bin/python${PYTHON_VERSION} && ln -sf /usr/bin/python${PYTHON_VERSION}-config /usr/bin/python3-config && curl -sS ${GET_PIP_URL} | python${PYTHON_VERSION} && python3 --version && python3 -m pip --version # buildkit

2025-12-06 06:26:30 UTC (buildkit.dockerfile.v0)

RUN |9 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/bash -c CUDA_VERSION_DASH=$(echo $CUDA_VERSION | cut -d. -f1,2 | tr '.' '-') && apt-get update -y && apt-get install -y --no-install-recommends cuda-nvcc-${CUDA_VERSION_DASH} cuda-cudart-${CUDA_VERSION_DASH} cuda-nvrtc-${CUDA_VERSION_DASH} cuda-cuobjdump-${CUDA_VERSION_DASH} libcurand-dev-${CUDA_VERSION_DASH} libcublas-${CUDA_VERSION_DASH} libnccl-dev && rm -rf /var/lib/apt/lists/* # buildkit

2025-12-06 06:26:30 UTC (buildkit.dockerfile.v0)

ARG PIP_INDEX_URL UV_INDEX_URL

2025-12-06 06:26:30 UTC (buildkit.dockerfile.v0)

ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL

2025-12-06 06:26:30 UTC (buildkit.dockerfile.v0)

ARG PYTORCH_CUDA_INDEX_BASE_URL

2025-12-06 06:26:30 UTC (buildkit.dockerfile.v0)

ARG PIP_KEYRING_PROVIDER UV_KEYRING_PROVIDER

2025-12-06 06:26:33 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c python3 -m pip install uv # buildkit

2025-12-06 06:26:33 UTC (buildkit.dockerfile.v0)

ENV UV_HTTP_TIMEOUT=500

2025-12-06 06:26:33 UTC (buildkit.dockerfile.v0)

ENV UV_INDEX_STRATEGY=unsafe-best-match

2025-12-06 06:26:33 UTC (buildkit.dockerfile.v0)

ENV UV_LINK_MODE=copy

2025-12-06 06:26:33 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit

2025-12-06 06:43:41 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c uv pip install --system dist/*.whl --verbose --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit

2025-12-06 06:45:31 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c uv pip install --system flashinfer-cubin==0.5.3 && uv pip install --system flashinfer-jit-cache==0.5.3 --extra-index-url https://flashinfer.ai/whl/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') && flashinfer show-config # buildkit

2025-12-06 06:45:31 UTC (buildkit.dockerfile.v0)

COPY examples examples # buildkit

2025-12-06 06:45:31 UTC (buildkit.dockerfile.v0)

COPY benchmarks benchmarks # buildkit

2025-12-06 06:45:31 UTC (buildkit.dockerfile.v0)

COPY ./vllm/collect_env.py . # buildkit

2025-12-06 06:45:32 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c . /etc/environment && uv pip list # buildkit

2025-12-06 06:45:33 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c sh -c 'if ls /tmp/deepgemm/dist/*.whl >/dev/null 2>&1; then uv pip install --system /tmp/deepgemm/dist/*.whl; else echo "No DeepGEMM wheels to install; skipping."; fi' # buildkit

2025-12-06 06:45:33 UTC (buildkit.dockerfile.v0)

ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64:/usr/local/cuda/lib64

2025-12-06 06:45:36 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c uv pip install --system ep_kernels/dist/*.whl --verbose --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit

2025-12-06 06:45:42 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c set -eux; case "${TARGETPLATFORM}" in linux/arm64) UUARCH="aarch64" ;; linux/amd64) UUARCH="x64" ;; *) echo "Unsupported TARGETPLATFORM: ${TARGETPLATFORM}" >&2; exit 1 ;; esac; /tmp/install_gdrcopy.sh "${GDRCOPY_OS_VERSION}" "${GDRCOPY_CUDA_VERSION}" "${UUARCH}" # buildkit

2025-12-06 06:45:42 UTC (buildkit.dockerfile.v0)

ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib64:/usr/local/cuda/lib64:/usr/local/cuda/lib64

2025-12-06 06:45:42 UTC (buildkit.dockerfile.v0)

ARG TARGETPLATFORM

2025-12-06 06:45:42 UTC (buildkit.dockerfile.v0)

ARG INSTALL_KV_CONNECTORS=false

2025-12-06 06:45:42 UTC (buildkit.dockerfile.v0)

ARG PIP_INDEX_URL UV_INDEX_URL

2025-12-06 06:45:42 UTC (buildkit.dockerfile.v0)

ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL

2025-12-06 06:45:42 UTC (buildkit.dockerfile.v0)

ENV UV_HTTP_TIMEOUT=500

2025-12-06 06:45:54 UTC (buildkit.dockerfile.v0)

RUN |6 TARGETPLATFORM=linux/amd64 INSTALL_KV_CONNECTORS=true PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= /bin/bash -c if [ "$INSTALL_KV_CONNECTORS" = "true" ]; then uv pip install --system -r /tmp/kv_connectors.txt; fi; if [ "$TARGETPLATFORM" = "linux/arm64" ]; then BITSANDBYTES_VERSION="0.42.0"; else BITSANDBYTES_VERSION="0.46.1"; fi; uv pip install --system accelerate hf_transfer modelscope "bitsandbytes>=${BITSANDBYTES_VERSION}" 'timm>=1.0.17' 'runai-model-streamer[s3,gcs]>=0.15.3' # buildkit

2025-12-06 06:45:54 UTC (buildkit.dockerfile.v0)

ENV VLLM_USAGE_SOURCE=production-docker-image

2025-12-06 06:45:54 UTC (buildkit.dockerfile.v0)

ENTRYPOINT ["vllm" "serve"]

Details
Created

2025-12-06 06:46:06 UTC

Size

7.7 GB

Content Digest
Labels
  • maintainer
    NVIDIA CORPORATION <cudatools@nvidia.com>
  • org.opencontainers.image.ref.name
    ubuntu
  • org.opencontainers.image.version
    22.04

Environment
CUDA_VERSION

12.9.1

DEBIAN_FRONTEND

noninteractive

LD_LIBRARY_PATH

/usr/local/nvidia/lib64:/usr/local/cuda/lib64:/usr/local/cuda/lib64

NVARCH

sbsa

NVIDIA_DRIVER_CAPABILITIES

compute,utility

NVIDIA_REQUIRE_CUDA

cuda>=12.9 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566 brand=unknown,driver>=570,driver<571 brand=grid,driver>=570,driver<571 brand=tesla,driver>=570,driver<571 brand=nvidia,driver>=570,driver<571 brand=quadro,driver>=570,driver<571 brand=quadrortx,driver>=570,driver<571 brand=nvidiartx,driver>=570,driver<571 
brand=vapps,driver>=570,driver<571 brand=vpc,driver>=570,driver<571 brand=vcs,driver>=570,driver<571 brand=vws,driver>=570,driver<571 brand=cloudgaming,driver>=570,driver<571

NVIDIA_VISIBLE_DEVICES

all

NV_CUDA_CUDART_VERSION

12.9.79-1

PATH

/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

UV_HTTP_TIMEOUT

500

UV_INDEX_STRATEGY

unsafe-best-match

UV_LINK_MODE

copy

VLLM_USAGE_SOURCE

production-docker-image


Layers

[#000] sha256:2ea2730b4ab400d71167ddb8627f741637496aa57128fdfc248d6a9f799d76e9 - 0.34% (27.1 MB)

[#001] sha256:7aa2d0bb5c94f1cf869e71e4db856d2ca0733f5eaab55dd514441da9616abb35 - 0.06% (4.38 MB)

[#002] sha256:5136ae4e75ffd61960e9220c7d7625a3ee213ff63c25fdc24e85bfe229b16ab5 - 1.18% (93.1 MB)

[#003] sha256:6f760a753c5e1fc35281126d63b6ca9bef93e49f89a826a2bc2786e293d88f00 - 0.0% (182 Bytes)

[#004] sha256:6e8af4fd0a071982e528b634ba99dec2474c21147f99748be708f36e10e3f4c2 - 0.0% (6.72 KB)

[#005] sha256:157799cc72cfb22c4b5eff6d7e27c3f62f5d213cb4dd7875d5c3542cbfcda3ba - 0.0% (104 Bytes)

[#006] sha256:93f6be7b04731ff14ff5338c6fb15f6cd5066ccc1c0379ab8a848a6fa0859239 - 0.0% (231 Bytes)

[#007] sha256:2f94d60369c9707defad246b887d49bc208f11f9eefd60cb49d5f8856e5f443d - 2.59% (204 MB)

[#008] sha256:aef7d52538ad08674d12110e8fda0ad50dfbeb53ea86091ec79a77643be1d05e - 16.09% (1.24 GB)

[#009] sha256:1b0c2a76bb4789633524055dc60ffdb7de477e2295a07523882e4c98abe110f7 - 0.51% (40.4 MB)

[#010] sha256:cac672964b8f769da180ff77c3e7dbd3736b3fcb7f04c8bb88b888975966b794 - 0.0% (10.8 KB)

[#011] sha256:462cb93223e4c9428549ead7f4d4445ed3410f5cbfa76eafa7d06641a95a3609 - 58.23% (4.48 GB)

[#012] sha256:7895d9aa0f8aaff75f9287b08dc9037940bc66cd307b7a0458d1248c0c44d3d5 - 15.44% (1.19 GB)

[#013] sha256:ca2909093229fd398b4d9ad34b958884069127e7546e86ed22adbb30dfae5fea - 0.0% (189 KB)

[#014] sha256:3616b36cd27be9fef490370176725a62ae21c7768dbfe029c7a898132a30436a - 0.0% (169 KB)

[#015] sha256:a6e6d403761c1d923b55ad88344fa15775ed91e585318f00749059d1341eac2e - 0.0% (8.2 KB)

[#016] sha256:c12ce58d017c222cfccb010dd2362071c194081013c64fdb0f1291bb04273e85 - 0.0% (121 Bytes)

[#017] sha256:15487e4b91e7beca8a12dd1b77fdee4c363ac2e8cfd657dc36118a7f9bb2d540 - 0.09% (7.44 MB)

[#018] sha256:75d1c4e5e3cc774360f5af043adcbf5800c9b15c468448630b8dd2de15feb6fb - 1.14% (89.6 MB)

[#019] sha256:b38b65d92031064fe55f2b84edee1c230b97d7bf4a449cfcbbba6458ef6b4fc6 - 0.01% (522 KB)

[#020] sha256:74ceea412f0336ee69a0e0e81c2f9f8864980438a364251ca7ed0143c5523115 - 4.32% (341 MB)


History
2025-07-14 16:34:14 UTC

/bin/sh -c #(nop) ARG RELEASE

2025-07-14 16:34:14 UTC

/bin/sh -c #(nop) ARG LAUNCHPAD_BUILD_ARCH

2025-07-14 16:34:14 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.ref.name=ubuntu

2025-07-14 16:34:14 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.version=22.04

2025-07-14 16:34:16 UTC

/bin/sh -c #(nop) ADD file:834c1c2a4c7753a37759a9b21f64a990572643eee18669b1faa782fee45355ed in /

2025-07-14 16:34:17 UTC

/bin/sh -c #(nop) CMD ["/bin/bash"]

2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)

ENV NVARCH=sbsa

2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_REQUIRE_CUDA=cuda>=12.9 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566 brand=unknown,driver>=570,driver<571 brand=grid,driver>=570,driver<571 brand=tesla,driver>=570,driver<571 brand=nvidia,driver>=570,driver<571 brand=quadro,driver>=570,driver<571 brand=quadrortx,driver>=570,driver<571 
brand=nvidiartx,driver>=570,driver<571 brand=vapps,driver>=570,driver<571 brand=vpc,driver>=570,driver<571 brand=vcs,driver>=570,driver<571 brand=vws,driver>=570,driver<571 brand=cloudgaming,driver>=570,driver<571

2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_CUDART_VERSION=12.9.79-1

2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=arm64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.1-1_all.deb && dpkg -i cuda-keyring_1.1-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit

2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)

ENV CUDA_VERSION=12.9.1

2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=arm64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-9=${NV_CUDA_CUDART_VERSION} cuda-compat-12-9 && rm -rf /var/lib/apt/lists/* # buildkit

2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=arm64 /bin/sh -c echo "/usr/local/cuda/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit

2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)

ENV PATH=/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)

ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64

2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)

COPY NGC-DL-CONTAINER-LICENSE / # buildkit

2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_VISIBLE_DEVICES=all

2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility

2025-12-06 06:13:08 UTC (buildkit.dockerfile.v0)

ARG CUDA_VERSION

2025-12-06 06:13:08 UTC (buildkit.dockerfile.v0)

ARG PYTHON_VERSION

2025-12-06 06:13:08 UTC (buildkit.dockerfile.v0)

ARG INSTALL_KV_CONNECTORS=false

2025-12-06 06:13:08 UTC (buildkit.dockerfile.v0)

WORKDIR /vllm-workspace

2025-12-06 06:13:08 UTC (buildkit.dockerfile.v0)

ENV DEBIAN_FRONTEND=noninteractive

2025-12-06 06:13:08 UTC (buildkit.dockerfile.v0)

ARG TARGETPLATFORM

2025-12-06 06:13:08 UTC (buildkit.dockerfile.v0)

ARG GDRCOPY_CUDA_VERSION=12.8

2025-12-06 06:13:08 UTC (buildkit.dockerfile.v0)

ARG GDRCOPY_OS_VERSION=Ubuntu22_04

2025-12-06 06:13:08 UTC (buildkit.dockerfile.v0)

SHELL [/bin/bash -c]

2025-12-06 06:13:08 UTC (buildkit.dockerfile.v0)

ARG DEADSNAKES_MIRROR_URL

2025-12-06 06:13:08 UTC (buildkit.dockerfile.v0)

ARG DEADSNAKES_GPGKEY_URL

2025-12-06 06:13:08 UTC (buildkit.dockerfile.v0)

ARG GET_PIP_URL

2025-12-06 06:14:10 UTC (buildkit.dockerfile.v0)

RUN |9 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/bash -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit

2025-12-06 06:17:59 UTC (buildkit.dockerfile.v0)

RUN |9 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/bash -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y --no-install-recommends software-properties-common curl sudo python3-pip ffmpeg libsm6 libxext6 libgl1 && if [ ! -z ${DEADSNAKES_MIRROR_URL} ] ; then if [ ! -z "${DEADSNAKES_GPGKEY_URL}" ] ; then mkdir -p -m 0755 /etc/apt/keyrings ; curl -L ${DEADSNAKES_GPGKEY_URL} | gpg --dearmor > /etc/apt/keyrings/deadsnakes.gpg ; sudo chmod 644 /etc/apt/keyrings/deadsnakes.gpg ; echo "deb [signed-by=/etc/apt/keyrings/deadsnakes.gpg] ${DEADSNAKES_MIRROR_URL} $(lsb_release -cs) main" > /etc/apt/sources.list.d/deadsnakes.list ; fi ; else for i in 1 2 3; do add-apt-repository -y ppa:deadsnakes/ppa && break || { echo "Attempt $i failed, retrying in 5s..."; sleep 5; }; done ; fi && apt-get update -y && apt-get install -y --no-install-recommends python${PYTHON_VERSION} python${PYTHON_VERSION}-dev python${PYTHON_VERSION}-venv libibverbs-dev && rm -rf /var/lib/apt/lists/* && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PYTHON_VERSION} 1 && update-alternatives --set python3 /usr/bin/python${PYTHON_VERSION} && ln -sf /usr/bin/python${PYTHON_VERSION}-config /usr/bin/python3-config && curl -sS ${GET_PIP_URL} | python${PYTHON_VERSION} && python3 --version && python3 -m pip --version # buildkit

2025-12-06 06:19:05 UTC (buildkit.dockerfile.v0)

RUN |9 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/bash -c CUDA_VERSION_DASH=$(echo $CUDA_VERSION | cut -d. -f1,2 | tr '.' '-') && apt-get update -y && apt-get install -y --no-install-recommends cuda-nvcc-${CUDA_VERSION_DASH} cuda-cudart-${CUDA_VERSION_DASH} cuda-nvrtc-${CUDA_VERSION_DASH} cuda-cuobjdump-${CUDA_VERSION_DASH} libcurand-dev-${CUDA_VERSION_DASH} libcublas-${CUDA_VERSION_DASH} libnccl-dev && rm -rf /var/lib/apt/lists/* # buildkit

2025-12-06 06:19:05 UTC (buildkit.dockerfile.v0)

ARG PIP_INDEX_URL UV_INDEX_URL

2025-12-06 06:19:05 UTC (buildkit.dockerfile.v0)

ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL

2025-12-06 06:19:05 UTC (buildkit.dockerfile.v0)

ARG PYTORCH_CUDA_INDEX_BASE_URL

2025-12-06 06:19:05 UTC (buildkit.dockerfile.v0)

ARG PIP_KEYRING_PROVIDER UV_KEYRING_PROVIDER

2025-12-06 06:19:07 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c python3 -m pip install uv # buildkit

2025-12-06 06:19:07 UTC (buildkit.dockerfile.v0)

ENV UV_HTTP_TIMEOUT=500

2025-12-06 06:19:07 UTC (buildkit.dockerfile.v0)

ENV UV_INDEX_STRATEGY=unsafe-best-match

2025-12-06 06:19:07 UTC (buildkit.dockerfile.v0)

ENV UV_LINK_MODE=copy

2025-12-06 06:19:08 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit

2025-12-06 06:43:27 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c uv pip install --system dist/*.whl --verbose --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit

2025-12-06 06:45:20 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c uv pip install --system flashinfer-cubin==0.5.3 && uv pip install --system flashinfer-jit-cache==0.5.3 --extra-index-url https://flashinfer.ai/whl/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') && flashinfer show-config # buildkit

2025-12-06 06:45:21 UTC (buildkit.dockerfile.v0)

COPY examples examples # buildkit

2025-12-06 06:45:21 UTC (buildkit.dockerfile.v0)

COPY benchmarks benchmarks # buildkit

2025-12-06 06:45:21 UTC (buildkit.dockerfile.v0)

COPY ./vllm/collect_env.py . # buildkit

2025-12-06 06:45:21 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c . /etc/environment && uv pip list # buildkit

2025-12-06 06:45:22 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c sh -c 'if ls /tmp/deepgemm/dist/*.whl >/dev/null 2>&1; then uv pip install --system /tmp/deepgemm/dist/*.whl; else echo "No DeepGEMM wheels to install; skipping."; fi' # buildkit

2025-12-06 06:45:22 UTC (buildkit.dockerfile.v0)

ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64:/usr/local/cuda/lib64

2025-12-06 06:45:25 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c uv pip install --system ep_kernels/dist/*.whl --verbose --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit

2025-12-06 06:45:38 UTC (buildkit.dockerfile.v0)

RUN |16 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c set -eux; case "${TARGETPLATFORM}" in linux/arm64) UUARCH="aarch64" ;; linux/amd64) UUARCH="x64" ;; *) echo "Unsupported TARGETPLATFORM: ${TARGETPLATFORM}" >&2; exit 1 ;; esac; /tmp/install_gdrcopy.sh "${GDRCOPY_OS_VERSION}" "${GDRCOPY_CUDA_VERSION}" "${UUARCH}" # buildkit

2025-12-06 06:45:38 UTC (buildkit.dockerfile.v0)

ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib64:/usr/local/cuda/lib64:/usr/local/cuda/lib64

2025-12-06 06:45:38 UTC (buildkit.dockerfile.v0)

ARG TARGETPLATFORM

2025-12-06 06:45:38 UTC (buildkit.dockerfile.v0)

ARG INSTALL_KV_CONNECTORS=false

2025-12-06 06:45:38 UTC (buildkit.dockerfile.v0)

ARG PIP_INDEX_URL UV_INDEX_URL

2025-12-06 06:45:38 UTC (buildkit.dockerfile.v0)

ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL

2025-12-06 06:45:38 UTC (buildkit.dockerfile.v0)

ENV UV_HTTP_TIMEOUT=500

2025-12-06 06:46:06 UTC (buildkit.dockerfile.v0)

RUN |6 TARGETPLATFORM=linux/arm64 INSTALL_KV_CONNECTORS=true PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= /bin/bash -c if [ "$INSTALL_KV_CONNECTORS" = "true" ]; then uv pip install --system -r /tmp/kv_connectors.txt; fi; if [ "$TARGETPLATFORM" = "linux/arm64" ]; then BITSANDBYTES_VERSION="0.42.0"; else BITSANDBYTES_VERSION="0.46.1"; fi; uv pip install --system accelerate hf_transfer modelscope "bitsandbytes>=${BITSANDBYTES_VERSION}" 'timm>=1.0.17' 'runai-model-streamer[s3,gcs]>=0.15.3' # buildkit

2025-12-06 06:46:06 UTC (buildkit.dockerfile.v0)

ENV VLLM_USAGE_SOURCE=production-docker-image

2025-12-06 06:46:06 UTC (buildkit.dockerfile.v0)

ENTRYPOINT ["vllm" "serve"]

Danger Zone
Delete Tag

Please be careful: this will delete not only the tag reference but also the actual image content!

For example, when you have "latest" and "v1.2.3" both pointing to the same image,
deleting "latest" will also permanently remove "v1.2.3".

Delete