2025-10-03 22:45:54 UTC
11.6 GB
/usr/local/cuda
CUDA_VERSION12.8.1
DEBIAN_FRONTENDnoninteractive
LD_LIBRARY_PATH/usr/local/cuda/lib64
LIBRARY_PATH/usr/local/cuda/lib64/stubs
NCCL_VERSION2.25.1-1
NVARCHx86_64
NVIDIA_DRIVER_CAPABILITIEScompute,utility
NVIDIA_PRODUCT_NAMECUDA
NVIDIA_REQUIRE_CUDAcuda>=12.8 brand=unknown,driver>=470,driver<471 brand=grid,driver>=470,driver<471 brand=tesla,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=vapps,driver>=470,driver<471 brand=vpc,driver>=470,driver<471 brand=vcs,driver>=470,driver<471 brand=vws,driver>=470,driver<471 brand=cloudgaming,driver>=470,driver<471 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566
NVIDIA_VISIBLE_DEVICESall
NV_CUDA_CUDART_DEV_VERSION12.8.90-1
NV_CUDA_CUDART_VERSION12.8.90-1
NV_CUDA_LIB_VERSION12.8.1-1
NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGEcuda-nsight-compute-12-8=12.8.1-1
NV_CUDA_NSIGHT_COMPUTE_VERSION12.8.1-1
NV_LIBCUBLAS_DEV_PACKAGElibcublas-dev-12-8=12.8.4.1-1
NV_LIBCUBLAS_DEV_PACKAGE_NAMElibcublas-dev-12-8
NV_LIBCUBLAS_DEV_VERSION12.8.4.1-1
NV_LIBCUBLAS_PACKAGElibcublas-12-8=12.8.4.1-1
NV_LIBCUBLAS_PACKAGE_NAMElibcublas-12-8
NV_LIBCUBLAS_VERSION12.8.4.1-1
NV_LIBCUSPARSE_DEV_VERSION12.5.8.93-1
NV_LIBCUSPARSE_VERSION12.5.8.93-1
NV_LIBNCCL_DEV_PACKAGElibnccl-dev=2.25.1-1+cuda12.8
NV_LIBNCCL_DEV_PACKAGE_NAMElibnccl-dev
NV_LIBNCCL_DEV_PACKAGE_VERSION2.25.1-1
NV_LIBNCCL_PACKAGElibnccl2=2.25.1-1+cuda12.8
NV_LIBNCCL_PACKAGE_NAMElibnccl2
NV_LIBNCCL_PACKAGE_VERSION2.25.1-1
NV_LIBNPP_DEV_PACKAGElibnpp-dev-12-8=12.3.3.100-1
NV_LIBNPP_DEV_VERSION12.3.3.100-1
NV_LIBNPP_PACKAGElibnpp-12-8=12.3.3.100-1
NV_LIBNPP_VERSION12.3.3.100-1
NV_NVML_DEV_VERSION12.8.90-1
NV_NVPROF_DEV_PACKAGEcuda-nvprof-12-8=12.8.90-1
NV_NVPROF_VERSION12.8.90-1
NV_NVTX_VERSION12.8.90-1
PATH/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
UV_HTTP_TIMEOUT500
UV_INDEX_STRATEGYunsafe-best-match
UV_LINK_MODEcopy
VLLM_USAGE_SOURCEproduction-docker-image
[#000] sha256:8f84a9f2102e97a4a6bf673b150fc9894df5acc9618ad3484c6c36f768c1caa0 - 0.24% (29 MB)
[#001] sha256:b95112eaf2836b9c7193858419f6d17933a873c4a2c9227dc497f5e090ea9c87 - 0.04% (4.42 MB)
[#002] sha256:030ef82509363afebdc78482e6f8c07f2bc8b65a45caf082c2a9a621c7deae63 - 0.52% (61.3 MB)
[#003] sha256:72ac9ccfda38d144ef8e3aadbd5851e7fa9aacd261f8e15d7365db0f816d3433 - 0.0% (186 Bytes)
[#004] sha256:73389fbd088f5ed5d9fd258baced59de092978b4f483920ea6d074522a105119 - 0.0% (6.72 KB)
[#005] sha256:0264850675f7464ed6385d030d281ffb0f2037323c73511a5372948c1c69d92c - 16.52% (1.92 GB)
[#006] sha256:de1d03310308c2871217cf179589d5e7fcd8eee31d8f331b61041347f50404a0 - 0.0% (62.6 KB)
[#007] sha256:c1d2af7fad0f1c6cdaf09c568c086019e834bc6523c30aa9b2b0b24c4b782086 - 0.0% (1.64 KB)
[#008] sha256:5601308b3ac642f7df8b1dc62b9582abdd34857eec6190bcb50162abc5719226 - 0.0% (1.49 KB)
[#009] sha256:6b2035e8b73ed2b018995a7b2c8d607d5527daf948d41964f02cc3ce7ed0699a - 24.0% (2.78 GB)
[#010] sha256:ed71f8f81b33b96e7112757f6828a6dcb0861026aa63c5edc672d13e11045f6d - 0.0% (86.8 KB)
[#011] sha256:dee27977c61a88e0c96530b24952e3cc522f0e869cd855920b5be7cc328fec20 - 0.0% (104 Bytes)
[#012] sha256:36b282865c6a94eb29d4459d94499fcada34c41848910acccb85bbb804dc1541 - 0.0% (230 Bytes)
[#013] sha256:a18a28c84f90b30febe85796790d0a26756a05e7c82b37c03fae219ddc6473d7 - 2.72% (323 MB)
[#014] sha256:f3f6e18150285edf96d401a0936cac0df7ad48bdf6fa2489d438f9d46eeeae65 - 0.35% (41.4 MB)
[#015] sha256:7371fb04cbd5996a56a22aee95360c494c12c1d3a01c177e3beed5cd25c61b25 - 0.0% (12.9 KB)
[#016] sha256:a62c67a7991a65e8ab2e27a6688c2436fd30944c09c32442b9c9e857f9a95d87 - 0.0% (120 Bytes)
[#017] sha256:edc84132aa9ee096a305f08d621701a3618cfa931631f3c4edc842086b6ba86f - 39.63% (4.6 GB)
[#018] sha256:492aaf546a43c8ad23544f286d0e8844de5453293ae9490ff0e1dd5d8e1275d0 - 10.06% (1.17 GB)
[#019] sha256:422b8cb1546346a9a54935d4c8a3bc5cec8efae75da6970955bb9b0f70cea173 - 0.0% (173 KB)
[#020] sha256:20b045626669d0a15d99c406e1a233f573a568f2bd3ad91d1725a75841b03b67 - 0.0% (149 KB)
[#021] sha256:8560373878f54cb596afaac707495ef01cbda1afbfb610d44b2bdaaea6e95239 - 0.0% (8.25 KB)
[#022] sha256:f007d729f4ec361df45fd1a920e9ba36d51383906917d65e93b8de52bbc5ad1c - 0.0% (122 Bytes)
[#023] sha256:220f3f1968ebbc7411b2e04cbfd0ee647fb063582e678f16de4f7a93ff2ecb69 - 0.0% (299 Bytes)
[#024] sha256:7ba297322f59e6f92c9f78ceff52650af6f7f425b89191e827e92c380165a76d - 0.23% (27.7 MB)
[#025] sha256:a688b0cde5470df35f711a5d74a1ac8238853cf68f31c04e8833abf6cf26bf54 - 0.0% (1.44 KB)
[#026] sha256:4647c4903cc1570ec559b700dfc66060c292e4341bc0c1031792da3159de2628 - 0.06% (7.33 MB)
[#027] sha256:e10440dc188e76436816515c76b11a041221ae79ec728fe8c413840d8b4e3768 - 0.0% (906 Bytes)
[#028] sha256:f641668ae021722d040f5c4d4b17cdb6a45afd909dfdda3146c857704d52a264 - 0.0% (573 KB)
[#029] sha256:4f18eae8775e3c223a07ed264eff9934e90603d19fd42b32265fc23f588739c2 - 0.0% (1.51 KB)
[#030] sha256:4c3d87fb42962673d7da8724df8b676076987fd439f239e574cc5c10b65cf968 - 4.64% (551 MB)
[#031] sha256:78b596bcad084e478fb58f5960bb51af74e3da6944160f49fc3bcb480377a811 - 0.0% (236 Bytes)
[#032] sha256:6a16eaeb9de9240bd3d81dc87fd4d2d5060f5374bdc709206ecedb33da21af22 - 0.98% (116 MB)
/bin/sh -c #(nop) ARG RELEASE
2025-01-26 05:31:07 UTC/bin/sh -c #(nop) ARG LAUNCHPAD_BUILD_ARCH
2025-01-26 05:31:07 UTC/bin/sh -c #(nop) LABEL org.opencontainers.image.ref.name=ubuntu
2025-01-26 05:31:07 UTC/bin/sh -c #(nop) LABEL org.opencontainers.image.version=22.04
2025-01-26 05:31:10 UTC/bin/sh -c #(nop) ADD file:1b6c8c9518be42fa2afe5e241ca31677fce58d27cdfa88baa91a65a259be3637 in /
2025-01-26 05:31:11 UTC/bin/sh -c #(nop) CMD ["/bin/bash"]
2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)ENV NVARCH=x86_64
2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)ENV NVIDIA_REQUIRE_CUDA=cuda>=12.8 brand=unknown,driver>=470,driver<471 brand=grid,driver>=470,driver<471 brand=tesla,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=vapps,driver>=470,driver<471 brand=vpc,driver>=470,driver<471 brand=vcs,driver>=470,driver<471 brand=vws,driver>=470,driver<471 brand=cloudgaming,driver>=470,driver<471 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566
2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_CUDART_VERSION=12.8.90-1
2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)ARG TARGETARCH
2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.1-1_all.deb && dpkg -i cuda-keyring_1.1-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit
2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)ENV CUDA_VERSION=12.8.1
2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-8=${NV_CUDA_CUDART_VERSION} cuda-compat-12-8 && rm -rf /var/lib/apt/lists/* # buildkit
2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/cuda/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit
2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)ENV PATH=/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64
2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)COPY NGC-DL-CONTAINER-LICENSE / # buildkit
2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)ENV NVIDIA_VISIBLE_DEVICES=all
2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_LIB_VERSION=12.8.1-1
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENV NV_NVTX_VERSION=12.8.90-1
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENV NV_LIBNPP_VERSION=12.3.3.100-1
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENV NV_LIBNPP_PACKAGE=libnpp-12-8=12.3.3.100-1
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUSPARSE_VERSION=12.5.8.93-1
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_PACKAGE_NAME=libcublas-12-8
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_VERSION=12.8.4.1-1
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_PACKAGE=libcublas-12-8=12.8.4.1-1
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_PACKAGE_NAME=libnccl2
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_PACKAGE_VERSION=2.25.1-1
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENV NCCL_VERSION=2.25.1-1
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_PACKAGE=libnccl2=2.25.1-1+cuda12.8
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ARG TARGETARCH
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-libraries-12-8=${NV_CUDA_LIB_VERSION} ${NV_LIBNPP_PACKAGE} cuda-nvtx-12-8=${NV_NVTX_VERSION} libcusparse-12-8=${NV_LIBCUSPARSE_VERSION} ${NV_LIBCUBLAS_PACKAGE} ${NV_LIBNCCL_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_PACKAGE_NAME} ${NV_LIBNCCL_PACKAGE_NAME} # buildkit
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)COPY entrypoint.d/ /opt/nvidia/entrypoint.d/ # buildkit
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)COPY nvidia_entrypoint.sh /opt/nvidia/ # buildkit
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENV NVIDIA_PRODUCT_NAME=CUDA
2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"]
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_LIB_VERSION=12.8.1-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_CUDART_DEV_VERSION=12.8.90-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_NVML_DEV_VERSION=12.8.90-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUSPARSE_DEV_VERSION=12.5.8.93-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_LIBNPP_DEV_VERSION=12.3.3.100-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_LIBNPP_DEV_PACKAGE=libnpp-dev-12-8=12.3.3.100-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_DEV_VERSION=12.8.4.1-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_DEV_PACKAGE_NAME=libcublas-dev-12-8
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_DEV_PACKAGE=libcublas-dev-12-8=12.8.4.1-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_NSIGHT_COMPUTE_VERSION=12.8.1-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE=cuda-nsight-compute-12-8=12.8.1-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_NVPROF_VERSION=12.8.90-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_NVPROF_DEV_PACKAGE=cuda-nvprof-12-8=12.8.90-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_DEV_PACKAGE_NAME=libnccl-dev
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_DEV_PACKAGE_VERSION=2.25.1-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NCCL_VERSION=2.25.1-1
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_DEV_PACKAGE=libnccl-dev=2.25.1-1+cuda12.8
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ARG TARGETARCH
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-dev-12-8=${NV_CUDA_CUDART_DEV_VERSION} cuda-command-line-tools-12-8=${NV_CUDA_LIB_VERSION} cuda-minimal-build-12-8=${NV_CUDA_LIB_VERSION} cuda-libraries-dev-12-8=${NV_CUDA_LIB_VERSION} cuda-nvml-dev-12-8=${NV_NVML_DEV_VERSION} ${NV_NVPROF_DEV_PACKAGE} ${NV_LIBNPP_DEV_PACKAGE} libcusparse-dev-12-8=${NV_LIBCUSPARSE_DEV_VERSION} ${NV_LIBCUBLAS_DEV_PACKAGE} ${NV_LIBNCCL_DEV_PACKAGE} ${NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_DEV_PACKAGE_NAME} ${NV_LIBNCCL_DEV_PACKAGE_NAME} # buildkit
2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)ENV LIBRARY_PATH=/usr/local/cuda/lib64/stubs
2025-10-03 21:08:23 UTC (buildkit.dockerfile.v0)ARG CUDA_VERSION
2025-10-03 21:08:23 UTC (buildkit.dockerfile.v0)ARG PYTHON_VERSION
2025-10-03 21:08:23 UTC (buildkit.dockerfile.v0)ARG INSTALL_KV_CONNECTORS=false
2025-10-03 21:08:23 UTC (buildkit.dockerfile.v0)WORKDIR /vllm-workspace
2025-10-03 21:08:23 UTC (buildkit.dockerfile.v0)ENV DEBIAN_FRONTEND=noninteractive
2025-10-03 21:08:23 UTC (buildkit.dockerfile.v0)ARG TARGETPLATFORM
2025-10-03 21:08:23 UTC (buildkit.dockerfile.v0)ARG GDRCOPY_CUDA_VERSION=12.8
2025-10-03 21:08:23 UTC (buildkit.dockerfile.v0)ARG GDRCOPY_OS_VERSION=Ubuntu22_04
2025-10-03 21:08:23 UTC (buildkit.dockerfile.v0)SHELL [/bin/bash -c]
2025-10-03 21:08:23 UTC (buildkit.dockerfile.v0)ARG DEADSNAKES_MIRROR_URL
2025-10-03 21:08:23 UTC (buildkit.dockerfile.v0)ARG DEADSNAKES_GPGKEY_URL
2025-10-03 21:08:23 UTC (buildkit.dockerfile.v0)ARG GET_PIP_URL
2025-10-03 21:08:24 UTC (buildkit.dockerfile.v0)RUN |9 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/bash -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit
2025-10-03 21:12:16 UTC (buildkit.dockerfile.v0)RUN |9 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/bash -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y ccache software-properties-common git curl wget sudo vim python3-pip && apt-get install -y ffmpeg libsm6 libxext6 libgl1 && if [ ! -z ${DEADSNAKES_MIRROR_URL} ] ; then if [ ! -z "${DEADSNAKES_GPGKEY_URL}" ] ; then mkdir -p -m 0755 /etc/apt/keyrings ; curl -L ${DEADSNAKES_GPGKEY_URL} | gpg --dearmor > /etc/apt/keyrings/deadsnakes.gpg ; sudo chmod 644 /etc/apt/keyrings/deadsnakes.gpg ; echo "deb [signed-by=/etc/apt/keyrings/deadsnakes.gpg] ${DEADSNAKES_MIRROR_URL} $(lsb_release -cs) main" > /etc/apt/sources.list.d/deadsnakes.list ; fi ; else for i in 1 2 3; do add-apt-repository -y ppa:deadsnakes/ppa && break || { echo "Attempt $i failed, retrying in 5s..."; sleep 5; }; done ; fi && apt-get update -y && apt-get install -y python${PYTHON_VERSION} python${PYTHON_VERSION}-dev python${PYTHON_VERSION}-venv libibverbs-dev && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PYTHON_VERSION} 1 && update-alternatives --set python3 /usr/bin/python${PYTHON_VERSION} && ln -sf /usr/bin/python${PYTHON_VERSION}-config /usr/bin/python3-config && curl -sS ${GET_PIP_URL} | python${PYTHON_VERSION} && python3 --version && python3 -m pip --version # buildkit
2025-10-03 21:12:16 UTC (buildkit.dockerfile.v0)ARG PIP_INDEX_URL UV_INDEX_URL
2025-10-03 21:12:16 UTC (buildkit.dockerfile.v0)ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL
2025-10-03 21:12:16 UTC (buildkit.dockerfile.v0)ARG PYTORCH_CUDA_INDEX_BASE_URL
2025-10-03 21:12:16 UTC (buildkit.dockerfile.v0)ARG PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL
2025-10-03 21:12:16 UTC (buildkit.dockerfile.v0)ARG PIP_KEYRING_PROVIDER UV_KEYRING_PROVIDER
2025-10-03 21:12:18 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c python3 -m pip install uv # buildkit
2025-10-03 21:12:18 UTC (buildkit.dockerfile.v0)ENV UV_HTTP_TIMEOUT=500
2025-10-03 21:12:18 UTC (buildkit.dockerfile.v0)ENV UV_INDEX_STRATEGY=unsafe-best-match
2025-10-03 21:12:18 UTC (buildkit.dockerfile.v0)ENV UV_LINK_MODE=copy
2025-10-03 21:12:18 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit
2025-10-03 21:12:19 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c if [ "$TARGETPLATFORM" = "linux/arm64" ]; then uv pip install --system --index-url ${PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') "torch==2.8.0.dev20250318+cu128" "torchvision==0.22.0.dev20250319" ; uv pip install --system --index-url ${PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') --pre pytorch_triton==3.3.0+gitab727c40 ; fi # buildkit
2025-10-03 21:28:07 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c uv pip install --system dist/*.whl --verbose --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit
2025-10-03 21:28:07 UTC (buildkit.dockerfile.v0)ARG FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git
2025-10-03 21:28:07 UTC (buildkit.dockerfile.v0)ARG FLASHINFER_GIT_REF=v0.3.1
2025-10-03 21:28:07 UTC (buildkit.dockerfile.v0)ARG FLASHINFER_AOT_COMPILE=false
2025-10-03 22:39:14 UTC (buildkit.dockerfile.v0)RUN |20 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.3.1 FLASHINFER_AOT_COMPILE=true /bin/bash -c bash - <<'BASH' . /etc/environment git clone --depth 1 --recursive --shallow-submodules \ --branch ${FLASHINFER_GIT_REF} \ ${FLASHINFER_GIT_REPO} flashinfer pushd flashinfer if [ "${FLASHINFER_AOT_COMPILE}" = "true" ]; then # Exclude CUDA arches for older versions (11.x and 12.0-12.7) # TODO: Update this to allow setting TORCH_CUDA_ARCH_LIST as a build arg. if [[ "${CUDA_VERSION}" == 11.* ]]; then FI_TORCH_CUDA_ARCH_LIST="7.5 8.0 8.9" elif [[ "${CUDA_VERSION}" == 12.[0-7]* ]]; then FI_TORCH_CUDA_ARCH_LIST="7.5 8.0 8.9 9.0a" else # CUDA 12.8+ supports 10.0a and 12.0 FI_TORCH_CUDA_ARCH_LIST="7.5 8.0 8.9 9.0a 10.0a 12.0" fi echo "🏗️ Installing FlashInfer with AOT compilation for arches: ${FI_TORCH_CUDA_ARCH_LIST}" export FLASHINFER_CUDA_ARCH_LIST="${FI_TORCH_CUDA_ARCH_LIST}" # HACK: We need these to run flashinfer.aot before installing flashinfer, get from the package in the future uv pip install --system cuda-python==$(echo $CUDA_VERSION | cut -d. -f1,2) pynvml==$(echo $CUDA_VERSION | cut -d. -f1) nvidia-nvshmem-cu$(echo $CUDA_VERSION | cut -d. -f1) # Build AOT kernels TORCH_CUDA_ARCH_LIST="${FI_TORCH_CUDA_ARCH_LIST}" \ python3 -m flashinfer.aot # Install with no-build-isolation since we already built AOT kernels TORCH_CUDA_ARCH_LIST="${FI_TORCH_CUDA_ARCH_LIST}" \ uv pip install --system --no-build-isolation . \ --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # Download pre-compiled cubins TORCH_CUDA_ARCH_LIST="${FI_TORCH_CUDA_ARCH_LIST}" \ python3 -m flashinfer --download-cubin || echo "WARNING: Failed to download flashinfer cubins." else echo "🏗️ Installing FlashInfer without AOT compilation in JIT mode" uv pip install --system . \ --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') fi popd rm -rf flashinfer BASH # buildkit
2025-10-03 22:39:14 UTC (buildkit.dockerfile.v0)COPY examples examples # buildkit
2025-10-03 22:39:14 UTC (buildkit.dockerfile.v0)COPY benchmarks benchmarks # buildkit
2025-10-03 22:39:14 UTC (buildkit.dockerfile.v0)COPY ./vllm/collect_env.py . # buildkit
2025-10-03 22:39:14 UTC (buildkit.dockerfile.v0)RUN |20 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.3.1 FLASHINFER_AOT_COMPILE=true /bin/bash -c . /etc/environment && uv pip list # buildkit
2025-10-03 22:39:14 UTC (buildkit.dockerfile.v0)COPY requirements/build.txt requirements/build.txt # buildkit
2025-10-03 22:39:16 UTC (buildkit.dockerfile.v0)RUN |20 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.3.1 FLASHINFER_AOT_COMPILE=true /bin/bash -c uv pip install --system -r requirements/build.txt --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit
2025-10-03 22:39:16 UTC (buildkit.dockerfile.v0)ARG DEEPGEMM_GIT_REF
2025-10-03 22:39:16 UTC (buildkit.dockerfile.v0)COPY tools/install_deepgemm.sh /tmp/install_deepgemm.sh # buildkit
2025-10-03 22:40:02 UTC (buildkit.dockerfile.v0)RUN |21 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.3.1 FLASHINFER_AOT_COMPILE=true DEEPGEMM_GIT_REF= /bin/bash -c VLLM_DOCKER_BUILD_CONTEXT=1 /tmp/install_deepgemm.sh --cuda-version "${CUDA_VERSION}" ${DEEPGEMM_GIT_REF:+--ref "$DEEPGEMM_GIT_REF"} # buildkit
2025-10-03 22:40:02 UTC (buildkit.dockerfile.v0)COPY tools/install_gdrcopy.sh install_gdrcopy.sh # buildkit
2025-10-03 22:40:07 UTC (buildkit.dockerfile.v0)RUN |21 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.3.1 FLASHINFER_AOT_COMPILE=true DEEPGEMM_GIT_REF= /bin/bash -c set -eux; case "${TARGETPLATFORM}" in linux/arm64) UUARCH="aarch64" ;; linux/amd64) UUARCH="x64" ;; *) echo "Unsupported TARGETPLATFORM: ${TARGETPLATFORM}" >&2; exit 1 ;; esac; ./install_gdrcopy.sh "${GDRCOPY_OS_VERSION}" "${GDRCOPY_CUDA_VERSION}" "${UUARCH}"; rm ./install_gdrcopy.sh # buildkit
2025-10-03 22:40:07 UTC (buildkit.dockerfile.v0)COPY tools/ep_kernels/install_python_libraries.sh install_python_libraries.sh # buildkit
2025-10-03 22:40:07 UTC (buildkit.dockerfile.v0)ENV CUDA_HOME=/usr/local/cuda
2025-10-03 22:45:45 UTC (buildkit.dockerfile.v0)RUN |21 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.3.1 FLASHINFER_AOT_COMPILE=true DEEPGEMM_GIT_REF= /bin/bash -c export TORCH_CUDA_ARCH_LIST="${TORCH_CUDA_ARCH_LIST:-9.0a+PTX}" && bash install_python_libraries.sh # buildkit
2025-10-03 22:45:45 UTC (buildkit.dockerfile.v0)ARG TARGETPLATFORM
2025-10-03 22:45:45 UTC (buildkit.dockerfile.v0)ARG INSTALL_KV_CONNECTORS=false
2025-10-03 22:45:45 UTC (buildkit.dockerfile.v0)ARG PIP_INDEX_URL UV_INDEX_URL
2025-10-03 22:45:45 UTC (buildkit.dockerfile.v0)ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL
2025-10-03 22:45:45 UTC (buildkit.dockerfile.v0)ENV UV_HTTP_TIMEOUT=500
2025-10-03 22:45:45 UTC (buildkit.dockerfile.v0)COPY requirements/kv_connectors.txt requirements/kv_connectors.txt # buildkit
2025-10-03 22:45:54 UTC (buildkit.dockerfile.v0)RUN |6 TARGETPLATFORM=linux/amd64 INSTALL_KV_CONNECTORS=true PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= /bin/bash -c if [ "$INSTALL_KV_CONNECTORS" = "true" ]; then uv pip install --system -r requirements/kv_connectors.txt; fi; if [ "$TARGETPLATFORM" = "linux/arm64" ]; then BITSANDBYTES_VERSION="0.42.0"; else BITSANDBYTES_VERSION="0.46.1"; fi; uv pip install --system accelerate hf_transfer modelscope "bitsandbytes>=${BITSANDBYTES_VERSION}" 'timm>=1.0.17' boto3 runai-model-streamer runai-model-streamer[s3] # buildkit
2025-10-03 22:45:54 UTC (buildkit.dockerfile.v0)ENV VLLM_USAGE_SOURCE=production-docker-image
2025-10-03 22:45:54 UTC (buildkit.dockerfile.v0)ENTRYPOINT ["python3" "-m" "vllm.entrypoints.openai.api_server"]
2025-10-03 22:45:44 UTC
11.3 GB
/usr/local/cuda
CUDA_VERSION12.9.1
DEBIAN_FRONTENDnoninteractive
LD_LIBRARY_PATH/usr/local/cuda/lib64
LIBRARY_PATH/usr/local/cuda/lib64/stubs
NCCL_VERSION2.27.3-1
NVARCHsbsa
NVIDIA_DRIVER_CAPABILITIEScompute,utility
NVIDIA_PRODUCT_NAMECUDA
NVIDIA_REQUIRE_CUDAcuda>=12.9 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566 brand=unknown,driver>=570,driver<571 brand=grid,driver>=570,driver<571 brand=tesla,driver>=570,driver<571 brand=nvidia,driver>=570,driver<571 brand=quadro,driver>=570,driver<571 brand=quadrortx,driver>=570,driver<571 brand=nvidiartx,driver>=570,driver<571 brand=vapps,driver>=570,driver<571 brand=vpc,driver>=570,driver<571 brand=vcs,driver>=570,driver<571 brand=vws,driver>=570,driver<571 brand=cloudgaming,driver>=570,driver<571
NVIDIA_VISIBLE_DEVICESall
NV_CUDA_CUDART_DEV_VERSION12.9.79-1
NV_CUDA_CUDART_VERSION12.9.79-1
NV_CUDA_LIB_VERSION12.9.1-1
NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGEcuda-nsight-compute-12-9=12.9.1-1
NV_CUDA_NSIGHT_COMPUTE_VERSION12.9.1-1
NV_LIBCUBLAS_DEV_PACKAGElibcublas-dev-12-9=12.9.1.4-1
NV_LIBCUBLAS_DEV_PACKAGE_NAMElibcublas-dev-12-9
NV_LIBCUBLAS_DEV_VERSION12.9.1.4-1
NV_LIBCUBLAS_PACKAGElibcublas-12-9=12.9.1.4-1
NV_LIBCUBLAS_PACKAGE_NAMElibcublas-12-9
NV_LIBCUBLAS_VERSION12.9.1.4-1
NV_LIBCUSPARSE_DEV_VERSION12.5.10.65-1
NV_LIBCUSPARSE_VERSION12.5.10.65-1
NV_LIBNCCL_DEV_PACKAGElibnccl-dev=2.27.3-1+cuda12.9
NV_LIBNCCL_DEV_PACKAGE_NAMElibnccl-dev
NV_LIBNCCL_DEV_PACKAGE_VERSION2.27.3-1
NV_LIBNCCL_PACKAGElibnccl2=2.27.3-1+cuda12.9
NV_LIBNCCL_PACKAGE_NAMElibnccl2
NV_LIBNCCL_PACKAGE_VERSION2.27.3-1
NV_LIBNPP_DEV_PACKAGElibnpp-dev-12-9=12.4.1.87-1
NV_LIBNPP_DEV_VERSION12.4.1.87-1
NV_LIBNPP_PACKAGElibnpp-12-9=12.4.1.87-1
NV_LIBNPP_VERSION12.4.1.87-1
NV_NVML_DEV_VERSION12.9.79-1
NV_NVTX_VERSION12.9.79-1
PATH/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
UV_HTTP_TIMEOUT500
UV_INDEX_STRATEGYunsafe-best-match
UV_LINK_MODEcopy
VLLM_USAGE_SOURCEproduction-docker-image
[#000] sha256:2ea2730b4ab400d71167ddb8627f741637496aa57128fdfc248d6a9f799d76e9 - 0.23% (27.1 MB)
[#001] sha256:7aa2d0bb5c94f1cf869e71e4db856d2ca0733f5eaab55dd514441da9616abb35 - 0.04% (4.38 MB)
[#002] sha256:5136ae4e75ffd61960e9220c7d7625a3ee213ff63c25fdc24e85bfe229b16ab5 - 0.8% (93.1 MB)
[#003] sha256:6f760a753c5e1fc35281126d63b6ca9bef93e49f89a826a2bc2786e293d88f00 - 0.0% (182 Bytes)
[#004] sha256:6e8af4fd0a071982e528b634ba99dec2474c21147f99748be708f36e10e3f4c2 - 0.0% (6.72 KB)
[#005] sha256:a1a8ac6c8810bbba69c79c0b786559cdb43046337afb5e1072c2dfb7e12081f0 - 18.51% (2.1 GB)
[#006] sha256:2d795fdb14b35972f7cd05a0d3bc05f0dc533568b9f3845936159a5ba02c5efa - 0.0% (62.6 KB)
[#007] sha256:5025e003abc70f17d0181b91a9b463f826a6eff3c11b4ea44db2049d28030f4a - 0.0% (1.64 KB)
[#008] sha256:3dfb0cd50961219324866618c37873560cb92dd42eba2c71227de18c485193b5 - 0.0% (1.49 KB)
[#009] sha256:0ea494e54b55c563449895cf1e9606104fce7f6cdec0bc77470a5ca2db5137c7 - 23.31% (2.64 GB)
[#010] sha256:6bdaf2d0557fe1f99e5382d128801569f6c3bc8056777958161c2f08bbbbf073 - 0.0% (86.9 KB)
[#011] sha256:7d197f5b21324223959f696445365a3be0bf9345a2062b416bd3748db3c12b7e - 0.0% (104 Bytes)
[#012] sha256:30b83943567fd3271fe78e59573b35ebc436e6ed37da21144d502d238d5cd797 - 0.0% (229 Bytes)
[#013] sha256:50497176386cb02a94e84bbfecd7fab2cbcbfd352e32cedc05c13b93b93ca3eb - 2.6% (302 MB)
[#014] sha256:d7a3aa69c39d80e9b0f670b9b6b072b4c104469b649901aff42bc436222b68c3 - 0.34% (39.7 MB)
[#015] sha256:f41952cdf52b89028a217ca008156f65031e3a1cc3c1cd57078597f442c384a4 - 0.0% (12.4 KB)
[#016] sha256:718acd3b56096b9c828d264ddc74673f4bf82f96da236b37122e4889aba69b2d - 1.21% (140 MB)
[#017] sha256:98c567b5a4a1c192da709172abb5904c2aa70da7633e6290cb4a8c5f5c9a7170 - 36.29% (4.11 GB)
[#018] sha256:8e63cb658594cb5a3eeed8c3c9288a2d97daf1188978aa2a7202defdba71f94a - 10.34% (1.17 GB)
[#019] sha256:2fde5409f70d68a2e7d7117349852e1f5f5ad85c8c2ea5934ab71a77d26259c4 - 0.0% (173 KB)
[#020] sha256:de4cfab5d23d68f206ce774f7faa7639cfc89436b6ef57ed685cbc407f6eeaf6 - 0.0% (149 KB)
[#021] sha256:208bf01305297cb38c0f81a2d5d312e9c0df4eca0092cfa3aee293d8e2115105 - 0.0% (8.25 KB)
[#022] sha256:ebe136a4ef7e75aede88086e23c17265832211e0eb1e554b36512e91ccdce373 - 0.0% (122 Bytes)
[#023] sha256:d9711db9011e5f6e4cefae027ddc5ad137438e2eb4289f647cfebe78bee66109 - 0.0% (299 Bytes)
[#024] sha256:78c38a1f8e9add1250f3f46cc6926edf7282a31e7b6022d1ee0e321891dd3427 - 0.25% (28.8 MB)
[#025] sha256:ddd435d8379107139677517465e7b87e83dd6d93975e9d30c69ed9b8c37f6bb3 - 0.0% (1.44 KB)
[#026] sha256:eabd04ca27cbf7eca15e818f8d0c453baadaf53e48e6408c7872fc5bb33a65a0 - 0.06% (7.19 MB)
[#027] sha256:9e07a72571968f684291362fa7a2abcf036f9da6de257f2d02e0e99f66e1b3cc - 0.0% (908 Bytes)
[#028] sha256:5b56b52b4954811788403ccca51fcde732e2d71ccd8f05b6e88083a7a70175ff - 0.0% (565 KB)
[#029] sha256:ed860ff70e7ae791b49414282484352a0773ce9abcab67162b228951ed54d4b9 - 0.0% (1.51 KB)
[#030] sha256:c1f1622669170a88e378bdb2615dd7a0943b684be4ca8e14ca9bf8aeebb331ce - 5.48% (636 MB)
[#031] sha256:75f454b16592c5adf0a252f168142b9346963f49cbf0f061f620b12e30e08667 - 0.0% (235 Bytes)
[#032] sha256:42b8052766dcade4e7db1f724f97f3c92659d227ffeb34aa94359a6c4cb09186 - 0.54% (63 MB)
/bin/sh -c #(nop) ARG RELEASE
2025-07-14 16:34:14 UTC/bin/sh -c #(nop) ARG LAUNCHPAD_BUILD_ARCH
2025-07-14 16:34:14 UTC/bin/sh -c #(nop) LABEL org.opencontainers.image.ref.name=ubuntu
2025-07-14 16:34:14 UTC/bin/sh -c #(nop) LABEL org.opencontainers.image.version=22.04
2025-07-14 16:34:16 UTC/bin/sh -c #(nop) ADD file:834c1c2a4c7753a37759a9b21f64a990572643eee18669b1faa782fee45355ed in /
2025-07-14 16:34:17 UTC/bin/sh -c #(nop) CMD ["/bin/bash"]
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)ENV NVARCH=sbsa
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)ENV NVIDIA_REQUIRE_CUDA=cuda>=12.9 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566 brand=unknown,driver>=570,driver<571 brand=grid,driver>=570,driver<571 brand=tesla,driver>=570,driver<571 brand=nvidia,driver>=570,driver<571 brand=quadro,driver>=570,driver<571 brand=quadrortx,driver>=570,driver<571 brand=nvidiartx,driver>=570,driver<571 brand=vapps,driver>=570,driver<571 brand=vpc,driver>=570,driver<571 brand=vcs,driver>=570,driver<571 brand=vws,driver>=570,driver<571 brand=cloudgaming,driver>=570,driver<571
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_CUDART_VERSION=12.9.79-1
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)ARG TARGETARCH
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=arm64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.1-1_all.deb && dpkg -i cuda-keyring_1.1-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)ENV CUDA_VERSION=12.9.1
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=arm64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-9=${NV_CUDA_CUDART_VERSION} cuda-compat-12-9 && rm -rf /var/lib/apt/lists/* # buildkit
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=arm64 /bin/sh -c echo "/usr/local/cuda/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)ENV PATH=/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)COPY NGC-DL-CONTAINER-LICENSE / # buildkit
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)ENV NVIDIA_VISIBLE_DEVICES=all
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_LIB_VERSION=12.9.1-1
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENV NV_NVTX_VERSION=12.9.79-1
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENV NV_LIBNPP_VERSION=12.4.1.87-1
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENV NV_LIBNPP_PACKAGE=libnpp-12-9=12.4.1.87-1
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUSPARSE_VERSION=12.5.10.65-1
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_PACKAGE_NAME=libcublas-12-9
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_VERSION=12.9.1.4-1
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_PACKAGE=libcublas-12-9=12.9.1.4-1
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_PACKAGE_NAME=libnccl2
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_PACKAGE_VERSION=2.27.3-1
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENV NCCL_VERSION=2.27.3-1
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_PACKAGE=libnccl2=2.27.3-1+cuda12.9
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ARG TARGETARCH
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=arm64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-libraries-12-9=${NV_CUDA_LIB_VERSION} ${NV_LIBNPP_PACKAGE} cuda-nvtx-12-9=${NV_NVTX_VERSION} libcusparse-12-9=${NV_LIBCUSPARSE_VERSION} ${NV_LIBCUBLAS_PACKAGE} ${NV_LIBNCCL_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=arm64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_PACKAGE_NAME} ${NV_LIBNCCL_PACKAGE_NAME} # buildkit
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)COPY entrypoint.d/ /opt/nvidia/entrypoint.d/ # buildkit
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)COPY nvidia_entrypoint.sh /opt/nvidia/ # buildkit
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENV NVIDIA_PRODUCT_NAME=CUDA
2025-07-18 20:20:54 UTC (buildkit.dockerfile.v0)ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"]
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_LIB_VERSION=12.9.1-1
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_CUDART_DEV_VERSION=12.9.79-1
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_NVML_DEV_VERSION=12.9.79-1
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUSPARSE_DEV_VERSION=12.5.10.65-1
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_LIBNPP_DEV_VERSION=12.4.1.87-1
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_LIBNPP_DEV_PACKAGE=libnpp-dev-12-9=12.4.1.87-1
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_DEV_PACKAGE_NAME=libcublas-dev-12-9
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_DEV_VERSION=12.9.1.4-1
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_DEV_PACKAGE=libcublas-dev-12-9=12.9.1.4-1
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_NSIGHT_COMPUTE_VERSION=12.9.1-1
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE=cuda-nsight-compute-12-9=12.9.1-1
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_DEV_PACKAGE_NAME=libnccl-dev
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_DEV_PACKAGE_VERSION=2.27.3-1
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NCCL_VERSION=2.27.3-1
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_DEV_PACKAGE=libnccl-dev=2.27.3-1+cuda12.9
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)ARG TARGETARCH
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
2025-07-18 20:35:59 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=arm64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-dev-12-9=${NV_CUDA_CUDART_DEV_VERSION} cuda-command-line-tools-12-9=${NV_CUDA_LIB_VERSION} cuda-minimal-build-12-9=${NV_CUDA_LIB_VERSION} cuda-libraries-dev-12-9=${NV_CUDA_LIB_VERSION} cuda-nvml-dev-12-9=${NV_NVML_DEV_VERSION} ${NV_NVPROF_DEV_PACKAGE} ${NV_LIBNPP_DEV_PACKAGE} libcusparse-dev-12-9=${NV_LIBCUSPARSE_DEV_VERSION} ${NV_LIBCUBLAS_DEV_PACKAGE} ${NV_LIBNCCL_DEV_PACKAGE} ${NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit
2025-07-18 20:36:00 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=arm64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_DEV_PACKAGE_NAME} ${NV_LIBNCCL_DEV_PACKAGE_NAME} # buildkit
2025-07-18 20:36:00 UTC (buildkit.dockerfile.v0)ENV LIBRARY_PATH=/usr/local/cuda/lib64/stubs
2025-10-03 21:08:08 UTC (buildkit.dockerfile.v0)ARG CUDA_VERSION
2025-10-03 21:08:08 UTC (buildkit.dockerfile.v0)ARG PYTHON_VERSION
2025-10-03 21:08:08 UTC (buildkit.dockerfile.v0)ARG INSTALL_KV_CONNECTORS=false
2025-10-03 21:08:08 UTC (buildkit.dockerfile.v0)WORKDIR /vllm-workspace
2025-10-03 21:08:08 UTC (buildkit.dockerfile.v0)ENV DEBIAN_FRONTEND=noninteractive
2025-10-03 21:08:08 UTC (buildkit.dockerfile.v0)ARG TARGETPLATFORM
2025-10-03 21:08:08 UTC (buildkit.dockerfile.v0)ARG GDRCOPY_CUDA_VERSION=12.8
2025-10-03 21:08:08 UTC (buildkit.dockerfile.v0)ARG GDRCOPY_OS_VERSION=Ubuntu22_04
2025-10-03 21:08:08 UTC (buildkit.dockerfile.v0)SHELL [/bin/bash -c]
2025-10-03 21:08:08 UTC (buildkit.dockerfile.v0)ARG DEADSNAKES_MIRROR_URL
2025-10-03 21:08:08 UTC (buildkit.dockerfile.v0)ARG DEADSNAKES_GPGKEY_URL
2025-10-03 21:08:08 UTC (buildkit.dockerfile.v0)ARG GET_PIP_URL
2025-10-03 21:08:08 UTC (buildkit.dockerfile.v0)RUN |9 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/bash -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit
2025-10-03 21:10:51 UTC (buildkit.dockerfile.v0)RUN |9 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/bash -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y ccache software-properties-common git curl wget sudo vim python3-pip && apt-get install -y ffmpeg libsm6 libxext6 libgl1 && if [ ! -z ${DEADSNAKES_MIRROR_URL} ] ; then if [ ! -z "${DEADSNAKES_GPGKEY_URL}" ] ; then mkdir -p -m 0755 /etc/apt/keyrings ; curl -L ${DEADSNAKES_GPGKEY_URL} | gpg --dearmor > /etc/apt/keyrings/deadsnakes.gpg ; sudo chmod 644 /etc/apt/keyrings/deadsnakes.gpg ; echo "deb [signed-by=/etc/apt/keyrings/deadsnakes.gpg] ${DEADSNAKES_MIRROR_URL} $(lsb_release -cs) main" > /etc/apt/sources.list.d/deadsnakes.list ; fi ; else for i in 1 2 3; do add-apt-repository -y ppa:deadsnakes/ppa && break || { echo "Attempt $i failed, retrying in 5s..."; sleep 5; }; done ; fi && apt-get update -y && apt-get install -y python${PYTHON_VERSION} python${PYTHON_VERSION}-dev python${PYTHON_VERSION}-venv libibverbs-dev && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PYTHON_VERSION} 1 && update-alternatives --set python3 /usr/bin/python${PYTHON_VERSION} && ln -sf /usr/bin/python${PYTHON_VERSION}-config /usr/bin/python3-config && curl -sS ${GET_PIP_URL} | python${PYTHON_VERSION} && python3 --version && python3 -m pip --version # buildkit
2025-10-03 21:10:51 UTC (buildkit.dockerfile.v0)ARG PIP_INDEX_URL UV_INDEX_URL
2025-10-03 21:10:51 UTC (buildkit.dockerfile.v0)ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL
2025-10-03 21:10:51 UTC (buildkit.dockerfile.v0)ARG PYTORCH_CUDA_INDEX_BASE_URL
2025-10-03 21:10:51 UTC (buildkit.dockerfile.v0)ARG PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL
2025-10-03 21:10:51 UTC (buildkit.dockerfile.v0)ARG PIP_KEYRING_PROVIDER UV_KEYRING_PROVIDER
2025-10-03 21:10:53 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c python3 -m pip install uv # buildkit
2025-10-03 21:10:53 UTC (buildkit.dockerfile.v0)ENV UV_HTTP_TIMEOUT=500
2025-10-03 21:10:53 UTC (buildkit.dockerfile.v0)ENV UV_INDEX_STRATEGY=unsafe-best-match
2025-10-03 21:10:53 UTC (buildkit.dockerfile.v0)ENV UV_LINK_MODE=copy
2025-10-03 21:10:55 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit
2025-10-03 21:11:05 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c if [ "$TARGETPLATFORM" = "linux/arm64" ]; then uv pip install --system --index-url ${PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') "torch==2.8.0.dev20250318+cu128" "torchvision==0.22.0.dev20250319" ; uv pip install --system --index-url ${PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') --pre pytorch_triton==3.3.0+gitab727c40 ; fi # buildkit
2025-10-03 21:32:07 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c uv pip install --system dist/*.whl --verbose --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit
2025-10-03 21:32:07 UTC (buildkit.dockerfile.v0)ARG FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git
2025-10-03 21:32:07 UTC (buildkit.dockerfile.v0)ARG FLASHINFER_GIT_REF=v0.3.1
2025-10-03 21:32:07 UTC (buildkit.dockerfile.v0)ARG FLASHINFER_AOT_COMPILE=false
2025-10-03 22:38:27 UTC (buildkit.dockerfile.v0)RUN |20 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.3.1 FLASHINFER_AOT_COMPILE=true /bin/bash -c bash - <<'BASH' . /etc/environment git clone --depth 1 --recursive --shallow-submodules \ --branch ${FLASHINFER_GIT_REF} \ ${FLASHINFER_GIT_REPO} flashinfer pushd flashinfer if [ "${FLASHINFER_AOT_COMPILE}" = "true" ]; then # Exclude CUDA arches for older versions (11.x and 12.0-12.7) # TODO: Update this to allow setting TORCH_CUDA_ARCH_LIST as a build arg. if [[ "${CUDA_VERSION}" == 11.* ]]; then FI_TORCH_CUDA_ARCH_LIST="7.5 8.0 8.9" elif [[ "${CUDA_VERSION}" == 12.[0-7]* ]]; then FI_TORCH_CUDA_ARCH_LIST="7.5 8.0 8.9 9.0a" else # CUDA 12.8+ supports 10.0a and 12.0 FI_TORCH_CUDA_ARCH_LIST="7.5 8.0 8.9 9.0a 10.0a 12.0" fi echo "🏗️ Installing FlashInfer with AOT compilation for arches: ${FI_TORCH_CUDA_ARCH_LIST}" export FLASHINFER_CUDA_ARCH_LIST="${FI_TORCH_CUDA_ARCH_LIST}" # HACK: We need these to run flashinfer.aot before installing flashinfer, get from the package in the future uv pip install --system cuda-python==$(echo $CUDA_VERSION | cut -d. -f1,2) pynvml==$(echo $CUDA_VERSION | cut -d. -f1) nvidia-nvshmem-cu$(echo $CUDA_VERSION | cut -d. -f1) # Build AOT kernels TORCH_CUDA_ARCH_LIST="${FI_TORCH_CUDA_ARCH_LIST}" \ python3 -m flashinfer.aot # Install with no-build-isolation since we already built AOT kernels TORCH_CUDA_ARCH_LIST="${FI_TORCH_CUDA_ARCH_LIST}" \ uv pip install --system --no-build-isolation . \ --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # Download pre-compiled cubins TORCH_CUDA_ARCH_LIST="${FI_TORCH_CUDA_ARCH_LIST}" \ python3 -m flashinfer --download-cubin || echo "WARNING: Failed to download flashinfer cubins." else echo "🏗️ Installing FlashInfer without AOT compilation in JIT mode" uv pip install --system . \ --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') fi popd rm -rf flashinfer BASH # buildkit
2025-10-03 22:38:27 UTC (buildkit.dockerfile.v0)COPY examples examples # buildkit
2025-10-03 22:38:27 UTC (buildkit.dockerfile.v0)COPY benchmarks benchmarks # buildkit
2025-10-03 22:38:28 UTC (buildkit.dockerfile.v0)COPY ./vllm/collect_env.py . # buildkit
2025-10-03 22:38:28 UTC (buildkit.dockerfile.v0)RUN |20 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.3.1 FLASHINFER_AOT_COMPILE=true /bin/bash -c . /etc/environment && uv pip list # buildkit
2025-10-03 22:38:28 UTC (buildkit.dockerfile.v0)COPY requirements/build.txt requirements/build.txt # buildkit
2025-10-03 22:38:30 UTC (buildkit.dockerfile.v0)RUN |20 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.3.1 FLASHINFER_AOT_COMPILE=true /bin/bash -c uv pip install --system -r requirements/build.txt --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit
2025-10-03 22:38:30 UTC (buildkit.dockerfile.v0)ARG DEEPGEMM_GIT_REF
2025-10-03 22:38:30 UTC (buildkit.dockerfile.v0)COPY tools/install_deepgemm.sh /tmp/install_deepgemm.sh # buildkit
2025-10-03 22:39:21 UTC (buildkit.dockerfile.v0)RUN |21 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.3.1 FLASHINFER_AOT_COMPILE=true DEEPGEMM_GIT_REF= /bin/bash -c VLLM_DOCKER_BUILD_CONTEXT=1 /tmp/install_deepgemm.sh --cuda-version "${CUDA_VERSION}" ${DEEPGEMM_GIT_REF:+--ref "$DEEPGEMM_GIT_REF"} # buildkit
2025-10-03 22:39:22 UTC (buildkit.dockerfile.v0)COPY tools/install_gdrcopy.sh install_gdrcopy.sh # buildkit
2025-10-03 22:39:26 UTC (buildkit.dockerfile.v0)RUN |21 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.3.1 FLASHINFER_AOT_COMPILE=true DEEPGEMM_GIT_REF= /bin/bash -c set -eux; case "${TARGETPLATFORM}" in linux/arm64) UUARCH="aarch64" ;; linux/amd64) UUARCH="x64" ;; *) echo "Unsupported TARGETPLATFORM: ${TARGETPLATFORM}" >&2; exit 1 ;; esac; ./install_gdrcopy.sh "${GDRCOPY_OS_VERSION}" "${GDRCOPY_CUDA_VERSION}" "${UUARCH}"; rm ./install_gdrcopy.sh # buildkit
2025-10-03 22:39:26 UTC (buildkit.dockerfile.v0)COPY tools/ep_kernels/install_python_libraries.sh install_python_libraries.sh # buildkit
2025-10-03 22:39:26 UTC (buildkit.dockerfile.v0)ENV CUDA_HOME=/usr/local/cuda
2025-10-03 22:45:21 UTC (buildkit.dockerfile.v0)RUN |21 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/arm64 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.3.1 FLASHINFER_AOT_COMPILE=true DEEPGEMM_GIT_REF= /bin/bash -c export TORCH_CUDA_ARCH_LIST="${TORCH_CUDA_ARCH_LIST:-9.0a+PTX}" && bash install_python_libraries.sh # buildkit
2025-10-03 22:45:21 UTC (buildkit.dockerfile.v0)ARG TARGETPLATFORM
2025-10-03 22:45:21 UTC (buildkit.dockerfile.v0)ARG INSTALL_KV_CONNECTORS=false
2025-10-03 22:45:21 UTC (buildkit.dockerfile.v0)ARG PIP_INDEX_URL UV_INDEX_URL
2025-10-03 22:45:21 UTC (buildkit.dockerfile.v0)ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL
2025-10-03 22:45:21 UTC (buildkit.dockerfile.v0)ENV UV_HTTP_TIMEOUT=500
2025-10-03 22:45:21 UTC (buildkit.dockerfile.v0)COPY requirements/kv_connectors.txt requirements/kv_connectors.txt # buildkit
2025-10-03 22:45:44 UTC (buildkit.dockerfile.v0)RUN |6 TARGETPLATFORM=linux/arm64 INSTALL_KV_CONNECTORS=true PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= /bin/bash -c if [ "$INSTALL_KV_CONNECTORS" = "true" ]; then uv pip install --system -r requirements/kv_connectors.txt; fi; if [ "$TARGETPLATFORM" = "linux/arm64" ]; then BITSANDBYTES_VERSION="0.42.0"; else BITSANDBYTES_VERSION="0.46.1"; fi; uv pip install --system accelerate hf_transfer modelscope "bitsandbytes>=${BITSANDBYTES_VERSION}" 'timm>=1.0.17' boto3 runai-model-streamer runai-model-streamer[s3] # buildkit
2025-10-03 22:45:44 UTC (buildkit.dockerfile.v0)ENV VLLM_USAGE_SOURCE=production-docker-image
2025-10-03 22:45:44 UTC (buildkit.dockerfile.v0)ENTRYPOINT ["python3" "-m" "vllm.entrypoints.openai.api_server"]
Please be careful as this will not just delete the reference but also the actual content!
For example when you have latest and v1.2.3 both pointing to the same image
the deletion of latest will also permanently remove v1.2.3.