2025-04-06 04:42:15 UTC
8.38 GB
12.4.0
DEBIAN_FRONTENDnoninteractive
LD_LIBRARY_PATH/usr/local/nvidia/lib:/usr/local/nvidia/lib64
LIBRARY_PATH/usr/local/cuda/lib64/stubs
NCCL_VERSION2.20.5-1
NVARCHx86_64
NVIDIA_DRIVER_CAPABILITIEScompute,utility
NVIDIA_PRODUCT_NAMECUDA
NVIDIA_REQUIRE_CUDAcuda>=12.4 brand=tesla,driver>=470,driver<471 brand=unknown,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=geforce,driver>=470,driver<471 brand=geforcertx,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=titan,driver>=470,driver<471 brand=titanrtx,driver>=470,driver<471 brand=tesla,driver>=525,driver<526 brand=unknown,driver>=525,driver<526 brand=nvidia,driver>=525,driver<526 brand=nvidiartx,driver>=525,driver<526 brand=geforce,driver>=525,driver<526 brand=geforcertx,driver>=525,driver<526 brand=quadro,driver>=525,driver<526 brand=quadrortx,driver>=525,driver<526 brand=titan,driver>=525,driver<526 brand=titanrtx,driver>=525,driver<526 brand=tesla,driver>=535,driver<536 brand=unknown,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=geforce,driver>=535,driver<536 brand=geforcertx,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=titan,driver>=535,driver<536 brand=titanrtx,driver>=535,driver<536
NVIDIA_VISIBLE_DEVICESall
NV_CUDA_COMPAT_PACKAGEcuda-compat-12-4
NV_CUDA_CUDART_DEV_VERSION12.4.99-1
NV_CUDA_CUDART_VERSION12.4.99-1
NV_CUDA_LIB_VERSION12.4.0-1
NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGEcuda-nsight-compute-12-4=12.4.0-1
NV_CUDA_NSIGHT_COMPUTE_VERSION12.4.0-1
NV_LIBCUBLAS_DEV_PACKAGElibcublas-dev-12-4=12.4.2.65-1
NV_LIBCUBLAS_DEV_PACKAGE_NAMElibcublas-dev-12-4
NV_LIBCUBLAS_DEV_VERSION12.4.2.65-1
NV_LIBCUBLAS_PACKAGElibcublas-12-4=12.4.2.65-1
NV_LIBCUBLAS_PACKAGE_NAMElibcublas-12-4
NV_LIBCUBLAS_VERSION12.4.2.65-1
NV_LIBCUSPARSE_DEV_VERSION12.3.0.142-1
NV_LIBCUSPARSE_VERSION12.3.0.142-1
NV_LIBNCCL_DEV_PACKAGElibnccl-dev=2.20.5-1+cuda12.4
NV_LIBNCCL_DEV_PACKAGE_NAMElibnccl-dev
NV_LIBNCCL_DEV_PACKAGE_VERSION2.20.5-1
NV_LIBNCCL_PACKAGElibnccl2=2.20.5-1+cuda12.4
NV_LIBNCCL_PACKAGE_NAMElibnccl2
NV_LIBNCCL_PACKAGE_VERSION2.20.5-1
NV_LIBNPP_DEV_PACKAGElibnpp-dev-12-4=12.2.5.2-1
NV_LIBNPP_DEV_VERSION12.2.5.2-1
NV_LIBNPP_PACKAGElibnpp-12-4=12.2.5.2-1
NV_LIBNPP_VERSION12.2.5.2-1
NV_NVML_DEV_VERSION12.4.99-1
NV_NVPROF_DEV_PACKAGEcuda-nvprof-12-4=12.4.99-1
NV_NVPROF_VERSION12.4.99-1
NV_NVTX_VERSION12.4.99-1
PATH/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
UV_HTTP_TIMEOUT500
VLLM_USAGE_SOURCEproduction-docker-image
[#000] sha256:23828d760c7b04df02891af556c40ca44c2dd79d6837ea6f18fac24f4108448c - 0.34% (29 MB)
[#001] sha256:edd1dba56169c724e9377dafe9d6dd34c0ef9585109fa8366b4a3ee68e07fd25 - 0.05% (4.41 MB)
[#002] sha256:e06eb1b5c4cc0283389710e45402738c973f9c27a4cbdf90d53751723279e001 - 0.64% (54.9 MB)
[#003] sha256:7f308a7652768c0a964eb1720554421079b6a956110c7a12362380d2372fe82f - 0.0% (184 Bytes)
[#004] sha256:3af11d09e9cd1eb9c379f0a4071231e5a5642eb728b4b33bcb76be291f3c9488 - 0.0% (6.72 KB)
[#005] sha256:42896cdfd7b6a3e75be89e9fbc327a2dc8a1f56ab23a994553c28125ed85f528 - 15.12% (1.27 GB)
[#006] sha256:6005190795580507557f886a8cb09d07f48a293591caa5f686ae89e2f363a350 - 0.0% (62.6 KB)
[#007] sha256:0ae42424cadfa646dc06982b0ed3d08688b628c43fc379782b3b5d2d578eb041 - 0.0% (1.65 KB)
[#008] sha256:73b7968785dcb3e277c8de18c033614246b9419edb40941a0fc66aed6c831edb - 0.0% (1.49 KB)
[#009] sha256:80150f70fb1e403d909539844a70fcb152ecfbd994a2c2c186dd71abb90be693 - 29.19% (2.45 GB)
[#010] sha256:3bd5db8307cf789162a5a096889ea97023d5795068bdd8f07a0b09b3615d17df - 0.0% (86.8 KB)
[#011] sha256:ab239415ae73e11f87a2a1eea9c925feab641bd69e4c54f917a6a59364a34f8e - 0.0% (104 Bytes)
[#012] sha256:6fb4ebd5ba7c5f0320018c0923d7ada8ea732e342fedcc91a00f3b0d0895d154 - 0.0% (229 Bytes)
[#013] sha256:a37d9fc5e9a1d95af9d7650ec44c0056efa33a322b8b58a12144c0815aa0bd0b - 3.66% (314 MB)
[#014] sha256:23080b1808657d8a8f4a4b8cee454a153bca9b70848b7957ce4cd3575f98f7ef - 0.38% (32.7 MB)
[#015] sha256:2a87b7c0cece216ed436882d032761bf7f104cfbea869b63a15bcca3c33a6359 - 0.0% (12.8 KB)
[#016] sha256:5752ff55c9579d56c6390bd9c8047e8d3bdcc76ebb38d8336f3ff9b889e81a11 - 0.0% (122 Bytes)
[#017] sha256:0a1639fced3a6dc7556f289d452ed08560c30ac868e694b2c2b79ea76101c274 - 43.11% (3.61 GB)
[#018] sha256:458d836a6bde7126609904be66663dd1fcd25d35e0e672b9d40036ac006acc93 - 6.05% (519 MB)
[#019] sha256:6379528bd2c0da43bd0250957da81f70bda565cbeee0d9e7b930ec73c9d7c055 - 0.0% (95 KB)
[#020] sha256:9d7c1cc1d11e627b1a3ae3d1fae6bea03d7a0837dc9a38a9913e94de79b5ce97 - 0.0% (273 Bytes)
[#021] sha256:9834c4a6484e4ea7ed007a84489cce1232c2538b90ca3c397c281f79359748f1 - 0.3% (25.9 MB)
[#022] sha256:bec7545c7b3ff59eafe41de97728d90178d0b43855ae579f6bb8e8e3f00b0d8c - 1.16% (99.9 MB)
/bin/sh -c #(nop) ARG RELEASE
2024-02-27 18:52:57 UTC/bin/sh -c #(nop) ARG LAUNCHPAD_BUILD_ARCH
2024-02-27 18:52:57 UTC/bin/sh -c #(nop) LABEL org.opencontainers.image.ref.name=ubuntu
2024-02-27 18:52:57 UTC/bin/sh -c #(nop) LABEL org.opencontainers.image.version=22.04
2024-02-27 18:52:58 UTC/bin/sh -c #(nop) ADD file:21c2e8d95909bec6f4acdaf4aed55b44ee13603681f93b152e423e3e6a4a207b in /
2024-02-27 18:52:59 UTC/bin/sh -c #(nop) CMD ["/bin/bash"]
2024-04-04 23:36:11 UTC (buildkit.dockerfile.v0)ENV NVARCH=x86_64
2024-04-04 23:36:11 UTC (buildkit.dockerfile.v0)ENV NVIDIA_REQUIRE_CUDA=cuda>=12.4 brand=tesla,driver>=470,driver<471 brand=unknown,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=geforce,driver>=470,driver<471 brand=geforcertx,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=titan,driver>=470,driver<471 brand=titanrtx,driver>=470,driver<471 brand=tesla,driver>=525,driver<526 brand=unknown,driver>=525,driver<526 brand=nvidia,driver>=525,driver<526 brand=nvidiartx,driver>=525,driver<526 brand=geforce,driver>=525,driver<526 brand=geforcertx,driver>=525,driver<526 brand=quadro,driver>=525,driver<526 brand=quadrortx,driver>=525,driver<526 brand=titan,driver>=525,driver<526 brand=titanrtx,driver>=525,driver<526 brand=tesla,driver>=535,driver<536 brand=unknown,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=geforce,driver>=535,driver<536 brand=geforcertx,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=titan,driver>=535,driver<536 brand=titanrtx,driver>=535,driver<536
2024-04-04 23:36:11 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_CUDART_VERSION=12.4.99-1
2024-04-04 23:36:11 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_COMPAT_PACKAGE=cuda-compat-12-4
2024-04-04 23:36:11 UTC (buildkit.dockerfile.v0)ARG TARGETARCH
2024-04-04 23:36:11 UTC (buildkit.dockerfile.v0)LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
2024-04-04 23:36:11 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.1-1_all.deb && dpkg -i cuda-keyring_1.1-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit
2024-04-04 23:36:11 UTC (buildkit.dockerfile.v0)ENV CUDA_VERSION=12.4.0
2024-04-04 23:36:23 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-4=${NV_CUDA_CUDART_VERSION} ${NV_CUDA_COMPAT_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit
2024-04-04 23:36:23 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/nvidia/lib" >> /etc/ld.so.conf.d/nvidia.conf && echo "/usr/local/nvidia/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit
2024-04-04 23:36:23 UTC (buildkit.dockerfile.v0)ENV PATH=/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
2024-04-04 23:36:23 UTC (buildkit.dockerfile.v0)ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib:/usr/local/nvidia/lib64
2024-04-04 23:36:23 UTC (buildkit.dockerfile.v0)COPY NGC-DL-CONTAINER-LICENSE / # buildkit
2024-04-04 23:36:23 UTC (buildkit.dockerfile.v0)ENV NVIDIA_VISIBLE_DEVICES=all
2024-04-04 23:36:23 UTC (buildkit.dockerfile.v0)ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_LIB_VERSION=12.4.0-1
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENV NV_NVTX_VERSION=12.4.99-1
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENV NV_LIBNPP_VERSION=12.2.5.2-1
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENV NV_LIBNPP_PACKAGE=libnpp-12-4=12.2.5.2-1
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUSPARSE_VERSION=12.3.0.142-1
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_PACKAGE_NAME=libcublas-12-4
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_VERSION=12.4.2.65-1
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_PACKAGE=libcublas-12-4=12.4.2.65-1
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_PACKAGE_NAME=libnccl2
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_PACKAGE_VERSION=2.20.5-1
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENV NCCL_VERSION=2.20.5-1
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_PACKAGE=libnccl2=2.20.5-1+cuda12.4
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ARG TARGETARCH
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-libraries-12-4=${NV_CUDA_LIB_VERSION} ${NV_LIBNPP_PACKAGE} cuda-nvtx-12-4=${NV_NVTX_VERSION} libcusparse-12-4=${NV_LIBCUSPARSE_VERSION} ${NV_LIBCUBLAS_PACKAGE} ${NV_LIBNCCL_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_PACKAGE_NAME} ${NV_LIBNCCL_PACKAGE_NAME} # buildkit
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)COPY entrypoint.d/ /opt/nvidia/entrypoint.d/ # buildkit
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)COPY nvidia_entrypoint.sh /opt/nvidia/ # buildkit
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENV NVIDIA_PRODUCT_NAME=CUDA
2024-04-04 23:40:07 UTC (buildkit.dockerfile.v0)ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"]
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_LIB_VERSION=12.4.0-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_CUDART_DEV_VERSION=12.4.99-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_NVML_DEV_VERSION=12.4.99-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUSPARSE_DEV_VERSION=12.3.0.142-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_LIBNPP_DEV_VERSION=12.2.5.2-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_LIBNPP_DEV_PACKAGE=libnpp-dev-12-4=12.2.5.2-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_DEV_VERSION=12.4.2.65-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_DEV_PACKAGE_NAME=libcublas-dev-12-4
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_LIBCUBLAS_DEV_PACKAGE=libcublas-dev-12-4=12.4.2.65-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_NSIGHT_COMPUTE_VERSION=12.4.0-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE=cuda-nsight-compute-12-4=12.4.0-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_NVPROF_VERSION=12.4.99-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_NVPROF_DEV_PACKAGE=cuda-nvprof-12-4=12.4.99-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_DEV_PACKAGE_NAME=libnccl-dev
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_DEV_PACKAGE_VERSION=2.20.5-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NCCL_VERSION=2.20.5-1
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV NV_LIBNCCL_DEV_PACKAGE=libnccl-dev=2.20.5-1+cuda12.4
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ARG TARGETARCH
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-dev-12-4=${NV_CUDA_CUDART_DEV_VERSION} cuda-command-line-tools-12-4=${NV_CUDA_LIB_VERSION} cuda-minimal-build-12-4=${NV_CUDA_LIB_VERSION} cuda-libraries-dev-12-4=${NV_CUDA_LIB_VERSION} cuda-nvml-dev-12-4=${NV_NVML_DEV_VERSION} ${NV_NVPROF_DEV_PACKAGE} ${NV_LIBNPP_DEV_PACKAGE} libcusparse-dev-12-4=${NV_LIBCUSPARSE_DEV_VERSION} ${NV_LIBCUBLAS_DEV_PACKAGE} ${NV_LIBNCCL_DEV_PACKAGE} ${NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_DEV_PACKAGE_NAME} ${NV_LIBNCCL_DEV_PACKAGE_NAME} # buildkit
2024-04-04 23:47:46 UTC (buildkit.dockerfile.v0)ENV LIBRARY_PATH=/usr/local/cuda/lib64/stubs
2025-04-06 04:19:40 UTC (buildkit.dockerfile.v0)ARG CUDA_VERSION=12.4.1
2025-04-06 04:19:40 UTC (buildkit.dockerfile.v0)ARG PYTHON_VERSION=3.12
2025-04-06 04:19:40 UTC (buildkit.dockerfile.v0)WORKDIR /vllm-workspace
2025-04-06 04:19:40 UTC (buildkit.dockerfile.v0)ENV DEBIAN_FRONTEND=noninteractive
2025-04-06 04:19:40 UTC (buildkit.dockerfile.v0)ARG TARGETPLATFORM
2025-04-06 04:19:40 UTC (buildkit.dockerfile.v0)RUN |3 CUDA_VERSION=12.4.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit
2025-04-06 04:22:22 UTC (buildkit.dockerfile.v0)RUN |3 CUDA_VERSION=12.4.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y ccache software-properties-common git curl wget sudo vim python3-pip && apt-get install -y ffmpeg libsm6 libxext6 libgl1 && add-apt-repository ppa:deadsnakes/ppa && apt-get update -y && apt-get install -y python${PYTHON_VERSION} python${PYTHON_VERSION}-dev python${PYTHON_VERSION}-venv libibverbs-dev && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PYTHON_VERSION} 1 && update-alternatives --set python3 /usr/bin/python${PYTHON_VERSION} && ln -sf /usr/bin/python${PYTHON_VERSION}-config /usr/bin/python3-config && curl -sS https://bootstrap.pypa.io/get-pip.py | python${PYTHON_VERSION} && python3 --version && python3 -m pip --version # buildkit
2025-04-06 04:22:25 UTC (buildkit.dockerfile.v0)RUN |3 CUDA_VERSION=12.4.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c python3 -m pip install uv # buildkit
2025-04-06 04:22:25 UTC (buildkit.dockerfile.v0)ENV UV_HTTP_TIMEOUT=500
2025-04-06 04:22:26 UTC (buildkit.dockerfile.v0)RUN |3 CUDA_VERSION=12.4.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit
2025-04-06 04:22:27 UTC (buildkit.dockerfile.v0)RUN |3 CUDA_VERSION=12.4.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c if [ "$TARGETPLATFORM" = "linux/arm64" ]; then uv pip install --system --index-url https://download.pytorch.org/whl/nightly/cu128 "torch==2.8.0.dev20250318+cu128" "torchvision==0.22.0.dev20250319"; uv pip install --system --index-url https://download.pytorch.org/whl/nightly/cu128 --pre pytorch_triton==3.3.0+gitab727c40; fi # buildkit
2025-04-06 04:41:50 UTC (buildkit.dockerfile.v0)RUN |3 CUDA_VERSION=12.4.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c uv pip install --system dist/*.whl --verbose # buildkit
2025-04-06 04:42:07 UTC (buildkit.dockerfile.v0)RUN |3 CUDA_VERSION=12.4.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c . /etc/environment && if [ "$TARGETPLATFORM" != "linux/arm64" ]; then uv pip install --system https://github.com/flashinfer-ai/flashinfer/releases/download/v0.2.1.post2/flashinfer_python-0.2.1.post2+cu124torch2.6-cp38-abi3-linux_x86_64.whl ; fi # buildkit
2025-04-06 04:42:08 UTC (buildkit.dockerfile.v0)COPY examples examples # buildkit
2025-04-06 04:42:08 UTC (buildkit.dockerfile.v0)COPY requirements/build.txt requirements/build.txt # buildkit
2025-04-06 04:42:08 UTC (buildkit.dockerfile.v0)RUN |3 CUDA_VERSION=12.4.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c uv pip install --system -r requirements/build.txt # buildkit
2025-04-06 04:42:08 UTC (buildkit.dockerfile.v0)ENV UV_HTTP_TIMEOUT=500
2025-04-06 04:42:15 UTC (buildkit.dockerfile.v0)RUN /bin/sh -c if [ "$TARGETPLATFORM" = "linux/arm64" ]; then uv pip install --system accelerate hf_transfer 'modelscope!=1.15.0' 'bitsandbytes>=0.42.0' 'timm==0.9.10' boto3 runai-model-streamer runai-model-streamer[s3]; else uv pip install --system accelerate hf_transfer 'modelscope!=1.15.0' 'bitsandbytes>=0.45.3' 'timm==0.9.10' boto3 runai-model-streamer runai-model-streamer[s3]; fi # buildkit
2025-04-06 04:42:15 UTC (buildkit.dockerfile.v0)ENV VLLM_USAGE_SOURCE=production-docker-image
2025-04-06 04:42:15 UTC (buildkit.dockerfile.v0)ENTRYPOINT ["python3" "-m" "vllm.entrypoints.openai.api_server"]
Please be careful, as this will not just delete the reference but also the actual content!
For example, when you have "latest" and "v1.2.3" both pointing to the same image,
the deletion of "latest" will also permanently remove "v1.2.3".