Namespace
vllm
Image / Tag
vllm-openai:v0.7.1
Content Digest
sha256:9cd69b577cf26df32aceb74577ea7f6749618a72e630f654ecb10dbfb23e3de4
Details
Created

2025-02-01 19:03:05 UTC

Size

8.3 GB

Content Digest
Labels
  • maintainer
    NVIDIA CORPORATION <cudatools@nvidia.com>
  • org.opencontainers.image.ref.name
    ubuntu
  • org.opencontainers.image.version
    22.04

Environment
CUDA_VERSION

12.1.0

DEBIAN_FRONTEND

noninteractive

LD_LIBRARY_PATH

/usr/local/nvidia/lib:/usr/local/nvidia/lib64

LIBRARY_PATH

/usr/local/cuda/lib64/stubs

NCCL_VERSION

2.17.1-1

NVARCH

x86_64

NVIDIA_CUDA_END_OF_LIFE

1

NVIDIA_DRIVER_CAPABILITIES

compute,utility

NVIDIA_PRODUCT_NAME

CUDA

NVIDIA_REQUIRE_CUDA

cuda>=12.1 brand=tesla,driver>=470,driver<471 brand=unknown,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=geforce,driver>=470,driver<471 brand=geforcertx,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=titan,driver>=470,driver<471 brand=titanrtx,driver>=470,driver<471 brand=tesla,driver>=525,driver<526 brand=unknown,driver>=525,driver<526 brand=nvidia,driver>=525,driver<526 brand=nvidiartx,driver>=525,driver<526 brand=geforce,driver>=525,driver<526 brand=geforcertx,driver>=525,driver<526 brand=quadro,driver>=525,driver<526 brand=quadrortx,driver>=525,driver<526 brand=titan,driver>=525,driver<526 brand=titanrtx,driver>=525,driver<526

NVIDIA_VISIBLE_DEVICES

all

NV_CUDA_COMPAT_PACKAGE

cuda-compat-12-1

NV_CUDA_CUDART_DEV_VERSION

12.1.55-1

NV_CUDA_CUDART_VERSION

12.1.55-1

NV_CUDA_LIB_VERSION

12.1.0-1

NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE

cuda-nsight-compute-12-1=12.1.0-1

NV_CUDA_NSIGHT_COMPUTE_VERSION

12.1.0-1

NV_LIBCUBLAS_DEV_PACKAGE

libcublas-dev-12-1=12.1.0.26-1

NV_LIBCUBLAS_DEV_PACKAGE_NAME

libcublas-dev-12-1

NV_LIBCUBLAS_DEV_VERSION

12.1.0.26-1

NV_LIBCUBLAS_PACKAGE

libcublas-12-1=12.1.0.26-1

NV_LIBCUBLAS_PACKAGE_NAME

libcublas-12-1

NV_LIBCUBLAS_VERSION

12.1.0.26-1

NV_LIBCUSPARSE_DEV_VERSION

12.0.2.55-1

NV_LIBCUSPARSE_VERSION

12.0.2.55-1

NV_LIBNCCL_DEV_PACKAGE

libnccl-dev=2.17.1-1+cuda12.1

NV_LIBNCCL_DEV_PACKAGE_NAME

libnccl-dev

NV_LIBNCCL_DEV_PACKAGE_VERSION

2.17.1-1

NV_LIBNCCL_PACKAGE

libnccl2=2.17.1-1+cuda12.1

NV_LIBNCCL_PACKAGE_NAME

libnccl2

NV_LIBNCCL_PACKAGE_VERSION

2.17.1-1

NV_LIBNPP_DEV_PACKAGE

libnpp-dev-12-1=12.0.2.50-1

NV_LIBNPP_DEV_VERSION

12.0.2.50-1

NV_LIBNPP_PACKAGE

libnpp-12-1=12.0.2.50-1

NV_LIBNPP_VERSION

12.0.2.50-1

NV_NVML_DEV_VERSION

12.1.55-1

NV_NVPROF_DEV_PACKAGE

cuda-nvprof-12-1=12.1.55-1

NV_NVPROF_VERSION

12.1.55-1

NV_NVTX_VERSION

12.1.66-1

PATH

/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

VLLM_USAGE_SOURCE

production-docker-image


Layers

[#000] sha256:aece8493d3972efa43bfd4ee3cdba659c0f787f8f59c82fb3e48c87cbb22a12e - 0.33% (28.2 MB)

[#001] sha256:45f7ea5367fe9dcee002e55e45a888af03a36523d11d2213ef9c6fc0088f6e96 - 0.05% (4.41 MB)

[#002] sha256:3d97a47c3c73a9f0e95e65070cfd89d749b89b490846c2a7ab0b796097d3c12b - 0.63% (53.1 MB)

[#003] sha256:12cd4d19752f10fb4ec393dc915c62c18895ce0090f0db7773b2426f9059df16 - 0.0% (185 Bytes)

[#004] sha256:da5a484f9d74b1673c155ea49073a322875f9a48118d0d5656c60224c7f8094e - 0.0% (6.72 KB)

[#005] sha256:5e5846364eee50e93288b9e4085bc9e558ed543163636c9ca2e61a528cb4952d - 14.49% (1.2 GB)

[#006] sha256:fd355de1d1f25492195368f3c3859f24af856e5d7a2ffb34951776daa50bd3e7 - 0.0% (62.4 KB)

[#007] sha256:3480bb79c6384806f3ae4d8854b5e7ea3e51c3e0ed913965790cdb1ac06cb0c4 - 0.0% (1.65 KB)

[#008] sha256:e7016935dd60c632d835fe53b96c59b79194151f22ed555675a41525e066a99f - 0.0% (1.49 KB)

[#009] sha256:99541166a1337295206d78a74f33e732d8acee77395b8e4de71f6d80c2dd951c - 28.16% (2.34 GB)

[#010] sha256:8999112df5b031b628f484c1c2aec564d110232aa865626bf5be629955160ea1 - 0.0% (86.4 KB)

[#011] sha256:dfcca668e688df1b838c19532f3364eb99ff94f62903bb0268aba55eaffaca6d - 0.0% (104 Bytes)

[#012] sha256:8f64356cf212db4e6ac6929804de50c1ceb01d0345637fe0a306c15f60152138 - 0.0% (231 Bytes)

[#013] sha256:8a21015f209494c1f20f330b2bec64d711edfd8935d9ac3433e3e3bbe1e0822d - 3.68% (313 MB)

[#014] sha256:4f47ddde78a10d214e47147968079dbc9fc135308dd956ab57eaa58eebecda44 - 0.0% (12.6 KB)

[#015] sha256:4f4fb700ef54461cfa02571ae0db9a0dc1e0cdb5577484a6d75e68dc38e8acc1 - 0.0% (32 Bytes)

[#016] sha256:77a82039a915c838b53aebb1b1d5379743cb0e6e4fc01c268757b4a91e8ce8e6 - 40.38% (3.35 GB)

[#017] sha256:3683743cc31cdaa785c49bcec1bcd77a3d28ff994022d07a06c140ba5cfad245 - 10.72% (911 MB)

[#018] sha256:0014b2a13575a4c1cbac4190df81bc0d08c5bfc87c88785c3299c1531d2933ba - 0.0% (71.1 KB)

[#019] sha256:9d78eba7a05283c285ac2416feb87307590aa35a7e471e109ecd0a671c5a1d84 - 0.0% (257 Bytes)

[#020] sha256:4f13afae2075a7e283688e83ad07eba543f9224ba92b6e575d771e8421aa76c5 - 0.31% (26.3 MB)

[#021] sha256:ad4d7dfefc51dfc4c1ebecb4b876fdfd0ffeb1f6387a1abd0be6c6715addc574 - 1.25% (106 MB)


History
2023-10-05 07:33:30 UTC

/bin/sh -c #(nop) ARG RELEASE

2023-10-05 07:33:30 UTC

/bin/sh -c #(nop) ARG LAUNCHPAD_BUILD_ARCH

2023-10-05 07:33:30 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.ref.name=ubuntu

2023-10-05 07:33:30 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.version=22.04

2023-10-05 07:33:32 UTC

/bin/sh -c #(nop) ADD file:63d5ab3ef0aab308c0e71cb67292c5467f60deafa9b0418cbb220affcd078444 in /

2023-10-05 07:33:32 UTC

/bin/sh -c #(nop) CMD ["/bin/bash"]

2023-11-10 05:44:18 UTC (buildkit.dockerfile.v0)

ENV NVARCH=x86_64

2023-11-10 05:44:18 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_REQUIRE_CUDA=cuda>=12.1 brand=tesla,driver>=470,driver<471 brand=unknown,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=geforce,driver>=470,driver<471 brand=geforcertx,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=titan,driver>=470,driver<471 brand=titanrtx,driver>=470,driver<471 brand=tesla,driver>=525,driver<526 brand=unknown,driver>=525,driver<526 brand=nvidia,driver>=525,driver<526 brand=nvidiartx,driver>=525,driver<526 brand=geforce,driver>=525,driver<526 brand=geforcertx,driver>=525,driver<526 brand=quadro,driver>=525,driver<526 brand=quadrortx,driver>=525,driver<526 brand=titan,driver>=525,driver<526 brand=titanrtx,driver>=525,driver<526

2023-11-10 05:44:18 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_CUDART_VERSION=12.1.55-1

2023-11-10 05:44:18 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_COMPAT_PACKAGE=cuda-compat-12-1

2023-11-10 05:44:18 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2023-11-10 05:44:18 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

2023-11-10 05:44:18 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.0-1_all.deb && dpkg -i cuda-keyring_1.0-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit

2023-11-10 05:44:18 UTC (buildkit.dockerfile.v0)

ENV CUDA_VERSION=12.1.0

2023-11-10 05:44:29 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-1=${NV_CUDA_CUDART_VERSION} ${NV_CUDA_COMPAT_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit

2023-11-10 05:44:29 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/nvidia/lib" >> /etc/ld.so.conf.d/nvidia.conf && echo "/usr/local/nvidia/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit

2023-11-10 05:44:29 UTC (buildkit.dockerfile.v0)

ENV PATH=/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

2023-11-10 05:44:29 UTC (buildkit.dockerfile.v0)

ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib:/usr/local/nvidia/lib64

2023-11-10 05:44:29 UTC (buildkit.dockerfile.v0)

COPY NGC-DL-CONTAINER-LICENSE / # buildkit

2023-11-10 05:44:29 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_VISIBLE_DEVICES=all

2023-11-10 05:44:29 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_LIB_VERSION=12.1.0-1

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

ENV NV_NVTX_VERSION=12.1.66-1

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_VERSION=12.0.2.50-1

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_PACKAGE=libnpp-12-1=12.0.2.50-1

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUSPARSE_VERSION=12.0.2.55-1

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_PACKAGE_NAME=libcublas-12-1

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_VERSION=12.1.0.26-1

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_PACKAGE=libcublas-12-1=12.1.0.26-1

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_PACKAGE_NAME=libnccl2

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_PACKAGE_VERSION=2.17.1-1

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

ENV NCCL_VERSION=2.17.1-1

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_PACKAGE=libnccl2=2.17.1-1+cuda12.1

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

2023-11-10 05:49:19 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-libraries-12-1=${NV_CUDA_LIB_VERSION} ${NV_LIBNPP_PACKAGE} cuda-nvtx-12-1=${NV_NVTX_VERSION} libcusparse-12-1=${NV_LIBCUSPARSE_VERSION} ${NV_LIBCUBLAS_PACKAGE} ${NV_LIBNCCL_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit

2023-11-10 05:49:20 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_PACKAGE_NAME} ${NV_LIBNCCL_PACKAGE_NAME} # buildkit

2023-11-10 05:49:20 UTC (buildkit.dockerfile.v0)

COPY entrypoint.d/ /opt/nvidia/entrypoint.d/ # buildkit

2023-11-10 05:49:20 UTC (buildkit.dockerfile.v0)

COPY nvidia_entrypoint.sh /opt/nvidia/ # buildkit

2023-11-10 05:49:20 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_PRODUCT_NAME=CUDA

2023-11-10 05:49:20 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_CUDA_END_OF_LIFE=1

2023-11-10 05:49:20 UTC (buildkit.dockerfile.v0)

ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"]

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_LIB_VERSION=12.1.0-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_CUDART_DEV_VERSION=12.1.55-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_NVML_DEV_VERSION=12.1.55-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUSPARSE_DEV_VERSION=12.0.2.55-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_DEV_VERSION=12.0.2.50-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_DEV_PACKAGE=libnpp-dev-12-1=12.0.2.50-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_DEV_VERSION=12.1.0.26-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_DEV_PACKAGE_NAME=libcublas-dev-12-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_DEV_PACKAGE=libcublas-dev-12-1=12.1.0.26-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_NSIGHT_COMPUTE_VERSION=12.1.0-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE=cuda-nsight-compute-12-1=12.1.0-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_NVPROF_VERSION=12.1.55-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_NVPROF_DEV_PACKAGE=cuda-nvprof-12-1=12.1.55-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_DEV_PACKAGE_NAME=libnccl-dev

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_DEV_PACKAGE_VERSION=2.17.1-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NCCL_VERSION=2.17.1-1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_DEV_PACKAGE=libnccl-dev=2.17.1-1+cuda12.1

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

2023-11-10 06:02:04 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-dev-12-1=${NV_CUDA_CUDART_DEV_VERSION} cuda-command-line-tools-12-1=${NV_CUDA_LIB_VERSION} cuda-minimal-build-12-1=${NV_CUDA_LIB_VERSION} cuda-libraries-dev-12-1=${NV_CUDA_LIB_VERSION} cuda-nvml-dev-12-1=${NV_NVML_DEV_VERSION} ${NV_NVPROF_DEV_PACKAGE} ${NV_LIBNPP_DEV_PACKAGE} libcusparse-dev-12-1=${NV_LIBCUSPARSE_DEV_VERSION} ${NV_LIBCUBLAS_DEV_PACKAGE} ${NV_LIBNCCL_DEV_PACKAGE} ${NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit

2023-11-10 06:02:16 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_DEV_PACKAGE_NAME} ${NV_LIBNCCL_DEV_PACKAGE_NAME} # buildkit

2023-11-10 06:02:16 UTC (buildkit.dockerfile.v0)

ENV LIBRARY_PATH=/usr/local/cuda/lib64/stubs

2025-02-01 18:31:05 UTC (buildkit.dockerfile.v0)

ARG CUDA_VERSION=12.4.1

2025-02-01 18:31:05 UTC (buildkit.dockerfile.v0)

ARG PYTHON_VERSION=3.12

2025-02-01 18:31:05 UTC (buildkit.dockerfile.v0)

WORKDIR /vllm-workspace

2025-02-01 18:31:05 UTC (buildkit.dockerfile.v0)

ENV DEBIAN_FRONTEND=noninteractive

2025-02-01 18:31:05 UTC (buildkit.dockerfile.v0)

ARG TARGETPLATFORM

2025-02-01 18:31:06 UTC (buildkit.dockerfile.v0)

RUN |3 CUDA_VERSION=12.1.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit

2025-02-01 18:32:50 UTC (buildkit.dockerfile.v0)

RUN |3 CUDA_VERSION=12.1.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y ccache software-properties-common git curl wget sudo vim python3-pip && apt-get install -y ffmpeg libsm6 libxext6 libgl1 && add-apt-repository ppa:deadsnakes/ppa && apt-get update -y && apt-get install -y python${PYTHON_VERSION} python${PYTHON_VERSION}-dev python${PYTHON_VERSION}-venv libibverbs-dev && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PYTHON_VERSION} 1 && update-alternatives --set python3 /usr/bin/python${PYTHON_VERSION} && ln -sf /usr/bin/python${PYTHON_VERSION}-config /usr/bin/python3-config && curl -sS https://bootstrap.pypa.io/get-pip.py | python${PYTHON_VERSION} && python3 --version && python3 -m pip --version # buildkit

2025-02-01 18:32:51 UTC (buildkit.dockerfile.v0)

RUN |3 CUDA_VERSION=12.1.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit

2025-02-01 18:32:52 UTC (buildkit.dockerfile.v0)

RUN |3 CUDA_VERSION=12.1.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c if [ "$TARGETPLATFORM" = "linux/arm64" ]; then python3 -m pip install --index-url https://download.pytorch.org/whl/nightly/cu124 "torch==2.6.0.dev20241210+cu124" "torchvision==0.22.0.dev20241215"; fi # buildkit

2025-02-01 19:01:52 UTC (buildkit.dockerfile.v0)

RUN |3 CUDA_VERSION=12.1.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c python3 -m pip install dist/*.whl --verbose # buildkit

2025-02-01 19:02:51 UTC (buildkit.dockerfile.v0)

RUN |3 CUDA_VERSION=12.1.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c . /etc/environment && if [ "$TARGETPLATFORM" != "linux/arm64" ]; then python3 -m pip install https://wheels.vllm.ai/flashinfer/524304395bd1d8cd7d07db083859523fcaa246a4/flashinfer_python-0.2.0.post1-cp${PYTHON_VERSION_STR}-cp${PYTHON_VERSION_STR}-linux_x86_64.whl; fi # buildkit

2025-02-01 19:02:51 UTC (buildkit.dockerfile.v0)

COPY examples examples # buildkit

2025-02-01 19:02:51 UTC (buildkit.dockerfile.v0)

COPY requirements-build.txt requirements-build.txt # buildkit

2025-02-01 19:02:53 UTC (buildkit.dockerfile.v0)

RUN |3 CUDA_VERSION=12.1.0 PYTHON_VERSION=3.12 TARGETPLATFORM=linux/amd64 /bin/sh -c python3 -m pip install -r requirements-build.txt # buildkit

2025-02-01 19:03:05 UTC (buildkit.dockerfile.v0)

RUN /bin/sh -c if [ "$TARGETPLATFORM" = "linux/arm64" ]; then pip install accelerate hf_transfer 'modelscope!=1.15.0' 'bitsandbytes>=0.42.0' 'timm==0.9.10' boto3 runai-model-streamer runai-model-streamer[s3]; else pip install accelerate hf_transfer 'modelscope!=1.15.0' 'bitsandbytes>=0.45.0' 'timm==0.9.10' boto3 runai-model-streamer runai-model-streamer[s3]; fi # buildkit

2025-02-01 19:03:05 UTC (buildkit.dockerfile.v0)

ENV VLLM_USAGE_SOURCE=production-docker-image

2025-02-01 19:03:05 UTC (buildkit.dockerfile.v0)

ENTRYPOINT ["python3" "-m" "vllm.entrypoints.openai.api_server"]

Danger Zone
Delete Tag

Please be careful, as this will delete not just the tag reference but also the actual image content!

For example, when you have latest and v1.2.3 both pointing to the same image,
deleting latest will also permanently remove v1.2.3.

Delete