2026-01-18 05:42:08 UTC
8.38 GB
12.9.1
DEBIAN_FRONTENDnoninteractive
LD_LIBRARY_PATH/usr/local/nvidia/lib64:/usr/local/cuda/lib64:/usr/local/cuda/lib64
NVARCHx86_64
NVIDIA_DRIVER_CAPABILITIEScompute,utility
NVIDIA_REQUIRE_CUDAcuda>=12.9 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566 brand=unknown,driver>=570,driver<571 brand=grid,driver>=570,driver<571 brand=tesla,driver>=570,driver<571 brand=nvidia,driver>=570,driver<571 brand=quadro,driver>=570,driver<571 brand=quadrortx,driver>=570,driver<571 
brand=nvidiartx,driver>=570,driver<571 brand=vapps,driver>=570,driver<571 brand=vpc,driver>=570,driver<571 brand=vcs,driver>=570,driver<571 brand=vws,driver>=570,driver<571 brand=cloudgaming,driver>=570,driver<571
NVIDIA_VISIBLE_DEVICESall
NV_CUDA_CUDART_VERSION12.9.79-1
PATH/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
TORCH_CUDA_ARCH_LIST7.0 7.5 8.0 8.9 9.0 10.0 12.0
UV_HTTP_TIMEOUT500
UV_INDEX_STRATEGYunsafe-best-match
UV_LINK_MODEcopy
VLLM_USAGE_SOURCEproduction-docker-image
[#000] sha256:66587c81b81a58d07e40c48d900a1517516bbf58c4378c687d89d645824f5e5f - 0.34% (29 MB)
[#001] sha256:f29b1d4013a93a17a4d4acbb760170b608e6707e85419f0e1a2973233f1c0080 - 0.05% (4.43 MB)
[#002] sha256:340d44d2921c44112afe4f535a1a3bcfdc4eed5093388d098937942f7f883739 - 1.15% (98.7 MB)
[#003] sha256:59a4bcbddda3c45ff4949d35d2321b6eca9eaff7daae2334c99226bb19f60c3a - 0.0% (184 Bytes)
[#004] sha256:6e8af4fd0a071982e528b634ba99dec2474c21147f99748be708f36e10e3f4c2 - 0.0% (6.72 KB)
[#005] sha256:55b1331b4050ad984936587828fd2e951ec3dce414f241de27adfedafdab3be4 - 0.0% (104 Bytes)
[#006] sha256:406ae5a4205ee19034b8d4a490a201ddbbd21c53b0c5662e8bd48d806b8d29d1 - 0.0% (231 Bytes)
[#007] sha256:69ead450dd62f0ffc91ccb3f6e61d793e6e957b7a91701f2a031f24f44b309a0 - 2.55% (219 MB)
[#008] sha256:d675fbcc608e56af585135dd68619fc07bd81c8a9895c8511b031eb631d84455 - 15.84% (1.33 GB)
[#009] sha256:ea75fc3b9d01b81cdf85c6c52559d7a24a6714821916fbbf93dcc752aa95e5c7 - 0.52% (44.8 MB)
[#010] sha256:f37c35db391427610fffefcf524377f95ad5898ddacb5604938405f161c484fd - 0.0% (11.1 KB)
[#011] sha256:a60ee21ba56b4ddc630e4c1a63440a30bc4af2076bc95e694322f2d7df60dd4e - 0.0% (1.42 KB)
[#012] sha256:c56447a3ef0cf3bc6cd17a7f3efb1b3565074180ab9b190cb7a206cc25b4ef23 - 0.0% (474 Bytes)
[#013] sha256:93c928a4bce4b0fc13f2395a8c4dd6a177234c89060931b5bc6e2c76f52471bc - 56.88% (4.77 GB)
[#014] sha256:7876dfbaa644bf7317f99bb87802da2e214c857babefce798e6161652ed03746 - 14.28% (1.2 GB)
[#015] sha256:3c3f1d0595e6bcc00b579f103da10ad655d2324cb1dda98889b2d1606489f52d - 0.0% (897 Bytes)
[#016] sha256:e59d2252a06b281f63bd70f800b111ff460d0d7f695b61811464834cafeebd8d - 0.01% (525 KB)
[#017] sha256:b05de584548aa85b3e478f3661658a0c7d2fe017888838ff5701dd496d495dba - 1.08% (92.3 MB)
[#018] sha256:1b120389051a139b659611376015cfd99630790f15f01921f529c540d3720bf0 - 5.51% (473 MB)
[#019] sha256:0cfaccdd1b83a4de0f691849d42750b3f9be7f7a84f55dd9068fa934650ed637 - 0.0% (124 Bytes)
[#020] sha256:69ac373b231fa7fa4968adca2c179944ddcfdfb834efeb4e67dca138572c17c0 - 0.09% (7.61 MB)
[#021] sha256:1f1e31a3f818d1f9d26346e7114e35997b14d69d6e3a77385586334bf641dd72 - 1.16% (99.2 MB)
[#022] sha256:79eef2f4b1c346a9ee81943e8d389db21cd0a88c29a37656dd7d450c8f753de8 - 0.0% (200 KB)
[#023] sha256:9c21712adb3b7f3d09c48163c6b7fed124e24629b5667e3ef9ecea4f38ed6ace - 0.0% (175 KB)
[#024] sha256:786000a9e0a1c7cebf3966dc9bfedfe7802285b3a789a071a2d014f7417ab0c8 - 0.0% (8.2 KB)
[#025] sha256:a9f708721d22783c4f09f71ab200ebdac30ba661f90cf731edd8c136093dd44e - 0.56% (47.8 MB)
/bin/sh -c #(nop) ARG RELEASE
2025-07-14 16:33:29 UTC/bin/sh -c #(nop) ARG LAUNCHPAD_BUILD_ARCH
2025-07-14 16:33:29 UTC/bin/sh -c #(nop) LABEL org.opencontainers.image.ref.name=ubuntu
2025-07-14 16:33:29 UTC/bin/sh -c #(nop) LABEL org.opencontainers.image.version=22.04
2025-07-14 16:33:31 UTC/bin/sh -c #(nop) ADD file:415bbc01dfb447d002e2d8173e113ef025d2bbfa20f1205823fa699dc87a2019 in /
2025-07-14 16:33:32 UTC/bin/sh -c #(nop) CMD ["/bin/bash"]
2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)ENV NVARCH=x86_64
2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)ENV NVIDIA_REQUIRE_CUDA=cuda>=12.9 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566 brand=unknown,driver>=570,driver<571 brand=grid,driver>=570,driver<571 brand=tesla,driver>=570,driver<571 brand=nvidia,driver>=570,driver<571 brand=quadro,driver>=570,driver<571 
brand=quadrortx,driver>=570,driver<571 brand=nvidiartx,driver>=570,driver<571 brand=vapps,driver>=570,driver<571 brand=vpc,driver>=570,driver<571 brand=vcs,driver>=570,driver<571 brand=vws,driver>=570,driver<571 brand=cloudgaming,driver>=570,driver<571
2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_CUDART_VERSION=12.9.79-1
2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)ARG TARGETARCH
2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.1-1_all.deb && dpkg -i cuda-keyring_1.1-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit
2025-07-18 20:11:02 UTC (buildkit.dockerfile.v0)ENV CUDA_VERSION=12.9.1
2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-9=${NV_CUDA_CUDART_VERSION} cuda-compat-12-9 && rm -rf /var/lib/apt/lists/* # buildkit
2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/cuda/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit
2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)ENV PATH=/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64
2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)COPY NGC-DL-CONTAINER-LICENSE / # buildkit
2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)ENV NVIDIA_VISIBLE_DEVICES=all
2025-07-18 20:11:19 UTC (buildkit.dockerfile.v0)ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility
2026-01-18 05:23:08 UTC (buildkit.dockerfile.v0)ARG CUDA_VERSION
2026-01-18 05:23:08 UTC (buildkit.dockerfile.v0)ARG PYTHON_VERSION
2026-01-18 05:23:08 UTC (buildkit.dockerfile.v0)ARG DEADSNAKES_MIRROR_URL
2026-01-18 05:23:08 UTC (buildkit.dockerfile.v0)ARG DEADSNAKES_GPGKEY_URL
2026-01-18 05:23:08 UTC (buildkit.dockerfile.v0)ARG GET_PIP_URL
2026-01-18 05:23:08 UTC (buildkit.dockerfile.v0)ENV DEBIAN_FRONTEND=noninteractive
2026-01-18 05:23:08 UTC (buildkit.dockerfile.v0)WORKDIR /vllm-workspace
2026-01-18 05:23:49 UTC (buildkit.dockerfile.v0)RUN |5 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/sh -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit
2026-01-18 05:27:30 UTC (buildkit.dockerfile.v0)RUN |5 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/sh -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y --no-install-recommends software-properties-common curl sudo python3-pip ffmpeg libsm6 libxext6 libgl1 && if [ ! -z ${DEADSNAKES_MIRROR_URL} ] ; then if [ ! -z "${DEADSNAKES_GPGKEY_URL}" ] ; then mkdir -p -m 0755 /etc/apt/keyrings ; curl -L ${DEADSNAKES_GPGKEY_URL} | gpg --dearmor > /etc/apt/keyrings/deadsnakes.gpg ; sudo chmod 644 /etc/apt/keyrings/deadsnakes.gpg ; echo "deb [signed-by=/etc/apt/keyrings/deadsnakes.gpg] ${DEADSNAKES_MIRROR_URL} $(lsb_release -cs) main" > /etc/apt/sources.list.d/deadsnakes.list ; fi ; else for i in 1 2 3; do add-apt-repository -y ppa:deadsnakes/ppa && break || { echo "Attempt $i failed, retrying in 5s..."; sleep 5; }; done ; fi && apt-get update -y && apt-get install -y --no-install-recommends python${PYTHON_VERSION} python${PYTHON_VERSION}-dev python${PYTHON_VERSION}-venv libibverbs-dev && rm -rf /var/lib/apt/lists/* && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PYTHON_VERSION} 1 && update-alternatives --set python3 /usr/bin/python${PYTHON_VERSION} && ln -sf /usr/bin/python${PYTHON_VERSION}-config /usr/bin/python3-config && curl -sS ${GET_PIP_URL} | python${PYTHON_VERSION} && python3 --version && python3 -m pip --version # buildkit
2026-01-18 05:28:48 UTC (buildkit.dockerfile.v0)RUN |5 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/sh -c CUDA_VERSION_DASH=$(echo $CUDA_VERSION | cut -d. -f1,2 | tr '.' '-') && apt-get update -y && apt-get install -y --no-install-recommends cuda-nvcc-${CUDA_VERSION_DASH} cuda-cudart-${CUDA_VERSION_DASH} cuda-nvrtc-${CUDA_VERSION_DASH} cuda-cuobjdump-${CUDA_VERSION_DASH} libcurand-dev-${CUDA_VERSION_DASH} libcublas-${CUDA_VERSION_DASH} libnccl-dev && rm -rf /var/lib/apt/lists/* # buildkit
2026-01-18 05:28:56 UTC (buildkit.dockerfile.v0)RUN |5 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/sh -c python3 -m pip install uv # buildkit
2026-01-18 05:28:56 UTC (buildkit.dockerfile.v0)ENV UV_HTTP_TIMEOUT=500
2026-01-18 05:28:56 UTC (buildkit.dockerfile.v0)ENV UV_INDEX_STRATEGY=unsafe-best-match
2026-01-18 05:28:56 UTC (buildkit.dockerfile.v0)ENV UV_LINK_MODE=copy
2026-01-18 05:28:58 UTC (buildkit.dockerfile.v0)RUN |5 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/sh -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit
2026-01-18 05:28:58 UTC (buildkit.dockerfile.v0)ARG PYTORCH_CUDA_INDEX_BASE_URL
2026-01-18 05:28:59 UTC (buildkit.dockerfile.v0)COPY requirements/common.txt /tmp/common.txt # buildkit
2026-01-18 05:29:01 UTC (buildkit.dockerfile.v0)COPY requirements/cuda.txt /tmp/requirements-cuda.txt # buildkit
2026-01-18 05:30:25 UTC (buildkit.dockerfile.v0)RUN |6 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl /bin/sh -c uv pip install --system -r /tmp/requirements-cuda.txt --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') && rm /tmp/requirements-cuda.txt /tmp/common.txt # buildkit
2026-01-18 05:30:25 UTC (buildkit.dockerfile.v0)ARG FLASHINFER_VERSION=0.5.3
2026-01-18 05:32:19 UTC (buildkit.dockerfile.v0)RUN |7 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 /bin/sh -c uv pip install --system flashinfer-cubin==${FLASHINFER_VERSION} && uv pip install --system flashinfer-jit-cache==${FLASHINFER_VERSION} --extra-index-url https://flashinfer.ai/whl/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') && flashinfer show-config # buildkit
2026-01-18 05:32:19 UTC (buildkit.dockerfile.v0)ARG GDRCOPY_CUDA_VERSION=12.8
2026-01-18 05:32:19 UTC (buildkit.dockerfile.v0)ARG GDRCOPY_OS_VERSION=Ubuntu22_04
2026-01-18 05:32:19 UTC (buildkit.dockerfile.v0)ARG TARGETPLATFORM
2026-01-18 05:32:19 UTC (buildkit.dockerfile.v0)COPY tools/install_gdrcopy.sh /tmp/install_gdrcopy.sh # buildkit
2026-01-18 05:32:27 UTC (buildkit.dockerfile.v0)RUN |10 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 TARGETPLATFORM=linux/amd64 /bin/sh -c set -eux; case "${TARGETPLATFORM}" in linux/arm64) UUARCH="aarch64" ;; linux/amd64) UUARCH="x64" ;; *) echo "Unsupported TARGETPLATFORM: ${TARGETPLATFORM}" >&2; exit 1 ;; esac; /tmp/install_gdrcopy.sh "${GDRCOPY_OS_VERSION}" "${GDRCOPY_CUDA_VERSION}" "${UUARCH}" && rm /tmp/install_gdrcopy.sh # buildkit
2026-01-18 05:32:35 UTC (buildkit.dockerfile.v0)RUN |10 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 TARGETPLATFORM=linux/amd64 /bin/sh -c if [ "$TARGETPLATFORM" = "linux/arm64" ]; then BITSANDBYTES_VERSION="0.42.0"; else BITSANDBYTES_VERSION="0.46.1"; fi; uv pip install --system accelerate hf_transfer modelscope "bitsandbytes>=${BITSANDBYTES_VERSION}" 'timm>=1.0.17' 'runai-model-streamer[s3,gcs]>=0.15.3' # buildkit
2026-01-18 05:32:35 UTC (buildkit.dockerfile.v0)ARG PIP_INDEX_URL UV_INDEX_URL
2026-01-18 05:32:35 UTC (buildkit.dockerfile.v0)ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL
2026-01-18 05:32:35 UTC (buildkit.dockerfile.v0)ARG PYTORCH_CUDA_INDEX_BASE_URL
2026-01-18 05:32:35 UTC (buildkit.dockerfile.v0)ARG PIP_KEYRING_PROVIDER UV_KEYRING_PROVIDER
2026-01-18 05:42:00 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 TARGETPLATFORM=linux/amd64 PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/sh -c uv pip install --system dist/*.whl --verbose --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit
2026-01-18 05:42:00 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 TARGETPLATFORM=linux/amd64 PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/sh -c . /etc/environment && uv pip list # buildkit
2026-01-18 05:42:01 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 TARGETPLATFORM=linux/amd64 PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/sh -c sh -c 'if ls /tmp/deepgemm/dist/*.whl >/dev/null 2>&1; then uv pip install --system /tmp/deepgemm/dist/*.whl; else echo "No DeepGEMM wheels to install; skipping."; fi' # buildkit
2026-01-18 05:42:01 UTC (buildkit.dockerfile.v0)ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64:/usr/local/cuda/lib64
2026-01-18 05:42:04 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 TARGETPLATFORM=linux/amd64 PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/sh -c uv pip install --system ep_kernels/dist/*.whl --verbose --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit
2026-01-18 05:42:04 UTC (buildkit.dockerfile.v0)ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib64:/usr/local/cuda/lib64:/usr/local/cuda/lib64
2026-01-18 05:42:04 UTC (buildkit.dockerfile.v0)COPY examples examples # buildkit
2026-01-18 05:42:04 UTC (buildkit.dockerfile.v0)COPY benchmarks benchmarks # buildkit
2026-01-18 05:42:04 UTC (buildkit.dockerfile.v0)COPY ./vllm/collect_env.py . # buildkit
2026-01-18 05:42:04 UTC (buildkit.dockerfile.v0)ARG TARGETPLATFORM
2026-01-18 05:42:04 UTC (buildkit.dockerfile.v0)ARG INSTALL_KV_CONNECTORS=false
2026-01-18 05:42:04 UTC (buildkit.dockerfile.v0)ARG CUDA_VERSION
2026-01-18 05:42:04 UTC (buildkit.dockerfile.v0)ARG PIP_INDEX_URL UV_INDEX_URL
2026-01-18 05:42:04 UTC (buildkit.dockerfile.v0)ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL
2026-01-18 05:42:04 UTC (buildkit.dockerfile.v0)ENV UV_HTTP_TIMEOUT=500
2026-01-18 05:42:04 UTC (buildkit.dockerfile.v0)ARG torch_cuda_arch_list=7.0 7.5 8.0 8.9 9.0 10.0 12.0
2026-01-18 05:42:04 UTC (buildkit.dockerfile.v0)ENV TORCH_CUDA_ARCH_LIST=7.0 7.5 8.0 8.9 9.0 10.0 12.0
2026-01-18 05:42:08 UTC (buildkit.dockerfile.v0)RUN |8 TARGETPLATFORM=linux/amd64 INSTALL_KV_CONNECTORS=true CUDA_VERSION=12.9.1 PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= torch_cuda_arch_list=7.0 7.5 8.0 8.9 9.0 10.0 12.0 /bin/sh -c CUDA_MAJOR="${CUDA_VERSION%%.*}"; CUDA_VERSION_DASH=$(echo $CUDA_VERSION | cut -d. -f1,2 | tr '.' '-'); CUDA_HOME=/usr/local/cuda; BUILD_PKGS="libcusparse-dev-${CUDA_VERSION_DASH} libcublas-dev-${CUDA_VERSION_DASH} libcusolver-dev-${CUDA_VERSION_DASH}"; if [ "$INSTALL_KV_CONNECTORS" = "true" ]; then if [ "$CUDA_MAJOR" -ge 13 ]; then uv pip install --system nixl-cu13; fi; uv pip install --system -r /tmp/kv_connectors.txt --no-build || ( apt-get update -y && apt-get install -y --no-install-recommends ${BUILD_PKGS} && uv pip install --system -r /tmp/kv_connectors.txt --no-build-isolation && apt-get purge -y ${BUILD_PKGS} && rm -rf /var/lib/apt/lists/* ); fi # buildkit
2026-01-18 05:42:08 UTC (buildkit.dockerfile.v0)ENV VLLM_USAGE_SOURCE=production-docker-image
2026-01-18 05:42:08 UTC (buildkit.dockerfile.v0)ENTRYPOINT ["vllm" "serve"]
2026-01-18 05:50:30 UTC
9 GB
12.9.1
DEBIAN_FRONTENDnoninteractive
LD_LIBRARY_PATH/usr/local/nvidia/lib64:/usr/local/cuda/lib64:/usr/local/cuda/lib64
NVARCHsbsa
NVIDIA_DRIVER_CAPABILITIEScompute,utility
NVIDIA_REQUIRE_CUDAcuda>=12.9 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566 brand=unknown,driver>=570,driver<571 brand=grid,driver>=570,driver<571 brand=tesla,driver>=570,driver<571 brand=nvidia,driver>=570,driver<571 brand=quadro,driver>=570,driver<571 brand=quadrortx,driver>=570,driver<571 
brand=nvidiartx,driver>=570,driver<571 brand=vapps,driver>=570,driver<571 brand=vpc,driver>=570,driver<571 brand=vcs,driver>=570,driver<571 brand=vws,driver>=570,driver<571 brand=cloudgaming,driver>=570,driver<571
NVIDIA_VISIBLE_DEVICESall
NV_CUDA_CUDART_VERSION12.9.79-1
PATH/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
TORCH_CUDA_ARCH_LIST8.7 8.9 9.0 10.0+PTX 12.0
UV_HTTP_TIMEOUT500
UV_INDEX_STRATEGYunsafe-best-match
UV_LINK_MODEcopy
VLLM_USAGE_SOURCEproduction-docker-image
[#000] sha256:2ea2730b4ab400d71167ddb8627f741637496aa57128fdfc248d6a9f799d76e9 - 0.29% (27.1 MB)
[#001] sha256:7aa2d0bb5c94f1cf869e71e4db856d2ca0733f5eaab55dd514441da9616abb35 - 0.05% (4.38 MB)
[#002] sha256:5136ae4e75ffd61960e9220c7d7625a3ee213ff63c25fdc24e85bfe229b16ab5 - 1.01% (93.1 MB)
[#003] sha256:6f760a753c5e1fc35281126d63b6ca9bef93e49f89a826a2bc2786e293d88f00 - 0.0% (182 Bytes)
[#004] sha256:6e8af4fd0a071982e528b634ba99dec2474c21147f99748be708f36e10e3f4c2 - 0.0% (6.72 KB)
[#005] sha256:a9cf6d711706981051ba7cfa2daca38c805c57710995db3825bf850ee4c1d0b1 - 0.0% (104 Bytes)
[#006] sha256:2fe7d9180635e637090440a2173081a5ed518704b8f87d7ea88bc6dd2542ceb3 - 0.0% (231 Bytes)
[#007] sha256:19361719c3be476808b05a5a7eb3c90551b449d97d5de8fc038ffe20b02052dd - 2.22% (204 MB)
[#008] sha256:ea6771bc4fa698a5ebea29413fa8e1aa29b19a41a33759c0537771aa504a5462 - 14.16% (1.27 GB)
[#009] sha256:3c1f609ffcf0c74694a46e3402213835d370835d215962b942c8d2a20712fec5 - 0.47% (43 MB)
[#010] sha256:a0fbaa954ec7cab4b810f121b8e3aa698a52596081b5bc698850d7e894e06433 - 0.0% (10.8 KB)
[#011] sha256:960554242682852d72169423589edcd2bc4dd5f4d2f9eff79af64dae16833afb - 0.0% (1.42 KB)
[#012] sha256:b04f1ef92d1d12005d72c9ace5e51ce8002c798d4ab8ab361d05aa06cb361df0 - 0.0% (476 Bytes)
[#013] sha256:849791073d41f996e0f76b3735dbe21bde7d6f07413876a7a553b60fcca68f3e - 45.38% (4.08 GB)
[#014] sha256:2792a783c115e0e5fc60f401658739a2f063f4c87525803466ceb2630f55dda8 - 13.21% (1.19 GB)
[#015] sha256:c14813221e6a8ddabe8925a55573c5de6692a4d4786e817883ef95725641dd29 - 0.0% (897 Bytes)
[#016] sha256:9c61b1d12de9c05a654940644f21f716d9be6f884085dc243e2c5ba44eb3193c - 0.01% (522 KB)
[#017] sha256:d78a8430a7fc72d88b46ac45690ea0ecc7aa3f75d895934d144e5076a23706e7 - 3.67% (338 MB)
[#018] sha256:5f81dbf46f76e2779b64a84ce899020904877ac746fa21d70b79fe68f2780436 - 7.59% (700 MB)
[#019] sha256:0350b340d92faf868a3042a407afc763d6aaef0d034a7aa63cd9bb7000528cc3 - 0.0% (124 Bytes)
[#020] sha256:473ba986ca9ddb05966962e441f2937e5aedb653560c94fdce334baffd9b3bd9 - 0.08% (7.44 MB)
[#021] sha256:65c899b4f33a11a56b5e398c28867bfdef859b283266c4f94f51a72f71ac4e0f - 1.07% (99 MB)
[#022] sha256:ac08208ebe9d160db1cffa883056ac2402aebd5d491862e2d55397aa770c4fdc - 0.0% (200 KB)
[#023] sha256:b4991719dfbaa616e471f839c5756ef8bf03984778a74b2420572d9332449704 - 0.0% (175 KB)
[#024] sha256:0ff96fb5444667f5fb9b63f87725778a95bffd76334fc6b397162171111c5f4d - 0.0% (8.2 KB)
[#025] sha256:d588c9c4d0144cad274b6dcd1eda76c1b19acbb0da4fc621b38ca7c766099595 - 10.8% (996 MB)
/bin/sh -c #(nop) ARG RELEASE
2025-07-14 16:34:14 UTC/bin/sh -c #(nop) ARG LAUNCHPAD_BUILD_ARCH
2025-07-14 16:34:14 UTC/bin/sh -c #(nop) LABEL org.opencontainers.image.ref.name=ubuntu
2025-07-14 16:34:14 UTC/bin/sh -c #(nop) LABEL org.opencontainers.image.version=22.04
2025-07-14 16:34:16 UTC/bin/sh -c #(nop) ADD file:834c1c2a4c7753a37759a9b21f64a990572643eee18669b1faa782fee45355ed in /
2025-07-14 16:34:17 UTC/bin/sh -c #(nop) CMD ["/bin/bash"]
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)ENV NVARCH=sbsa
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)ENV NVIDIA_REQUIRE_CUDA=cuda>=12.9 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566 brand=unknown,driver>=570,driver<571 brand=grid,driver>=570,driver<571 brand=tesla,driver>=570,driver<571 brand=nvidia,driver>=570,driver<571 brand=quadro,driver>=570,driver<571 
brand=quadrortx,driver>=570,driver<571 brand=nvidiartx,driver>=570,driver<571 brand=vapps,driver>=570,driver<571 brand=vpc,driver>=570,driver<571 brand=vcs,driver>=570,driver<571 brand=vws,driver>=570,driver<571 brand=cloudgaming,driver>=570,driver<571
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_CUDART_VERSION=12.9.79-1
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)ARG TARGETARCH
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=arm64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.1-1_all.deb && dpkg -i cuda-keyring_1.1-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit
2025-07-18 20:12:35 UTC (buildkit.dockerfile.v0)ENV CUDA_VERSION=12.9.1
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=arm64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-9=${NV_CUDA_CUDART_VERSION} cuda-compat-12-9 && rm -rf /var/lib/apt/lists/* # buildkit
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=arm64 /bin/sh -c echo "/usr/local/cuda/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)ENV PATH=/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)COPY NGC-DL-CONTAINER-LICENSE / # buildkit
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)ENV NVIDIA_VISIBLE_DEVICES=all
2025-07-18 20:13:38 UTC (buildkit.dockerfile.v0)ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility
2026-01-18 05:25:34 UTC (buildkit.dockerfile.v0)ARG CUDA_VERSION
2026-01-18 05:25:34 UTC (buildkit.dockerfile.v0)ARG PYTHON_VERSION
2026-01-18 05:25:34 UTC (buildkit.dockerfile.v0)ARG DEADSNAKES_MIRROR_URL
2026-01-18 05:25:34 UTC (buildkit.dockerfile.v0)ARG DEADSNAKES_GPGKEY_URL
2026-01-18 05:25:34 UTC (buildkit.dockerfile.v0)ARG GET_PIP_URL
2026-01-18 05:25:34 UTC (buildkit.dockerfile.v0)ENV DEBIAN_FRONTEND=noninteractive
2026-01-18 05:25:34 UTC (buildkit.dockerfile.v0)WORKDIR /vllm-workspace
2026-01-18 05:26:24 UTC (buildkit.dockerfile.v0)RUN |5 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/sh -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit
2026-01-18 05:29:17 UTC (buildkit.dockerfile.v0)RUN |5 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/sh -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y --no-install-recommends software-properties-common curl sudo python3-pip ffmpeg libsm6 libxext6 libgl1 && if [ ! -z ${DEADSNAKES_MIRROR_URL} ] ; then if [ ! -z "${DEADSNAKES_GPGKEY_URL}" ] ; then mkdir -p -m 0755 /etc/apt/keyrings ; curl -L ${DEADSNAKES_GPGKEY_URL} | gpg --dearmor > /etc/apt/keyrings/deadsnakes.gpg ; sudo chmod 644 /etc/apt/keyrings/deadsnakes.gpg ; echo "deb [signed-by=/etc/apt/keyrings/deadsnakes.gpg] ${DEADSNAKES_MIRROR_URL} $(lsb_release -cs) main" > /etc/apt/sources.list.d/deadsnakes.list ; fi ; else for i in 1 2 3; do add-apt-repository -y ppa:deadsnakes/ppa && break || { echo "Attempt $i failed, retrying in 5s..."; sleep 5; }; done ; fi && apt-get update -y && apt-get install -y --no-install-recommends python${PYTHON_VERSION} python${PYTHON_VERSION}-dev python${PYTHON_VERSION}-venv libibverbs-dev && rm -rf /var/lib/apt/lists/* && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PYTHON_VERSION} 1 && update-alternatives --set python3 /usr/bin/python${PYTHON_VERSION} && ln -sf /usr/bin/python${PYTHON_VERSION}-config /usr/bin/python3-config && curl -sS ${GET_PIP_URL} | python${PYTHON_VERSION} && python3 --version && python3 -m pip --version # buildkit
2026-01-18 05:30:28 UTC (buildkit.dockerfile.v0)RUN |5 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/sh -c CUDA_VERSION_DASH=$(echo $CUDA_VERSION | cut -d. -f1,2 | tr '.' '-') && apt-get update -y && apt-get install -y --no-install-recommends cuda-nvcc-${CUDA_VERSION_DASH} cuda-cudart-${CUDA_VERSION_DASH} cuda-nvrtc-${CUDA_VERSION_DASH} cuda-cuobjdump-${CUDA_VERSION_DASH} libcurand-dev-${CUDA_VERSION_DASH} libcublas-${CUDA_VERSION_DASH} libnccl-dev && rm -rf /var/lib/apt/lists/* # buildkit
2026-01-18 05:30:33 UTC (buildkit.dockerfile.v0)RUN |5 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/sh -c python3 -m pip install uv # buildkit
2026-01-18 05:30:33 UTC (buildkit.dockerfile.v0)ENV UV_HTTP_TIMEOUT=500
2026-01-18 05:30:33 UTC (buildkit.dockerfile.v0)ENV UV_INDEX_STRATEGY=unsafe-best-match
2026-01-18 05:30:33 UTC (buildkit.dockerfile.v0)ENV UV_LINK_MODE=copy
2026-01-18 05:30:46 UTC (buildkit.dockerfile.v0)RUN |5 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/sh -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit
2026-01-18 05:30:46 UTC (buildkit.dockerfile.v0)ARG PYTORCH_CUDA_INDEX_BASE_URL
2026-01-18 05:30:52 UTC (buildkit.dockerfile.v0)COPY requirements/common.txt /tmp/common.txt # buildkit
2026-01-18 05:30:53 UTC (buildkit.dockerfile.v0)COPY requirements/cuda.txt /tmp/requirements-cuda.txt # buildkit
2026-01-18 05:32:03 UTC (buildkit.dockerfile.v0)RUN |6 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl /bin/sh -c uv pip install --system -r /tmp/requirements-cuda.txt --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') && rm /tmp/requirements-cuda.txt /tmp/common.txt # buildkit
2026-01-18 05:32:03 UTC (buildkit.dockerfile.v0)ARG FLASHINFER_VERSION=0.5.3
2026-01-18 05:33:48 UTC (buildkit.dockerfile.v0)RUN |7 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 /bin/sh -c uv pip install --system flashinfer-cubin==${FLASHINFER_VERSION} && uv pip install --system flashinfer-jit-cache==${FLASHINFER_VERSION} --extra-index-url https://flashinfer.ai/whl/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') && flashinfer show-config # buildkit
2026-01-18 05:33:48 UTC (buildkit.dockerfile.v0)ARG GDRCOPY_CUDA_VERSION=12.8
2026-01-18 05:33:48 UTC (buildkit.dockerfile.v0)ARG GDRCOPY_OS_VERSION=Ubuntu22_04
2026-01-18 05:33:48 UTC (buildkit.dockerfile.v0)ARG TARGETPLATFORM
2026-01-18 05:33:48 UTC (buildkit.dockerfile.v0)COPY tools/install_gdrcopy.sh /tmp/install_gdrcopy.sh # buildkit
2026-01-18 05:33:55 UTC (buildkit.dockerfile.v0)RUN |10 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 TARGETPLATFORM=linux/arm64 /bin/sh -c set -eux; case "${TARGETPLATFORM}" in linux/arm64) UUARCH="aarch64" ;; linux/amd64) UUARCH="x64" ;; *) echo "Unsupported TARGETPLATFORM: ${TARGETPLATFORM}" >&2; exit 1 ;; esac; /tmp/install_gdrcopy.sh "${GDRCOPY_OS_VERSION}" "${GDRCOPY_CUDA_VERSION}" "${UUARCH}" && rm /tmp/install_gdrcopy.sh # buildkit
2026-01-18 05:34:04 UTC (buildkit.dockerfile.v0)RUN |10 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 TARGETPLATFORM=linux/arm64 /bin/sh -c if [ "$TARGETPLATFORM" = "linux/arm64" ]; then BITSANDBYTES_VERSION="0.42.0"; else BITSANDBYTES_VERSION="0.46.1"; fi; uv pip install --system accelerate hf_transfer modelscope "bitsandbytes>=${BITSANDBYTES_VERSION}" 'timm>=1.0.17' 'runai-model-streamer[s3,gcs]>=0.15.3' # buildkit
2026-01-18 05:34:04 UTC (buildkit.dockerfile.v0)ARG PIP_INDEX_URL UV_INDEX_URL
2026-01-18 05:34:04 UTC (buildkit.dockerfile.v0)ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL
2026-01-18 05:34:04 UTC (buildkit.dockerfile.v0)ARG PYTORCH_CUDA_INDEX_BASE_URL
2026-01-18 05:34:04 UTC (buildkit.dockerfile.v0)ARG PIP_KEYRING_PROVIDER UV_KEYRING_PROVIDER
2026-01-18 05:44:50 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 TARGETPLATFORM=linux/arm64 PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/sh -c uv pip install --system dist/*.whl --verbose --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit
2026-01-18 05:44:51 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 TARGETPLATFORM=linux/arm64 PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/sh -c . /etc/environment && uv pip list # buildkit
2026-01-18 05:44:52 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 TARGETPLATFORM=linux/arm64 PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/sh -c sh -c 'if ls /tmp/deepgemm/dist/*.whl >/dev/null 2>&1; then uv pip install --system /tmp/deepgemm/dist/*.whl; else echo "No DeepGEMM wheels to install; skipping."; fi' # buildkit
2026-01-18 05:44:52 UTC (buildkit.dockerfile.v0)ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64:/usr/local/cuda/lib64
2026-01-18 05:44:55 UTC (buildkit.dockerfile.v0)RUN |17 CUDA_VERSION=12.9.1 PYTHON_VERSION=3.12 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl FLASHINFER_VERSION=0.5.3 GDRCOPY_CUDA_VERSION=12.8 GDRCOPY_OS_VERSION=Ubuntu22_04 TARGETPLATFORM=linux/arm64 PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/sh -c uv pip install --system ep_kernels/dist/*.whl --verbose --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit
2026-01-18 05:44:55 UTC (buildkit.dockerfile.v0)ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib64:/usr/local/cuda/lib64:/usr/local/cuda/lib64
2026-01-18 05:44:55 UTC (buildkit.dockerfile.v0)COPY examples examples # buildkit
2026-01-18 05:44:55 UTC (buildkit.dockerfile.v0)COPY benchmarks benchmarks # buildkit
2026-01-18 05:44:55 UTC (buildkit.dockerfile.v0)COPY ./vllm/collect_env.py . # buildkit
2026-01-18 05:44:55 UTC (buildkit.dockerfile.v0)ARG TARGETPLATFORM
2026-01-18 05:44:55 UTC (buildkit.dockerfile.v0)ARG INSTALL_KV_CONNECTORS=false
2026-01-18 05:44:55 UTC (buildkit.dockerfile.v0)ARG CUDA_VERSION
2026-01-18 05:44:55 UTC (buildkit.dockerfile.v0)ARG PIP_INDEX_URL UV_INDEX_URL
2026-01-18 05:44:55 UTC (buildkit.dockerfile.v0)ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL
2026-01-18 05:44:55 UTC (buildkit.dockerfile.v0)ENV UV_HTTP_TIMEOUT=500
2026-01-18 05:44:55 UTC (buildkit.dockerfile.v0)ARG torch_cuda_arch_list=7.0 7.5 8.0 8.9 9.0 10.0 12.0
2026-01-18 05:44:55 UTC (buildkit.dockerfile.v0)ENV TORCH_CUDA_ARCH_LIST=8.7 8.9 9.0 10.0+PTX 12.0
2026-01-18 05:50:30 UTC (buildkit.dockerfile.v0)RUN |8 TARGETPLATFORM=linux/arm64 INSTALL_KV_CONNECTORS=true CUDA_VERSION=12.9.1 PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= torch_cuda_arch_list=8.7 8.9 9.0 10.0+PTX 12.0 /bin/sh -c CUDA_MAJOR="${CUDA_VERSION%%.*}"; CUDA_VERSION_DASH=$(echo $CUDA_VERSION | cut -d. -f1,2 | tr '.' '-'); CUDA_HOME=/usr/local/cuda; BUILD_PKGS="libcusparse-dev-${CUDA_VERSION_DASH} libcublas-dev-${CUDA_VERSION_DASH} libcusolver-dev-${CUDA_VERSION_DASH}"; if [ "$INSTALL_KV_CONNECTORS" = "true" ]; then if [ "$CUDA_MAJOR" -ge 13 ]; then uv pip install --system nixl-cu13; fi; uv pip install --system -r /tmp/kv_connectors.txt --no-build || ( apt-get update -y && apt-get install -y --no-install-recommends ${BUILD_PKGS} && uv pip install --system -r /tmp/kv_connectors.txt --no-build-isolation && apt-get purge -y ${BUILD_PKGS} && rm -rf /var/lib/apt/lists/* ); fi # buildkit
2026-01-18 05:50:30 UTC (buildkit.dockerfile.v0)ENV VLLM_USAGE_SOURCE=production-docker-image
2026-01-18 05:50:30 UTC (buildkit.dockerfile.v0)ENTRYPOINT ["vllm" "serve"]
Please be careful as this will not just delete the reference but also the actual content!
For example, when you have latest and v1.2.3 both pointing to the same image,
the deletion of latest will also permanently remove v1.2.3.