Namespace
approachingai
Image / Tag
ktransformers:latest
Content Digest
sha256:8476770c0693c7fb1a773d9570509c3d45011c29899eb10b62640fac6ed98e66
Details
Created

2026-03-05 08:13:01 UTC

Size

14.5 GB

Content Digest
Labels
  • com.nvidia.cudnn.version
    9.8.0.87-1
  • maintainer
    NVIDIA CORPORATION <cudatools@nvidia.com>
  • org.opencontainers.image.ref.name
    ubuntu
  • org.opencontainers.image.version
    24.04

Environment
CUDA_HOME

/usr/local/cuda

CUDA_VERSION

12.8.1

DEBIAN_FRONTEND

noninteractive

FLASHINFER_VERSION

0.5.3

GDRCOPY_HOME

/usr/src/gdrdrv-2.5.1/

GIT_SSL_NO_VERIFY

1

HTTPS_PROXY

http://127.0.0.1:7890

HTTP_PROXY

http://127.0.0.1:7890

LANG

en_US.UTF-8

LANGUAGE

en_US:en

LC_ALL

en_US.UTF-8

LD_LIBRARY_PATH

/usr/local/cuda/lib64:/usr/local/nvidia/lib:/usr/local/nvidia/lib64

LIBRARY_PATH

/usr/local/cuda/lib64/stubs

NCCL_VERSION

2.25.1-1

NVARCH

x86_64

NVIDIA_DRIVER_CAPABILITIES

compute,utility

NVIDIA_PRODUCT_NAME

CUDA

NVIDIA_REQUIRE_CUDA

cuda>=12.8 brand=unknown,driver>=470,driver<471 brand=grid,driver>=470,driver<471 brand=tesla,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=vapps,driver>=470,driver<471 brand=vpc,driver>=470,driver<471 brand=vcs,driver>=470,driver<471 brand=vws,driver>=470,driver<471 brand=cloudgaming,driver>=470,driver<471 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566

NVIDIA_VISIBLE_DEVICES

all

NV_CUDA_CUDART_DEV_VERSION

12.8.90-1

NV_CUDA_CUDART_VERSION

12.8.90-1

NV_CUDA_LIB_VERSION

12.8.1-1

NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE

cuda-nsight-compute-12-8=12.8.1-1

NV_CUDA_NSIGHT_COMPUTE_VERSION

12.8.1-1

NV_CUDNN_PACKAGE

libcudnn9-cuda-12=9.8.0.87-1

NV_CUDNN_PACKAGE_DEV

libcudnn9-dev-cuda-12=9.8.0.87-1

NV_CUDNN_PACKAGE_NAME

libcudnn9-cuda-12

NV_CUDNN_VERSION

9.8.0.87-1

NV_LIBCUBLAS_DEV_PACKAGE

libcublas-dev-12-8=12.8.4.1-1

NV_LIBCUBLAS_DEV_PACKAGE_NAME

libcublas-dev-12-8

NV_LIBCUBLAS_DEV_VERSION

12.8.4.1-1

NV_LIBCUBLAS_PACKAGE

libcublas-12-8=12.8.4.1-1

NV_LIBCUBLAS_PACKAGE_NAME

libcublas-12-8

NV_LIBCUBLAS_VERSION

12.8.4.1-1

NV_LIBCUSPARSE_DEV_VERSION

12.5.8.93-1

NV_LIBCUSPARSE_VERSION

12.5.8.93-1

NV_LIBNCCL_DEV_PACKAGE

libnccl-dev=2.25.1-1+cuda12.8

NV_LIBNCCL_DEV_PACKAGE_NAME

libnccl-dev

NV_LIBNCCL_DEV_PACKAGE_VERSION

2.25.1-1

NV_LIBNCCL_PACKAGE

libnccl2=2.25.1-1+cuda12.8

NV_LIBNCCL_PACKAGE_NAME

libnccl2

NV_LIBNCCL_PACKAGE_VERSION

2.25.1-1

NV_LIBNPP_DEV_PACKAGE

libnpp-dev-12-8=12.3.3.100-1

NV_LIBNPP_DEV_VERSION

12.3.3.100-1

NV_LIBNPP_PACKAGE

libnpp-12-8=12.3.3.100-1

NV_LIBNPP_VERSION

12.3.3.100-1

NV_NVML_DEV_VERSION

12.8.90-1

NV_NVPROF_DEV_PACKAGE

cuda-nvprof-12-8=12.8.90-1

NV_NVPROF_VERSION

12.8.90-1

NV_NVTX_VERSION

12.8.90-1

PATH

/opt/miniconda3/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/local/nvidia/bin

http_proxy

http://127.0.0.1:7890

https_proxy

http://127.0.0.1:7890


Layers

[#000] sha256:107a4fb0af3829758fca8bb809bb86ccb87dd630e4d61110103466886f7b0746 - 0.2% (29.2 MB)

[#001] sha256:a102f36d092c0e9e0bef8c97854f606af9156aa36ab408e6fa4b88e27124a7e6 - 0.04% (6.63 MB)

[#002] sha256:05ec76e31584ec109785cc7045bd88df0240411233c2fcdad66b621c662034c0 - 0.41% (61.3 MB)

[#003] sha256:398182656c471d6ecca3c2d6d30e97193b40ffc8028a94515093960322f3d64e - 0.0% (183 Bytes)

[#004] sha256:73389fbd088f5ed5d9fd258baced59de092978b4f483920ea6d074522a105119 - 0.0% (6.72 KB)

[#005] sha256:cbb9175a9bc5f6553f8c0c5025ea9521898b8a3956ee24798dc35c24c6185053 - 13.21% (1.92 GB)

[#006] sha256:3d6ab8c799cda2f4c6a6277b0e24dd2231c5de83b0316968b7cce81156bb8be0 - 0.0% (58.2 KB)

[#007] sha256:7209097bfb98d6f8b422984480f1fddead5ea62f8900ff6b6548e060b71aca76 - 0.0% (1.64 KB)

[#008] sha256:545a3ada5b6bc612a11c13a659775d67eeda5a61615e7f49c76ecd24adcad626 - 0.0% (1.49 KB)

[#009] sha256:abf026459f528efac0543168ff07d7037e9415fe3eb956b82f8fd617c7d2db1f - 19.27% (2.8 GB)

[#010] sha256:93e2721b7dddc8fb00723395d1865e71805c41b3d8f166c6753b2cb7e92b0da6 - 0.0% (87.4 KB)

[#011] sha256:ae9716fa7429dcb1b2b3722df89a54c812a531545360f4bb7fa92046236996d7 - 4.52% (671 MB)

[#012] sha256:567755953e44776028fc0e9105afe324a0bd078a023658e9ad6ce8bd5a9b2e4f - 0.0% (318 Bytes)

[#013] sha256:4f14ac1904e66c74ab5f148f40c3b40d27b7872dc4e06263ac929381be0f24e5 - 6.59% (979 MB)

[#014] sha256:223e6c538c307073b5a71396e1008fedb11a2ab858729b1a7015b3694e451d4e - 0.01% (1.43 MB)

[#015] sha256:8d22236cf9b23051cef2766cead99f0df6b094c0ab35ab94da1ce8982922c724 - 0.0% (187 Bytes)

[#016] sha256:71d8a089768be56166dc679adedc0ee016f55d38c8e59910f31fc0d17a4fce87 - 0.01% (846 KB)

[#017] sha256:e5bbc20bd6950002971e3566624141acefcd26657e63f6a037a5fdded325f419 - 2.42% (359 MB)

[#018] sha256:25c8470ce139fc2ce3bf88be52b30e00105170d13fddcc2e87181dedc9a4cbf1 - 0.0% (844 Bytes)

[#019] sha256:e4e20ac9a8cec98c77dd46105ca3026539494e77483902a9c2f975f9974e2a2c - 0.0% (235 Bytes)

[#020] sha256:4373b62912c958250376fa1353382d95f4b50c3960b5af47f6d73fcd0d5362d8 - 0.0% (99 Bytes)

[#021] sha256:6ee755294b60758028dcd078736976750055da26e41aa9f71f736e3f25036c4d - 1.3% (193 MB)

[#022] sha256:4b36db75e8f0d46adda55d3b2ffb35f09b965241aa6b4befc997d079f0164a1b - 0.0% (21.5 KB)

[#023] sha256:a61f3a0bebba481e35328e1ffa3999f2f8039ca333dc19b21e26e91b8b6f350b - 6.0% (891 MB)

[#024] sha256:2889c6a38ccb1727f8cea75e675312ed15f64ceaa584517a3738277da038f7b2 - 0.0% (1.23 KB)

[#025] sha256:4f4fb700ef54461cfa02571ae0db9a0dc1e0cdb5577484a6d75e68dc38e8acc1 - 0.0% (32 Bytes)

[#026] sha256:8766b44830ffbdc53712cff0e00b4459159d31b0fe9fd3050507b0f38058537d - 0.02% (2.54 MB)

[#027] sha256:10f9a8d34ad67afd8ffcf3e715053fccbf57fedb99db3047a1cd47a794502194 - 3.42% (508 MB)

[#028] sha256:3d31858a2b532959d25379702c15379174b00153e950b645ab6172050377a86a - 34.58% (5.02 GB)

[#029] sha256:ed5b3682993515ce803bd285900c82f0ccd9fbfdfb8d3e2c665e0bc5987bc72e - 0.94% (140 MB)

[#030] sha256:39addc71961278ea7d77b5e072201eec5ebf66d869dbbc3188165296e1032993 - 0.01% (1.2 MB)

[#031] sha256:56b6cbe015314989cd1ab4cd6a556e8f11a7e713ada5ebb8dcdd3f5f47c6388a - 0.16% (23.9 MB)

[#032] sha256:9ae52cefe47534d8c8583a5d9ce7bd42cccbb3fbddcbf73d486e84d349f4a117 - 1.9% (283 MB)

[#033] sha256:471ed8d2ee4fb280774b56436b0ba07ffc7635aef62804d5ffcbc4081d66968c - 4.99% (742 MB)

[#034] sha256:4f4fb700ef54461cfa02571ae0db9a0dc1e0cdb5577484a6d75e68dc38e8acc1 - 0.0% (32 Bytes)

[#035] sha256:4f4fb700ef54461cfa02571ae0db9a0dc1e0cdb5577484a6d75e68dc38e8acc1 - 0.0% (32 Bytes)

[#036] sha256:4f4fb700ef54461cfa02571ae0db9a0dc1e0cdb5577484a6d75e68dc38e8acc1 - 0.0% (32 Bytes)

[#037] sha256:4f4fb700ef54461cfa02571ae0db9a0dc1e0cdb5577484a6d75e68dc38e8acc1 - 0.0% (32 Bytes)

[#038] sha256:4f4fb700ef54461cfa02571ae0db9a0dc1e0cdb5577484a6d75e68dc38e8acc1 - 0.0% (32 Bytes)

[#039] sha256:4f4fb700ef54461cfa02571ae0db9a0dc1e0cdb5577484a6d75e68dc38e8acc1 - 0.0% (32 Bytes)

[#040] sha256:4f4fb700ef54461cfa02571ae0db9a0dc1e0cdb5577484a6d75e68dc38e8acc1 - 0.0% (32 Bytes)

[#041] sha256:60f46e6315ae99245a9be18325fdaa328a221d7ac5c6ff119e80b52caa7b5f9c - 0.0% (1.7 KB)

[#042] sha256:f859ed8eacc4fe5870873c3bf132fe98a436395cdbbfb104db38d84de2fc7287 - 0.0% (1.73 KB)

[#043] sha256:b4cd1d61facc63ec29fa8247cc7b87334e56d6f2458ca07b77fa348fcf6a49f5 - 0.0% (211 Bytes)

[#044] sha256:4f4fb700ef54461cfa02571ae0db9a0dc1e0cdb5577484a6d75e68dc38e8acc1 - 0.0% (32 Bytes)


History
2025-01-27 04:14:00 UTC

/bin/sh -c #(nop) ARG RELEASE

2025-01-27 04:14:00 UTC

/bin/sh -c #(nop) ARG LAUNCHPAD_BUILD_ARCH

2025-01-27 04:14:00 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.ref.name=ubuntu

2025-01-27 04:14:00 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.version=24.04

2025-01-27 04:14:03 UTC

/bin/sh -c #(nop) ADD file:6df775300d76441aa33f31b22c1afce8dfe35c8ffbc14ef27c27009235b12a95 in /

2025-01-27 04:14:03 UTC

/bin/sh -c #(nop) CMD ["/bin/bash"]

2025-03-10 22:19:07 UTC (buildkit.dockerfile.v0)

ENV NVARCH=x86_64

2025-03-10 22:19:07 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_REQUIRE_CUDA=cuda>=12.8 brand=unknown,driver>=470,driver<471 brand=grid,driver>=470,driver<471 brand=tesla,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=vapps,driver>=470,driver<471 brand=vpc,driver>=470,driver<471 brand=vcs,driver>=470,driver<471 brand=vws,driver>=470,driver<471 brand=cloudgaming,driver>=470,driver<471 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566

2025-03-10 22:19:07 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_CUDART_VERSION=12.8.90-1

2025-03-10 22:19:07 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2025-03-10 22:19:07 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

2025-03-10 22:19:07 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSL https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2404/${NVARCH}/3bf863cc.pub | apt-key add - && echo "deb https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2404/${NVARCH} /" > /etc/apt/sources.list.d/cuda.list && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit

2025-03-10 22:19:07 UTC (buildkit.dockerfile.v0)

ENV CUDA_VERSION=12.8.1

2025-03-10 22:19:21 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-8=${NV_CUDA_CUDART_VERSION} cuda-compat-12-8 && rm -rf /var/lib/apt/lists/* # buildkit

2025-03-10 22:19:21 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/cuda/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit

2025-03-10 22:19:21 UTC (buildkit.dockerfile.v0)

ENV PATH=/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

2025-03-10 22:19:21 UTC (buildkit.dockerfile.v0)

ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64

2025-03-10 22:19:21 UTC (buildkit.dockerfile.v0)

COPY NGC-DL-CONTAINER-LICENSE / # buildkit

2025-03-10 22:19:21 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_VISIBLE_DEVICES=all

2025-03-10 22:19:21 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_LIB_VERSION=12.8.1-1

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENV NV_NVTX_VERSION=12.8.90-1

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_VERSION=12.3.3.100-1

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_PACKAGE=libnpp-12-8=12.3.3.100-1

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUSPARSE_VERSION=12.5.8.93-1

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_PACKAGE_NAME=libcublas-12-8

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_VERSION=12.8.4.1-1

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_PACKAGE=libcublas-12-8=12.8.4.1-1

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_PACKAGE_NAME=libnccl2

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_PACKAGE_VERSION=2.25.1-1

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENV NCCL_VERSION=2.25.1-1

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_PACKAGE=libnccl2=2.25.1-1+cuda12.8

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-libraries-12-8=${NV_CUDA_LIB_VERSION} ${NV_LIBNPP_PACKAGE} cuda-nvtx-12-8=${NV_NVTX_VERSION} libcusparse-12-8=${NV_LIBCUSPARSE_VERSION} ${NV_LIBCUBLAS_PACKAGE} ${NV_LIBNCCL_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_PACKAGE_NAME} ${NV_LIBNCCL_PACKAGE_NAME} # buildkit

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

COPY entrypoint.d/ /opt/nvidia/entrypoint.d/ # buildkit

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

COPY nvidia_entrypoint.sh /opt/nvidia/ # buildkit

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_PRODUCT_NAME=CUDA

2025-03-10 22:30:18 UTC (buildkit.dockerfile.v0)

ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"]

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_LIB_VERSION=12.8.1-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_CUDART_DEV_VERSION=12.8.90-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_NVML_DEV_VERSION=12.8.90-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUSPARSE_DEV_VERSION=12.5.8.93-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_DEV_VERSION=12.3.3.100-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_DEV_PACKAGE=libnpp-dev-12-8=12.3.3.100-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_DEV_VERSION=12.8.4.1-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_DEV_PACKAGE_NAME=libcublas-dev-12-8

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_DEV_PACKAGE=libcublas-dev-12-8=12.8.4.1-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_NSIGHT_COMPUTE_VERSION=12.8.1-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE=cuda-nsight-compute-12-8=12.8.1-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_NVPROF_VERSION=12.8.90-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_NVPROF_DEV_PACKAGE=cuda-nvprof-12-8=12.8.90-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_DEV_PACKAGE_NAME=libnccl-dev

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_DEV_PACKAGE_VERSION=2.25.1-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NCCL_VERSION=2.25.1-1

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_DEV_PACKAGE=libnccl-dev=2.25.1-1+cuda12.8

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-dev-12-8=${NV_CUDA_CUDART_DEV_VERSION} cuda-command-line-tools-12-8=${NV_CUDA_LIB_VERSION} cuda-minimal-build-12-8=${NV_CUDA_LIB_VERSION} cuda-libraries-dev-12-8=${NV_CUDA_LIB_VERSION} cuda-nvml-dev-12-8=${NV_NVML_DEV_VERSION} ${NV_NVPROF_DEV_PACKAGE} ${NV_LIBNPP_DEV_PACKAGE} libcusparse-dev-12-8=${NV_LIBCUSPARSE_DEV_VERSION} ${NV_LIBCUBLAS_DEV_PACKAGE} ${NV_LIBNCCL_DEV_PACKAGE} ${NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_DEV_PACKAGE_NAME} ${NV_LIBNCCL_DEV_PACKAGE_NAME} # buildkit

2025-03-10 22:44:37 UTC (buildkit.dockerfile.v0)

ENV LIBRARY_PATH=/usr/local/cuda/lib64/stubs

2025-03-10 23:14:56 UTC (buildkit.dockerfile.v0)

ENV NV_CUDNN_VERSION=9.8.0.87-1

2025-03-10 23:14:56 UTC (buildkit.dockerfile.v0)

ENV NV_CUDNN_PACKAGE_NAME=libcudnn9-cuda-12

2025-03-10 23:14:56 UTC (buildkit.dockerfile.v0)

ENV NV_CUDNN_PACKAGE=libcudnn9-cuda-12=9.8.0.87-1

2025-03-10 23:14:56 UTC (buildkit.dockerfile.v0)

ENV NV_CUDNN_PACKAGE_DEV=libcudnn9-dev-cuda-12=9.8.0.87-1

2025-03-10 23:14:56 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2025-03-10 23:14:56 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

2025-03-10 23:14:56 UTC (buildkit.dockerfile.v0)

LABEL com.nvidia.cudnn.version=9.8.0.87-1

2025-03-10 23:14:56 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends ${NV_CUDNN_PACKAGE} ${NV_CUDNN_PACKAGE_DEV} && apt-mark hold ${NV_CUDNN_PACKAGE_NAME} && rm -rf /var/lib/apt/lists/* # buildkit

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH=amd64

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG GRACE_BLACKWELL=0

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG HOPPER_SBO=0

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG CPU_VARIANT=x86-intel-multi

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG BUILD_ALL_CPU_VARIANTS=1

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG HTTP_PROXY=http://127.0.0.1:7890

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG HTTPS_PROXY=http://127.0.0.1:7890

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG http_proxy=http://127.0.0.1:7890

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG https_proxy=http://127.0.0.1:7890

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ENV HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GIT_SSL_NO_VERIFY=1

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG BUILD_AND_DOWNLOAD_PARALLEL=8

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG SGL_KERNEL_VERSION=0.3.19

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG SGL_VERSION=0.5.6.post1

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG USE_LATEST_SGLANG=0

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG GDRCOPY_VERSION=2.5.1

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG UBUNTU_MIRROR=1

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG GITHUB_ARTIFACTORY=github.com

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG FLASHINFER_VERSION=0.5.3

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG KTRANSFORMERS_VERSION=0.4.2

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ARG FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ENV DEBIAN_FRONTEND=noninteractive CUDA_HOME=/usr/local/cuda GDRCOPY_HOME=/usr/src/gdrdrv-2.5.1/ FLASHINFER_VERSION=0.5.3

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

ENV PATH=/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/local/nvidia/bin LD_LIBRARY_PATH=/usr/local/cuda/lib64:/usr/local/nvidia/lib:/usr/local/nvidia/lib64

2026-03-05 07:47:25 UTC (buildkit.dockerfile.v0)

RUN |23 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl /bin/sh -c if [ -n "$UBUNTU_MIRROR" ]; then echo "deb https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ noble main restricted universe multiverse" > /etc/apt/sources.list && echo "deb https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ noble-updates main restricted universe multiverse" >> /etc/apt/sources.list && echo "deb https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ noble-backports main restricted universe multiverse" >> /etc/apt/sources.list && echo "deb http://security.ubuntu.com/ubuntu/ noble-security main restricted universe multiverse" >> /etc/apt/sources.list && rm -f /etc/apt/sources.list.d/ubuntu.sources; fi # buildkit

2026-03-05 07:48:43 UTC (buildkit.dockerfile.v0)

RUN |23 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl /bin/sh -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update && apt-get install -y --no-install-recommends --allow-change-held-packages tzdata ca-certificates software-properties-common netcat-openbsd kmod unzip openssh-server curl wget lsof locales build-essential cmake perl patchelf ccache git git-lfs libopenmpi-dev libnuma1 libnuma-dev numactl ffmpeg libibverbs-dev libibverbs1 libibumad3 librdmacm1 libnl-3-200 libnl-route-3-200 libnl-route-3-dev libnl-3-dev ibverbs-providers infiniband-diags perftest libgoogle-glog-dev libgtest-dev libjsoncpp-dev libunwind-dev libboost-all-dev libssl-dev libgrpc-dev libgrpc++-dev libprotobuf-dev protobuf-compiler protobuf-compiler-grpc pybind11-dev libhiredis-dev libcurl4-openssl-dev libczmq4 libczmq-dev libfabric-dev devscripts debhelper fakeroot dkms check libsubunit0 libsubunit-dev gdb ninja-build vim tmux htop zsh tree less rdma-core libnccl2 libnccl-dev && rm -rf /var/lib/apt/lists/* && apt-get clean # buildkit

2026-03-05 07:49:25 UTC (buildkit.dockerfile.v0)

RUN |23 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl /bin/sh -c mkdir -p /tmp/gdrcopy && cd /tmp && curl --retry 3 --retry-delay 2 -fsSL -o v${GDRCOPY_VERSION}.tar.gz https://${GITHUB_ARTIFACTORY}/NVIDIA/gdrcopy/archive/refs/tags/v${GDRCOPY_VERSION}.tar.gz && tar -xzf v${GDRCOPY_VERSION}.tar.gz && rm v${GDRCOPY_VERSION}.tar.gz && cd gdrcopy-${GDRCOPY_VERSION}/packages && CUDA=/usr/local/cuda ./build-deb-packages.sh && dpkg -i gdrdrv-dkms_*.deb libgdrapi_*.deb gdrcopy-tests_*.deb gdrcopy_*.deb && cd / && rm -rf /tmp/gdrcopy # buildkit

2026-03-05 07:49:25 UTC (buildkit.dockerfile.v0)

RUN |23 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl /bin/sh -c ln -sf /usr/lib/$(uname -m)-linux-gnu/libmlx5.so.1 /usr/lib/$(uname -m)-linux-gnu/libmlx5.so # buildkit

2026-03-05 07:49:26 UTC (buildkit.dockerfile.v0)

RUN |23 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl /bin/sh -c locale-gen en_US.UTF-8 # buildkit

2026-03-05 07:49:26 UTC (buildkit.dockerfile.v0)

ENV LANG=en_US.UTF-8 LANGUAGE=en_US:en LC_ALL=en_US.UTF-8

2026-03-05 07:49:42 UTC (buildkit.dockerfile.v0)

RUN |23 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl /bin/sh -c mkdir -p /opt/miniconda3 && wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh -O /opt/miniconda3/miniconda.sh && bash /opt/miniconda3/miniconda.sh -b -u -p /opt/miniconda3 && rm /opt/miniconda3/miniconda.sh # buildkit

2026-03-05 07:49:42 UTC (buildkit.dockerfile.v0)

ENV PATH=/opt/miniconda3/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/local/nvidia/bin

2026-03-05 07:49:52 UTC (buildkit.dockerfile.v0)

RUN |23 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl /bin/sh -c conda tos accept --override-channels --channel https://repo.anaconda.com/pkgs/main && conda tos accept --override-channels --channel https://repo.anaconda.com/pkgs/r # buildkit

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

RUN |23 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl /bin/sh -c conda config --add channels https://mirrors.tuna.tsinghua.edu.cn/anaconda/pkgs/main && conda config --add channels https://mirrors.tuna.tsinghua.edu.cn/anaconda/pkgs/free && conda config --set show_channel_urls yes && conda config --set ssl_verify false # buildkit

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG CUDA_VERSION=12.8.1

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG BUILD_AND_DOWNLOAD_PARALLEL

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG SGL_KERNEL_VERSION

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG SGL_VERSION

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG USE_LATEST_SGLANG

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG FLASHINFER_VERSION

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG GRACE_BLACKWELL

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG GRACE_BLACKWELL_DEEPEP_BRANCH

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG HOPPER_SBO

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG HOPPER_SBO_DEEPEP_COMMIT

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG DEEPEP_COMMIT

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG GITHUB_ARTIFACTORY=github.com

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG KTRANSFORMERS_VERSION

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG KTRANSFORMERS_WHEEL

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG FLASH_ATTN_WHEEL

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

ARG FUNCTIONALITY=infer

2026-03-05 07:49:54 UTC (buildkit.dockerfile.v0)

WORKDIR /workspace

2026-03-05 07:53:14 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c conda create -n serve python=3.12 -y && if [ "$FUNCTIONALITY" = "sft" ]; then conda create -n fine-tune python=3.12 -y; fi # buildkit

2026-03-05 07:53:15 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c /opt/miniconda3/envs/serve/bin/pip config set global.index-url https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple && if [ "$FUNCTIONALITY" = "sft" ]; then /opt/miniconda3/envs/fine-tune/bin/pip config set global.index-url https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple; fi # buildkit

2026-03-05 07:53:17 UTC (buildkit.dockerfile.v0)

COPY . /workspace/ktransformers # buildkit

2026-03-05 07:53:17 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c cd /workspace/ktransformers && git submodule update --init --recursive && ln -s /workspace/ktransformers/third_party/sglang /workspace/sglang && if [ "$FUNCTIONALITY" = "sft" ]; then git clone --depth 1 https://${GITHUB_ARTIFACTORY}/hiyouga/LLaMA-Factory.git /workspace/LLaMA-Factory; fi # buildkit

2026-03-05 07:53:17 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c if [ "$FUNCTIONALITY" = "sft" ]; then curl --retry 3 --retry-delay 2 -fsSL -o /workspace/${KTRANSFORMERS_WHEEL} https://${GITHUB_ARTIFACTORY}/kvcache-ai/ktransformers/releases/download/v${KTRANSFORMERS_VERSION}/${KTRANSFORMERS_WHEEL} && curl --retry 3 --retry-delay 2 -fsSL -o /workspace/${FLASH_ATTN_WHEEL} https://${GITHUB_ARTIFACTORY}/Dao-AILab/flash-attention/releases/download/v2.8.3/${FLASH_ATTN_WHEEL}; fi # buildkit

2026-03-05 07:53:19 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c /opt/miniconda3/envs/serve/bin/pip install --upgrade pip setuptools wheel html5lib six # buildkit

2026-03-05 07:53:27 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c case "$CUDA_VERSION" in 12.6.1) CUINDEX=126 ;; 12.8.1) CUINDEX=128 ;; 12.9.1) CUINDEX=129 ;; 13.0.1) CUINDEX=130 ;; *) echo "Unsupported CUDA version: $CUDA_VERSION" && exit 1 ;; esac && if [ "$CUDA_VERSION" = "12.6.1" ]; then /opt/miniconda3/envs/serve/bin/pip install https://${GITHUB_ARTIFACTORY}/sgl-project/whl/releases/download/v${SGL_KERNEL_VERSION}/sgl_kernel-${SGL_KERNEL_VERSION}+cu124-cp310-abi3-manylinux2014_$(uname -m).whl --force-reinstall --no-deps ; elif [ "$CUDA_VERSION" = "12.8.1" ] || [ "$CUDA_VERSION" = "12.9.1" ]; then /opt/miniconda3/envs/serve/bin/pip install sgl-kernel==${SGL_KERNEL_VERSION} ; elif [ "$CUDA_VERSION" = "13.0.1" ]; then /opt/miniconda3/envs/serve/bin/pip install https://github.com/sgl-project/whl/releases/download/v${SGL_KERNEL_VERSION}/sgl_kernel-${SGL_KERNEL_VERSION}+cu130-cp310-abi3-manylinux2014_$(uname -m).whl --force-reinstall --no-deps ; fi # buildkit

2026-03-05 07:59:22 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c case "$CUDA_VERSION" in 12.6.1) CUINDEX=126 ;; 12.8.1) CUINDEX=128 ;; 12.9.1) CUINDEX=129 ;; 13.0.1) CUINDEX=130 ;; esac && export SGLANG_KT_VERSION=$(python3 -c "exec(open('/workspace/ktransformers/version.py').read()); print(__version__)") && echo "Installing sglang-kt v${SGLANG_KT_VERSION}" && cd /workspace/sglang && /opt/miniconda3/envs/serve/bin/pip install -e "python[all]" --extra-index-url https://download.pytorch.org/whl/cu${CUINDEX} # buildkit

2026-03-05 08:03:16 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c FLASHINFER_CUBIN_DOWNLOAD_THREADS=${BUILD_AND_DOWNLOAD_PARALLEL} FLASHINFER_LOGGING_LEVEL=warning /opt/miniconda3/envs/serve/bin/python -m flashinfer --download-cubin # buildkit

2026-03-05 08:03:18 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c set -eux; if [ "$GRACE_BLACKWELL" = "1" ]; then git clone https://github.com/fzyzcjy/DeepEP.git /workspace/DeepEP && cd /workspace/DeepEP && git checkout ${GRACE_BLACKWELL_DEEPEP_BRANCH} && sed -i 's/#define NUM_CPU_TIMEOUT_SECS 100/#define NUM_CPU_TIMEOUT_SECS 1000/' csrc/kernels/configs.cuh; elif [ "$HOPPER_SBO" = "1" ]; then git clone https://github.com/deepseek-ai/DeepEP.git -b antgroup-opt /workspace/DeepEP && cd /workspace/DeepEP && git checkout ${HOPPER_SBO_DEEPEP_COMMIT} && sed -i 's/#define NUM_CPU_TIMEOUT_SECS 100/#define NUM_CPU_TIMEOUT_SECS 1000/' csrc/kernels/configs.cuh; else curl --retry 3 --retry-delay 2 -fsSL -o /tmp/${DEEPEP_COMMIT}.zip https://${GITHUB_ARTIFACTORY}/deepseek-ai/DeepEP/archive/${DEEPEP_COMMIT}.zip && unzip -q /tmp/${DEEPEP_COMMIT}.zip -d /tmp && rm /tmp/${DEEPEP_COMMIT}.zip && mv /tmp/DeepEP-${DEEPEP_COMMIT} /workspace/DeepEP && cd /workspace/DeepEP && sed -i 's/#define NUM_CPU_TIMEOUT_SECS 100/#define NUM_CPU_TIMEOUT_SECS 1000/' csrc/kernels/configs.cuh; fi # buildkit

2026-03-05 08:05:06 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c cd /workspace/DeepEP && case "$CUDA_VERSION" in 12.6.1) CHOSEN_TORCH_CUDA_ARCH_LIST='9.0' ;; 12.8.1) CHOSEN_TORCH_CUDA_ARCH_LIST='9.0;10.0' ;; 12.9.1|13.0.1) CHOSEN_TORCH_CUDA_ARCH_LIST='9.0;10.0;10.3' ;; *) echo "Unsupported CUDA version: $CUDA_VERSION" && exit 1 ;; esac && . /opt/miniconda3/etc/profile.d/conda.sh && conda activate serve && TORCH_CUDA_ARCH_LIST="${CHOSEN_TORCH_CUDA_ARCH_LIST}" MAX_JOBS=${BUILD_AND_DOWNLOAD_PARALLEL} pip install --no-build-isolation . # buildkit

2026-03-05 08:05:09 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c if [ "${CUDA_VERSION%%.*}" = "12" ]; then /opt/miniconda3/envs/serve/bin/pip install nvidia-nccl-cu12==2.28.3 --force-reinstall --no-deps ; elif [ "${CUDA_VERSION%%.*}" = "13" ]; then /opt/miniconda3/envs/serve/bin/pip install nvidia-nccl-cu13==2.28.3 --force-reinstall --no-deps ; fi # buildkit

2026-03-05 08:13:00 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c . /opt/miniconda3/etc/profile.d/conda.sh && conda activate serve && cd /workspace/ktransformers/kt-kernel && CPUINFER_BUILD_ALL_VARIANTS=1 ./install.sh build # buildkit

2026-03-05 08:13:00 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c if [ "$FUNCTIONALITY" = "sft" ]; then conda install -n fine-tune -y -c https://mirrors.tuna.tsinghua.edu.cn/anaconda/cloud/conda-forge libstdcxx-ng gcc_impl_linux-64 && conda install -n fine-tune -y -c nvidia/label/cuda-11.8.0 cuda-runtime; fi # buildkit

2026-03-05 08:13:00 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c if [ "$FUNCTIONALITY" = "sft" ]; then case "$CUDA_VERSION" in 12.6.1) CUINDEX=126 ;; 12.8.1) CUINDEX=128 ;; 12.9.1) CUINDEX=129 ;; 13.0.1) CUINDEX=130 ;; esac && /opt/miniconda3/envs/fine-tune/bin/pip install --upgrade pip setuptools wheel hatchling && /opt/miniconda3/envs/fine-tune/bin/pip install torch==2.8.0 torchvision torchaudio --extra-index-url https://download.pytorch.org/whl/cu${CUINDEX}; fi # buildkit

2026-03-05 08:13:00 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c if [ "$FUNCTIONALITY" = "sft" ]; then cd /workspace/LLaMA-Factory && /opt/miniconda3/envs/fine-tune/bin/pip install -e ".[torch,metrics]" --no-build-isolation; fi # buildkit

2026-03-05 08:13:00 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c if [ "$FUNCTIONALITY" = "sft" ]; then /opt/miniconda3/envs/fine-tune/bin/pip install /workspace/${KTRANSFORMERS_WHEEL}; fi # buildkit

2026-03-05 08:13:00 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c if [ "$FUNCTIONALITY" = "sft" ]; then /opt/miniconda3/envs/fine-tune/bin/pip install /workspace/${FLASH_ATTN_WHEEL}; fi # buildkit

2026-03-05 08:13:00 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c if [ "$FUNCTIONALITY" = "sft" ]; then if [ "${CUDA_VERSION%%.*}" = "12" ]; then /opt/miniconda3/envs/fine-tune/bin/pip install nvidia-nccl-cu12==2.28.3 --force-reinstall --no-deps ; elif [ "${CUDA_VERSION%%.*}" = "13" ]; then /opt/miniconda3/envs/fine-tune/bin/pip install nvidia-nccl-cu13==2.28.3 --force-reinstall --no-deps ; fi; fi # buildkit

2026-03-05 08:13:00 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c if [ "$FUNCTIONALITY" = "sft" ]; then rm -f /workspace/${KTRANSFORMERS_WHEEL} /workspace/${FLASH_ATTN_WHEEL}; fi # buildkit

2026-03-05 08:13:01 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c /opt/miniconda3/bin/conda init bash # buildkit

2026-03-05 08:13:01 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c echo '\n# Conda environment aliases\nalias serve="conda activate serve"' >> /root/.bashrc && if [ "$FUNCTIONALITY" = "sft" ]; then echo 'alias finetune="conda activate fine-tune"' >> /root/.bashrc; fi # buildkit

2026-03-05 08:13:01 UTC (buildkit.dockerfile.v0)

RUN |25 TARGETARCH=amd64 GRACE_BLACKWELL=0 HOPPER_SBO=0 CPU_VARIANT=x86-intel-multi BUILD_ALL_CPU_VARIANTS=1 HTTP_PROXY=http://127.0.0.1:7890 HTTPS_PROXY=http://127.0.0.1:7890 http_proxy=http://127.0.0.1:7890 https_proxy=http://127.0.0.1:7890 GRACE_BLACKWELL_DEEPEP_BRANCH=gb200_blog_part_2 HOPPER_SBO_DEEPEP_COMMIT=9f2fc4b3182a51044ae7ecb6610f7c9c3258c4d6 DEEPEP_COMMIT=9af0e0d0e74f3577af1979c9b9e1ac2cad0104ee BUILD_AND_DOWNLOAD_PARALLEL=8 SGL_KERNEL_VERSION=0.3.19 SGL_VERSION=0.5.6.post1 USE_LATEST_SGLANG=0 GDRCOPY_VERSION=2.5.1 UBUNTU_MIRROR=1 GITHUB_ARTIFACTORY=github.com FLASHINFER_VERSION=0.5.3 KTRANSFORMERS_VERSION=0.4.2 KTRANSFORMERS_WHEEL=ktransformers-0.4.2+cu128torch28fancy-cp312-cp312-linux_x86_64.whl FLASH_ATTN_WHEEL=flash_attn-2.8.3+cu12torch2.8cxx11abiTRUE-cp312-cp312-linux_x86_64.whl CUDA_VERSION=12.8.1 FUNCTIONALITY=infer /bin/sh -c set -x && cd /workspace/ktransformers && KTRANSFORMERS_VERSION=$(python3 -c "exec(open('version.py').read()); print(__version__)" 2>/dev/null || echo "unknown") && echo "KTRANSFORMERS_VERSION=$KTRANSFORMERS_VERSION" > /workspace/versions.env && echo "Extracted KTransformers version: $KTRANSFORMERS_VERSION" && echo "SGLANG_KT_VERSION=$KTRANSFORMERS_VERSION" >> /workspace/versions.env && echo "sglang-kt version (aligned): $KTRANSFORMERS_VERSION" && if [ "$FUNCTIONALITY" = "sft" ]; then . /opt/miniconda3/etc/profile.d/conda.sh && conda activate fine-tune && cd /workspace/LLaMA-Factory && LLAMAFACTORY_VERSION=$(python -c "import sys; sys.path.insert(0, 'src'); from llamafactory import __version__; print(__version__)" 2>/dev/null || echo "unknown") && echo "LLAMAFACTORY_VERSION=$LLAMAFACTORY_VERSION" >> /workspace/versions.env && echo "Extracted LLaMA-Factory version: $LLAMAFACTORY_VERSION"; else echo "LLAMAFACTORY_VERSION=none" >> /workspace/versions.env && echo "LLaMA-Factory not installed (infer mode)"; fi && echo "=== Version Summary ===" && cat /workspace/versions.env # buildkit

2026-03-05 08:13:01 UTC (buildkit.dockerfile.v0)

WORKDIR /workspace

2026-03-05 08:13:01 UTC (buildkit.dockerfile.v0)

CMD ["/bin/bash"]

Danger Zone
Delete Tag

Please be careful as this will not just delete the reference but also the actual content!

For example when you have latest and v1.2.3 both pointing to the same image
the deletion of latest will also permanently remove v1.2.3.

Delete