Namespace
xprobe
Image / Tag
xinference:v1.10.0-cu128
Content Digest
sha256:8e9780fa21c1b8e0a150493b48cd904fb824205418d5d7d19836a3df81f1ad96
Details
Created

2025-09-13 16:52:47 UTC

Size

13.4 GB

Content Digest
Labels
  • maintainer
    NVIDIA CORPORATION <[email protected]>
  • org.opencontainers.image.ref.name
    ubuntu
  • org.opencontainers.image.version
    22.04

Environment
CUDA_VERSION

12.8.1

DEBIAN_FRONTEND

noninteractive

LD_LIBRARY_PATH

/usr/local/cuda/lib64:/usr/local/lib/python3.10/dist-packages/nvidia/cublas/lib:LD_LIBRARY_PATH=/usr/local/lib/python3.12/dist-packages/torch/lib:/usr/local/cuda/lib64

LIBRARY_PATH

/usr/local/cuda/lib64/stubs

NCCL_VERSION

2.25.1-1

NODE_VERSION

14.21.1

NVARCH

x86_64

NVIDIA_DRIVER_CAPABILITIES

compute,utility

NVIDIA_PRODUCT_NAME

CUDA

NVIDIA_REQUIRE_CUDA

cuda>=12.8 brand=unknown,driver>=470,driver<471 brand=grid,driver>=470,driver<471 brand=tesla,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=vapps,driver>=470,driver<471 brand=vpc,driver>=470,driver<471 brand=vcs,driver>=470,driver<471 brand=vws,driver>=470,driver<471 brand=cloudgaming,driver>=470,driver<471 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 
brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566

NVIDIA_VISIBLE_DEVICES

all

NVM_DIR

/usr/local/nvm

NV_CUDA_CUDART_DEV_VERSION

12.8.90-1

NV_CUDA_CUDART_VERSION

12.8.90-1

NV_CUDA_LIB_VERSION

12.8.1-1

NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE

cuda-nsight-compute-12-8=12.8.1-1

NV_CUDA_NSIGHT_COMPUTE_VERSION

12.8.1-1

NV_LIBCUBLAS_DEV_PACKAGE

libcublas-dev-12-8=12.8.4.1-1

NV_LIBCUBLAS_DEV_PACKAGE_NAME

libcublas-dev-12-8

NV_LIBCUBLAS_DEV_VERSION

12.8.4.1-1

NV_LIBCUBLAS_PACKAGE

libcublas-12-8=12.8.4.1-1

NV_LIBCUBLAS_PACKAGE_NAME

libcublas-12-8

NV_LIBCUBLAS_VERSION

12.8.4.1-1

NV_LIBCUSPARSE_DEV_VERSION

12.5.8.93-1

NV_LIBCUSPARSE_VERSION

12.5.8.93-1

NV_LIBNCCL_DEV_PACKAGE

libnccl-dev=2.25.1-1+cuda12.8

NV_LIBNCCL_DEV_PACKAGE_NAME

libnccl-dev

NV_LIBNCCL_DEV_PACKAGE_VERSION

2.25.1-1

NV_LIBNCCL_PACKAGE

libnccl2=2.25.1-1+cuda12.8

NV_LIBNCCL_PACKAGE_NAME

libnccl2

NV_LIBNCCL_PACKAGE_VERSION

2.25.1-1

NV_LIBNPP_DEV_PACKAGE

libnpp-dev-12-8=12.3.3.100-1

NV_LIBNPP_DEV_VERSION

12.3.3.100-1

NV_LIBNPP_PACKAGE

libnpp-12-8=12.3.3.100-1

NV_LIBNPP_VERSION

12.3.3.100-1

NV_NVML_DEV_VERSION

12.8.90-1

NV_NVPROF_DEV_PACKAGE

cuda-nvprof-12-8=12.8.90-1

NV_NVPROF_VERSION

12.8.90-1

NV_NVTX_VERSION

12.8.90-1

PATH

/usr/local/nvm/versions/node/v14.21.1/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

UV_HTTP_TIMEOUT

500

UV_INDEX_STRATEGY

unsafe-best-match

VLLM_USAGE_SOURCE

production-docker-image


Layers

[#000] sha256:8f84a9f2102e97a4a6bf673b150fc9894df5acc9618ad3484c6c36f768c1caa0 - 0.21% (29 MB)

[#001] sha256:b95112eaf2836b9c7193858419f6d17933a873c4a2c9227dc497f5e090ea9c87 - 0.03% (4.42 MB)

[#002] sha256:030ef82509363afebdc78482e6f8c07f2bc8b65a45caf082c2a9a621c7deae63 - 0.45% (61.3 MB)

[#003] sha256:72ac9ccfda38d144ef8e3aadbd5851e7fa9aacd261f8e15d7365db0f816d3433 - 0.0% (186 Bytes)

[#004] sha256:73389fbd088f5ed5d9fd258baced59de092978b4f483920ea6d074522a105119 - 0.0% (6.72 KB)

[#005] sha256:0264850675f7464ed6385d030d281ffb0f2037323c73511a5372948c1c69d92c - 14.26% (1.92 GB)

[#006] sha256:de1d03310308c2871217cf179589d5e7fcd8eee31d8f331b61041347f50404a0 - 0.0% (62.6 KB)

[#007] sha256:c1d2af7fad0f1c6cdaf09c568c086019e834bc6523c30aa9b2b0b24c4b782086 - 0.0% (1.64 KB)

[#008] sha256:5601308b3ac642f7df8b1dc62b9582abdd34857eec6190bcb50162abc5719226 - 0.0% (1.49 KB)

[#009] sha256:6b2035e8b73ed2b018995a7b2c8d607d5527daf948d41964f02cc3ce7ed0699a - 20.72% (2.78 GB)

[#010] sha256:ed71f8f81b33b96e7112757f6828a6dcb0861026aa63c5edc672d13e11045f6d - 0.0% (86.8 KB)

[#011] sha256:b1b6c1775c16e4e139f8ae775b194fe6a7076d94d952617f0cc078afa7e8c7bc - 0.0% (101 Bytes)

[#012] sha256:d373511744fdd8468b3db0459b36dafe58eb8be32638345084257a96a5e23e94 - 0.0% (229 Bytes)

[#013] sha256:3ebe67c1e0e2fd724bbabecb625ab6d28e8aba65fa92a2b39df3aba15c6656d6 - 2.3% (317 MB)

[#014] sha256:f91d7b42c5687bd6f8ac52b05214bf7b18de3c238c0c7bdb18bbb36ac0413d0f - 0.26% (35.9 MB)

[#015] sha256:fe325e27a56b10798d7baf0ebfa2d14ffebefdefc72e7a337e6560063af89d90 - 0.0% (12.8 KB)

[#016] sha256:28b1cbbf594386efb1e443045c03993c978f10b001f64a502bb67c35cb84e297 - 0.0% (120 Bytes)

[#017] sha256:45d2059167a18c99f6a2a60261df52993c4681dcc21a8dffce1d5a59ad14c341 - 33.07% (4.44 GB)

[#018] sha256:2fbac78b2be33f25544af88840807a8206f6cfc3205eaf3905f15ae0d6f63ed9 - 1.69% (232 MB)

[#019] sha256:6b88d7f7355b89825f087fafd0a1798cc45d32d383338cb8985045a33fccd442 - 0.0% (141 KB)

[#020] sha256:5f14061764b91068fadf6ae42740f0843437f9677419384a412e4acc3471965e - 0.0% (123 KB)

[#021] sha256:bf1312cdb91e9bacb75c734c3c91a8fe850f27ce744d69a5156eae216c4651f2 - 0.0% (8.21 KB)

[#022] sha256:298126e72930877a725fc2ada3fcb5449214771299549d1a83d597b9a869078d - 0.0% (123 Bytes)

[#023] sha256:fe58789a3a0c6498b46a4b8772221f38684717cb302aa3bf2cda5eb7bb942e18 - 0.0% (295 Bytes)

[#024] sha256:16540d6bc6b0bd43914cf52c824fba8affebfce2e49d36eedc4f64a7bd3ccaf3 - 0.19% (26 MB)

[#025] sha256:1cc57b2272cb8f7571d72770802f6ebc8dcb375c5a0555c95f78321b979df131 - 0.0% (188 Bytes)

[#026] sha256:a2afa617fa03a4fe3e5b22cc6d4280d8afc6f398c96ddee859c33bf9fe3e48d1 - 0.81% (111 MB)

[#027] sha256:2fc83748213a2b4402cd1e9d49010a2f9545cf0e2893fccd52e0492c766323d4 - 0.87% (119 MB)

[#028] sha256:6e8b128b0fb34a1f0a58033be491ab56fd372009047ed4a33dcdd34ed3706036 - 1.13% (155 MB)

[#029] sha256:ce3e9606e7337d27ddb028ddb454d5c2cb9754ba5c0332c303000a6e661f0c51 - 22.01% (2.96 GB)

[#030] sha256:dbb8df7c2fd20684a2d7dd87a28d5d2b647f2c96e2a8f8355eaaefc01eb53d3c - 0.88% (121 MB)

[#031] sha256:35aeb2c58b90732902e9a635d29cac5f090a914c7ab23fe76e2946e0fa0b26cf - 1.13% (156 MB)

[#032] sha256:09accec5a5fc1552c1dea50755eaba605ec4dfe5156c9ecaea297570ec75b9d1 - 0.0% (92 Bytes)


History
2025-01-26 05:31:07 UTC

/bin/sh -c #(nop) ARG RELEASE

2025-01-26 05:31:07 UTC

/bin/sh -c #(nop) ARG LAUNCHPAD_BUILD_ARCH

2025-01-26 05:31:07 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.ref.name=ubuntu

2025-01-26 05:31:07 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.version=22.04

2025-01-26 05:31:10 UTC

/bin/sh -c #(nop) ADD file:1b6c8c9518be42fa2afe5e241ca31677fce58d27cdfa88baa91a65a259be3637 in /

2025-01-26 05:31:11 UTC

/bin/sh -c #(nop) CMD ["/bin/bash"]

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

ENV NVARCH=x86_64

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_REQUIRE_CUDA=cuda>=12.8 brand=unknown,driver>=470,driver<471 brand=grid,driver>=470,driver<471 brand=tesla,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=vapps,driver>=470,driver<471 brand=vpc,driver>=470,driver<471 brand=vcs,driver>=470,driver<471 brand=vws,driver>=470,driver<471 brand=cloudgaming,driver>=470,driver<471 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 
brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_CUDART_VERSION=12.8.90-1

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <[email protected]>

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.1-1_all.deb && dpkg -i cuda-keyring_1.1-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

ENV CUDA_VERSION=12.8.1

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-8=${NV_CUDA_CUDART_VERSION} cuda-compat-12-8 && rm -rf /var/lib/apt/lists/* # buildkit

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/cuda/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

ENV PATH=/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

COPY NGC-DL-CONTAINER-LICENSE / # buildkit

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_VISIBLE_DEVICES=all

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_LIB_VERSION=12.8.1-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_NVTX_VERSION=12.8.90-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_VERSION=12.3.3.100-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_PACKAGE=libnpp-12-8=12.3.3.100-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUSPARSE_VERSION=12.5.8.93-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_PACKAGE_NAME=libcublas-12-8

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_VERSION=12.8.4.1-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_PACKAGE=libcublas-12-8=12.8.4.1-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_PACKAGE_NAME=libnccl2

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_PACKAGE_VERSION=2.25.1-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NCCL_VERSION=2.25.1-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_PACKAGE=libnccl2=2.25.1-1+cuda12.8

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <[email protected]>

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-libraries-12-8=${NV_CUDA_LIB_VERSION} ${NV_LIBNPP_PACKAGE} cuda-nvtx-12-8=${NV_NVTX_VERSION} libcusparse-12-8=${NV_LIBCUSPARSE_VERSION} ${NV_LIBCUBLAS_PACKAGE} ${NV_LIBNCCL_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_PACKAGE_NAME} ${NV_LIBNCCL_PACKAGE_NAME} # buildkit

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

COPY entrypoint.d/ /opt/nvidia/entrypoint.d/ # buildkit

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

COPY nvidia_entrypoint.sh /opt/nvidia/ # buildkit

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_PRODUCT_NAME=CUDA

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"]

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_LIB_VERSION=12.8.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_CUDART_DEV_VERSION=12.8.90-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_NVML_DEV_VERSION=12.8.90-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUSPARSE_DEV_VERSION=12.5.8.93-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_DEV_VERSION=12.3.3.100-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_DEV_PACKAGE=libnpp-dev-12-8=12.3.3.100-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_DEV_VERSION=12.8.4.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_DEV_PACKAGE_NAME=libcublas-dev-12-8

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_DEV_PACKAGE=libcublas-dev-12-8=12.8.4.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_NSIGHT_COMPUTE_VERSION=12.8.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE=cuda-nsight-compute-12-8=12.8.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_NVPROF_VERSION=12.8.90-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_NVPROF_DEV_PACKAGE=cuda-nvprof-12-8=12.8.90-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_DEV_PACKAGE_NAME=libnccl-dev

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_DEV_PACKAGE_VERSION=2.25.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NCCL_VERSION=2.25.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_DEV_PACKAGE=libnccl-dev=2.25.1-1+cuda12.8

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <[email protected]>

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-dev-12-8=${NV_CUDA_CUDART_DEV_VERSION} cuda-command-line-tools-12-8=${NV_CUDA_LIB_VERSION} cuda-minimal-build-12-8=${NV_CUDA_LIB_VERSION} cuda-libraries-dev-12-8=${NV_CUDA_LIB_VERSION} cuda-nvml-dev-12-8=${NV_NVML_DEV_VERSION} ${NV_NVPROF_DEV_PACKAGE} ${NV_LIBNPP_DEV_PACKAGE} libcusparse-dev-12-8=${NV_LIBCUSPARSE_DEV_VERSION} ${NV_LIBCUBLAS_DEV_PACKAGE} ${NV_LIBNCCL_DEV_PACKAGE} ${NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_DEV_PACKAGE_NAME} ${NV_LIBNCCL_DEV_PACKAGE_NAME} # buildkit

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV LIBRARY_PATH=/usr/local/cuda/lib64/stubs

2025-07-07 18:13:28 UTC (buildkit.dockerfile.v0)

ARG CUDA_VERSION

2025-07-07 18:13:28 UTC (buildkit.dockerfile.v0)

ARG PYTHON_VERSION

2025-07-07 18:13:28 UTC (buildkit.dockerfile.v0)

ARG INSTALL_KV_CONNECTORS=false

2025-07-07 18:13:28 UTC (buildkit.dockerfile.v0)

WORKDIR /vllm-workspace

2025-07-07 18:13:28 UTC (buildkit.dockerfile.v0)

ENV DEBIAN_FRONTEND=noninteractive

2025-07-07 18:13:28 UTC (buildkit.dockerfile.v0)

ARG TARGETPLATFORM

2025-07-07 18:13:28 UTC (buildkit.dockerfile.v0)

SHELL [/bin/bash -c]

2025-07-07 18:13:28 UTC (buildkit.dockerfile.v0)

ARG DEADSNAKES_MIRROR_URL

2025-07-07 18:13:28 UTC (buildkit.dockerfile.v0)

ARG DEADSNAKES_GPGKEY_URL

2025-07-07 18:13:28 UTC (buildkit.dockerfile.v0)

ARG GET_PIP_URL

2025-07-07 18:13:31 UTC (buildkit.dockerfile.v0)

RUN |7 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/bash -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit

2025-07-07 18:15:39 UTC (buildkit.dockerfile.v0)

RUN |7 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py /bin/bash -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y ccache software-properties-common git curl wget sudo vim python3-pip && apt-get install -y ffmpeg libsm6 libxext6 libgl1 && if [ ! -z ${DEADSNAKES_MIRROR_URL} ] ; then if [ ! -z "${DEADSNAKES_GPGKEY_URL}" ] ; then mkdir -p -m 0755 /etc/apt/keyrings ; curl -L ${DEADSNAKES_GPGKEY_URL} | gpg --dearmor > /etc/apt/keyrings/deadsnakes.gpg ; sudo chmod 644 /etc/apt/keyrings/deadsnakes.gpg ; echo "deb [signed-by=/etc/apt/keyrings/deadsnakes.gpg] ${DEADSNAKES_MIRROR_URL} $(lsb_release -cs) main" > /etc/apt/sources.list.d/deadsnakes.list ; fi ; else for i in 1 2 3; do add-apt-repository -y ppa:deadsnakes/ppa && break || { echo "Attempt $i failed, retrying in 5s..."; sleep 5; }; done ; fi && apt-get update -y && apt-get install -y python${PYTHON_VERSION} python${PYTHON_VERSION}-dev python${PYTHON_VERSION}-venv libibverbs-dev && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PYTHON_VERSION} 1 && update-alternatives --set python3 /usr/bin/python${PYTHON_VERSION} && ln -sf /usr/bin/python${PYTHON_VERSION}-config /usr/bin/python3-config && curl -sS ${GET_PIP_URL} | python${PYTHON_VERSION} && python3 --version && python3 -m pip --version # buildkit

2025-07-07 18:15:39 UTC (buildkit.dockerfile.v0)

ARG PIP_INDEX_URL UV_INDEX_URL

2025-07-07 18:15:39 UTC (buildkit.dockerfile.v0)

ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL

2025-07-07 18:15:39 UTC (buildkit.dockerfile.v0)

ARG PYTORCH_CUDA_INDEX_BASE_URL

2025-07-07 18:15:39 UTC (buildkit.dockerfile.v0)

ARG PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL

2025-07-07 18:15:39 UTC (buildkit.dockerfile.v0)

ARG PIP_KEYRING_PROVIDER UV_KEYRING_PROVIDER

2025-07-07 18:17:05 UTC (buildkit.dockerfile.v0)

RUN |15 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c python3 -m pip install uv # buildkit

2025-07-07 18:17:05 UTC (buildkit.dockerfile.v0)

ENV UV_HTTP_TIMEOUT=500

2025-07-07 18:17:05 UTC (buildkit.dockerfile.v0)

ENV UV_INDEX_STRATEGY=unsafe-best-match

2025-07-07 18:17:06 UTC (buildkit.dockerfile.v0)

RUN |15 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit

2025-07-07 18:17:07 UTC (buildkit.dockerfile.v0)

RUN |15 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c if [ "$TARGETPLATFORM" = "linux/arm64" ]; then uv pip install --system --index-url ${PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') "torch==2.8.0.dev20250318+cu128" "torchvision==0.22.0.dev20250319" ; uv pip install --system --index-url ${PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') --pre pytorch_triton==3.3.0+gitab727c40 ; fi # buildkit

2025-07-07 18:38:05 UTC (buildkit.dockerfile.v0)

RUN |15 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled /bin/bash -c uv pip install --system dist/*.whl --verbose --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit

2025-07-07 18:38:05 UTC (buildkit.dockerfile.v0)

ARG FLASHINFER_CUDA128_INDEX_URL=https://download.pytorch.org/whl/cu128/flashinfer

2025-07-07 18:38:05 UTC (buildkit.dockerfile.v0)

ARG FLASHINFER_CUDA128_WHEEL=flashinfer_python-0.2.6.post1%2Bcu128torch2.7-cp39-abi3-linux_x86_64.whl

2025-07-07 18:38:05 UTC (buildkit.dockerfile.v0)

ARG FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git

2025-07-07 18:38:05 UTC (buildkit.dockerfile.v0)

ARG FLASHINFER_GIT_REF=v0.2.6.post1

2025-07-07 18:38:22 UTC (buildkit.dockerfile.v0)

RUN |19 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_CUDA128_INDEX_URL=https://download.pytorch.org/whl/cu128/flashinfer FLASHINFER_CUDA128_WHEEL=flashinfer_python-0.2.6.post1%2Bcu128torch2.7-cp39-abi3-linux_x86_64.whl FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.2.6.post1 /bin/bash -c bash - <<'BASH' . /etc/environment if [ "$TARGETPLATFORM" != "linux/arm64" ]; then # FlashInfer already has a wheel for PyTorch 2.7.0 and CUDA 12.8. This is enough for CI use if [[ "$CUDA_VERSION" == 12.8* ]]; then uv pip install --system ${FLASHINFER_CUDA128_INDEX_URL}/${FLASHINFER_CUDA128_WHEEL} else export TORCH_CUDA_ARCH_LIST='7.5 8.0 8.9 9.0a 10.0a 12.0' git clone ${FLASHINFER_GIT_REPO} --single-branch --branch ${FLASHINFER_GIT_REF} --recursive # Needed to build AOT kernels (cd flashinfer && \ python3 -m flashinfer.aot && \ uv pip install --system --no-build-isolation . \ ) rm -rf flashinfer # Default arches (skipping 10.0a and 12.0 since these need 12.8) # TODO: Update this to allow setting TORCH_CUDA_ARCH_LIST as a build arg. TORCH_CUDA_ARCH_LIST="7.5 8.0 8.9 9.0a" if [[ "${CUDA_VERSION}" == 11.* ]]; then TORCH_CUDA_ARCH_LIST="7.5 8.0 8.9" fi echo "🏗️ Building FlashInfer for arches: ${TORCH_CUDA_ARCH_LIST}" git clone --depth 1 --recursive --shallow-submodules \ --branch v0.2.6.post1 \ https://github.com/flashinfer-ai/flashinfer.git flashinfer pushd flashinfer python3 -m flashinfer.aot TORCH_CUDA_ARCH_LIST="${TORCH_CUDA_ARCH_LIST}" \ uv pip install --system --no-build-isolation . 
popd rm -rf flashinfer fi \ fi BASH # buildkit

2025-07-07 18:38:22 UTC (buildkit.dockerfile.v0)

COPY examples examples # buildkit

2025-07-07 18:38:22 UTC (buildkit.dockerfile.v0)

COPY benchmarks benchmarks # buildkit

2025-07-07 18:38:22 UTC (buildkit.dockerfile.v0)

COPY ./vllm/collect_env.py . # buildkit

2025-07-07 18:38:22 UTC (buildkit.dockerfile.v0)

RUN |19 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_CUDA128_INDEX_URL=https://download.pytorch.org/whl/cu128/flashinfer FLASHINFER_CUDA128_WHEEL=flashinfer_python-0.2.6.post1%2Bcu128torch2.7-cp39-abi3-linux_x86_64.whl FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.2.6.post1 /bin/bash -c . /etc/environment && uv pip list # buildkit

2025-07-07 18:38:22 UTC (buildkit.dockerfile.v0)

COPY requirements/build.txt requirements/build.txt # buildkit

2025-07-07 18:38:24 UTC (buildkit.dockerfile.v0)

RUN |19 CUDA_VERSION=12.8.1 PYTHON_VERSION=3.12 INSTALL_KV_CONNECTORS=true TARGETPLATFORM=linux/amd64 DEADSNAKES_MIRROR_URL= DEADSNAKES_GPGKEY_URL= GET_PIP_URL=https://bootstrap.pypa.io/get-pip.py PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly PIP_KEYRING_PROVIDER=disabled UV_KEYRING_PROVIDER=disabled FLASHINFER_CUDA128_INDEX_URL=https://download.pytorch.org/whl/cu128/flashinfer FLASHINFER_CUDA128_WHEEL=flashinfer_python-0.2.6.post1%2Bcu128torch2.7-cp39-abi3-linux_x86_64.whl FLASHINFER_GIT_REPO=https://github.com/flashinfer-ai/flashinfer.git FLASHINFER_GIT_REF=v0.2.6.post1 /bin/bash -c uv pip install --system -r requirements/build.txt --extra-index-url ${PYTORCH_CUDA_INDEX_BASE_URL}/cu$(echo $CUDA_VERSION | cut -d. -f1,2 | tr -d '.') # buildkit

2025-07-07 18:38:24 UTC (buildkit.dockerfile.v0)

ARG TARGETPLATFORM

2025-07-07 18:38:24 UTC (buildkit.dockerfile.v0)

ARG INSTALL_KV_CONNECTORS=false

2025-07-07 18:38:24 UTC (buildkit.dockerfile.v0)

ARG PIP_INDEX_URL UV_INDEX_URL

2025-07-07 18:38:24 UTC (buildkit.dockerfile.v0)

ARG PIP_EXTRA_INDEX_URL UV_EXTRA_INDEX_URL

2025-07-07 18:38:24 UTC (buildkit.dockerfile.v0)

ENV UV_HTTP_TIMEOUT=500

2025-07-07 18:38:24 UTC (buildkit.dockerfile.v0)

COPY requirements/kv_connectors.txt requirements/kv_connectors.txt # buildkit

2025-07-07 18:38:32 UTC (buildkit.dockerfile.v0)

RUN |6 TARGETPLATFORM=linux/amd64 INSTALL_KV_CONNECTORS=true PIP_INDEX_URL= UV_INDEX_URL= PIP_EXTRA_INDEX_URL= UV_EXTRA_INDEX_URL= /bin/bash -c if [ "$INSTALL_KV_CONNECTORS" = "true" ]; then uv pip install --system -r requirements/kv_connectors.txt; fi; if [ "$TARGETPLATFORM" = "linux/arm64" ]; then uv pip install --system accelerate hf_transfer 'modelscope!=1.15.0' 'bitsandbytes>=0.42.0' 'timm==0.9.10' boto3 runai-model-streamer runai-model-streamer[s3]; else uv pip install --system accelerate hf_transfer 'modelscope!=1.15.0' 'bitsandbytes>=0.46.1' 'timm==0.9.10' boto3 runai-model-streamer runai-model-streamer[s3]; fi # buildkit

2025-07-07 18:38:32 UTC (buildkit.dockerfile.v0)

ENV VLLM_USAGE_SOURCE=production-docker-image

2025-07-07 18:38:32 UTC (buildkit.dockerfile.v0)

ENTRYPOINT ["python3" "-m" "vllm.entrypoints.openai.api_server"]

2025-09-13 16:30:16 UTC

/bin/bash -c #(nop) COPY dir:b36b404b38979e6d35aed3f0c4ce9ecccd27d8568b4ea3e5a859331f23b82e49 in /opt/inference

2025-09-13 16:30:20 UTC

/bin/bash -c #(nop) WORKDIR /opt/inference

2025-09-13 16:30:20 UTC

/bin/bash -c #(nop) ENV NVM_DIR=/usr/local/nvm

2025-09-13 16:30:20 UTC

/bin/bash -c #(nop) ENV NODE_VERSION=14.21.1

2025-09-13 16:31:04 UTC

/bin/bash -c apt-get -y update && apt install -y wget curl procps git libgl1 libfst-dev cmake libssl-dev && printf "\ndeb https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ jammy main restricted universe multiverse" >> /etc/apt/sources.list && apt-get -y update && apt-get install -y --only-upgrade libstdc++6 && apt install -y libc6 && mkdir -p $NVM_DIR && curl -o- https://raw.githubusercontent.com/nvm-sh/nvm/v0.39.7/install.sh | bash && . $NVM_DIR/nvm.sh && nvm install $NODE_VERSION && nvm alias default $NODE_VERSION && nvm use default && apt-get -yq clean

2025-09-13 16:31:07 UTC

/bin/bash -c #(nop) ENV PATH=/usr/local/nvm/versions/node/v14.21.1/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

2025-09-13 16:31:07 UTC

/bin/bash -c #(nop) ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64:/usr/local/lib/python3.10/dist-packages/nvidia/cublas/lib:LD_LIBRARY_PATH=/usr/local/lib/python3.12/dist-packages/torch/lib:/usr/local/cuda/lib64

2025-09-13 16:31:07 UTC

/bin/bash -c #(nop) ARG LLAMA_CPP_USE_CUDA=true

2025-09-13 16:31:07 UTC

/bin/bash -c #(nop) ARG PIP_INDEX=https://pypi.org/simple

2025-09-13 16:48:30 UTC

|2 LLAMA_CPP_USE_CUDA=true PIP_INDEX=https://pypi.org/simple /bin/bash -c pip install --upgrade -i "$PIP_INDEX" pip setuptools wheel && apt-get -y update && ( wget -O openfst-1.7.2.tar.gz http://www.openslr.org/resources/2/openfst-1.7.2.tar.gz || wget -O openfst-1.7.2.tar.gz https://www.openfst.org/twiki/pub/FST/FstDownload/openfst-1.7.2.tar.gz ) && tar zxvf openfst-1.7.2.tar.gz && cd openfst-1.7.2 && ./configure --enable-shared --enable-static && make -j$(nproc) && make install && ldconfig && CPLUS_INCLUDE_PATH=/usr/local/include LIBRARY_PATH=/usr/local/lib LD_LIBRARY_PATH=/usr/local/lib:$LD_LIBRARY_PATH pip install -i "$PIP_INDEX" pynini==2.1.6.post1 && apt install -y wget curl procps git libgl1 rsync sqlite libpcre3 libpcre3-dev dmidecode libssl-dev perl make build-essential zlib1g-dev && apt-get -yq clean && pip install -i "$PIP_INDEX" "diskcache>=5.6.1" "jinja2>=2.11.3" && pip install -i "$PIP_INDEX" "cython>=0.29" && pip install -i "$PIP_INDEX" --upgrade-strategy only-if-needed -r /opt/inference/xinference/deploy/docker/requirements_12.8/requirements-cu128-base.txt && pip install -i "$PIP_INDEX" --upgrade-strategy only-if-needed -r /opt/inference/xinference/deploy/docker/requirements_12.8/requirements-cu128-ml.txt && pip install -i "$PIP_INDEX" --upgrade-strategy only-if-needed -r /opt/inference/xinference/deploy/docker/requirements_12.8/requirements-cu128-models.txt && pip install -i "$PIP_INDEX" transformers>=4.51.3 && pip install -i "$PIP_INDEX" --no-deps sglang==0.4.6.post5 && pip install https://github.com/sgl-project/whl/releases/download/v0.2.6/sgl_kernel-0.2.6+cu128-cp39-abi3-manylinux2014_x86_64.whl && pip install -i "$PIP_INDEX" wetext && pip uninstall flashinfer -y && pip install -i "$PIP_INDEX" flashinfer-python && pip install -i "$PIP_INDEX" SQLAlchemy==1.4.54 && pip install https://github.com/mjun0812/flash-attention-prebuild-wheels/releases/download/v0.3.18/flash_attn-2.7.4+cu124torch2.7-cp312-cp312-linux_x86_64.whl && cd /opt/inference && 
python3 setup.py build_web && git restore . && pip install -i "$PIP_INDEX" --no-deps "." && pip uninstall xllamacpp -y && wget https://ghproxy.cn/https://github.com/xorbitsai/xllamacpp/releases/download/v0.2.0-cu124/xllamacpp-0.2.0-cp312-cp312-linux_x86_64.whl && pip install xllamacpp-0.2.0-cp312-cp312-linux_x86_64.whl && pip cache purge

2025-09-13 16:49:03 UTC

|2 LLAMA_CPP_USE_CUDA=true PIP_INDEX=https://pypi.org/simple /bin/bash -c wget -O Miniforge3.sh "https://github.com/conda-forge/miniforge/releases/download/4.12.0-0/Miniforge3-4.12.0-0-Linux-x86_64.sh" && bash Miniforge3.sh -b -p /opt/conda && rm Miniforge3.sh

2025-09-13 16:52:42 UTC

|2 LLAMA_CPP_USE_CUDA=true PIP_INDEX=https://pypi.org/simple /bin/bash -c /opt/conda/bin/conda create -n ffmpeg-env -c conda-forge 'ffmpeg<7' -y && ln -s /opt/conda/envs/ffmpeg-env/bin/ffmpeg /usr/local/bin/ffmpeg && ln -s /opt/conda/envs/ffmpeg-env/bin/ffprobe /usr/local/bin/ffprobe && /opt/conda/bin/conda clean --all -y

2025-09-13 16:52:47 UTC

|2 LLAMA_CPP_USE_CUDA=true PIP_INDEX=https://pypi.org/simple /bin/bash -c pip3 install --pre torch torchvision torchaudio --index-url https://download.pytorch.org/whl/nightly/cu128 --no-deps

2025-09-13 16:52:47 UTC

/bin/bash -c #(nop) ENTRYPOINT []

2025-09-13 16:52:47 UTC

/bin/bash -c #(nop) CMD ["/bin/bash"]

Danger Zone
Delete Tag

Please be careful: this will delete not just the tag reference but also the actual image content!

For example, when latest and v1.2.3 both point to the same image,
deleting latest will also permanently remove v1.2.3.

Delete