Namespace
xprobe
Image / Tag
xinference:v1.7.0.post1
Content Digest
sha256:5370c46eb5325f3e831a189bec96d7ac32b7bf89366df8ab861be2d9f067a368
Details
Created

2025-06-13 17:48:07 UTC

Size

11.5 GB

Content Digest
Labels
  • maintainer
    NVIDIA CORPORATION <cudatools@nvidia.com>
  • org.opencontainers.image.ref.name
    ubuntu
  • org.opencontainers.image.version
    20.04

Environment
CUDA_VERSION

12.4.1

DEBIAN_FRONTEND

noninteractive

FLASH_ATTENTION_SKIP_CUDA_BUILD

TRUE

LD_LIBRARY_PATH

/usr/local/nvidia/lib:/usr/local/nvidia/lib64:/usr/local/lib/python3.10/dist-packages/nvidia/cublas/lib

NODE_VERSION

14.21.1

NVARCH

x86_64

NVIDIA_DRIVER_CAPABILITIES

compute,utility

NVIDIA_REQUIRE_CUDA

cuda>=12.4 brand=tesla,driver>=470,driver<471 brand=unknown,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=geforce,driver>=470,driver<471 brand=geforcertx,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=titan,driver>=470,driver<471 brand=titanrtx,driver>=470,driver<471 brand=tesla,driver>=525,driver<526 brand=unknown,driver>=525,driver<526 brand=nvidia,driver>=525,driver<526 brand=nvidiartx,driver>=525,driver<526 brand=geforce,driver>=525,driver<526 brand=geforcertx,driver>=525,driver<526 brand=quadro,driver>=525,driver<526 brand=quadrortx,driver>=525,driver<526 brand=titan,driver>=525,driver<526 brand=titanrtx,driver>=525,driver<526 brand=tesla,driver>=535,driver<536 brand=unknown,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=geforce,driver>=535,driver<536 brand=geforcertx,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=titan,driver>=535,driver<536 brand=titanrtx,driver>=535,driver<536

NVIDIA_VISIBLE_DEVICES

all

NVM_DIR

/usr/local/nvm

NV_CUDA_COMPAT_PACKAGE

cuda-compat-12-4

NV_CUDA_CUDART_VERSION

12.4.127-1

PATH

/usr/local/nvm/versions/node/v14.21.1/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

VLLM_USAGE_SOURCE

production-docker-image


Layers

[#000] sha256:43cfb69dbb464ebad014cd4687bf02ee4f5011d540916c658af36faafbfd3481 - 0.22% (26.2 MB)

[#001] sha256:fbcd35dc5bc3a7bda41926aadd083020f942b001ebac6f1d30480f0f065394c0 - 0.06% (7.58 MB)

[#002] sha256:c7232af9ae05f7de83f8d6171bd0c35a4dd0a85ebafb15b950dbc08f89ea5fb5 - 0.47% (54.9 MB)

[#003] sha256:db6cdef1932a0d9ca6ef9a539e08d491f66d1b1ed81926ae1525375bdd8100cc - 0.0% (185 Bytes)

[#004] sha256:56dc8550293751a1604e97ac949cfae82ba20cb2a28e034737bafd7382559609 - 0.0% (6.72 KB)

[#005] sha256:9f61b3db38d69dddb7c6f05c299c875b3c7b6d97869e2f96bf128865bb80bd73 - 0.0% (104 Bytes)

[#006] sha256:0bd39d0469a8457b392113410f3125a0859d6e5f6d48ad8582bd4fa69650c458 - 0.0% (230 Bytes)

[#007] sha256:d22ff5f4aac61b315f6054a8a18ecbe9dcd3afad842ea601397dd9f728312da4 - 1.87% (220 MB)

[#008] sha256:d866993704f54dbc8fb066ffc01f4e0e0645617600bba305452c241dcedb7c11 - 0.0% (6.74 KB)

[#009] sha256:b4918d864665c1c0b4ab2df2c6951e0b7ec94e90b425d1586ef70aa05f2a6321 - 28.62% (3.3 GB)

[#010] sha256:e93cc01aab8b268f0f4cc7c62ca1401d317824b9c76b99c5dafb6e43981af2c5 - 10.82% (1.25 GB)

[#011] sha256:fd30840e514de4a28db901cf841543e45fc262213c5eb1dea29b38901020c9bd - 0.12% (14.4 MB)

[#012] sha256:e9730b1a006ea6204ab007ea6e4d6543b9d5b4d3603975eb80f249baae0d736e - 0.88% (103 MB)

[#013] sha256:15094d73c48ca9de90901a20c450a6a76b3b41405948e23d0fd095b19dd3dd99 - 1.56% (183 MB)

[#014] sha256:aa4522bf0b02abd3aed9a62efa5e3f27c58e0b08850ead5a29bc9ad9d3da892a - 52.24% (6.02 GB)

[#015] sha256:20820024388145c224eae52945ea7e0af2356e0dcad2c153c2a1b1ac366ec4e3 - 1.86% (220 MB)

[#016] sha256:01472ed2757640da87c42b19b2ce975367fdb4be0bd7244fba5a4ada3704263e - 1.28% (151 MB)


History
2024-04-10 18:50:35 UTC

/bin/sh -c #(nop) ARG RELEASE

2024-04-10 18:50:35 UTC

/bin/sh -c #(nop) ARG LAUNCHPAD_BUILD_ARCH

2024-04-10 18:50:35 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.ref.name=ubuntu

2024-04-10 18:50:35 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.version=20.04

2024-04-10 18:50:37 UTC

/bin/sh -c #(nop) ADD file:ea2128e23dce0162557abadd80656bd5ae047d573095d1d4323eb4154490dfdc in /

2024-04-10 18:50:37 UTC

/bin/sh -c #(nop) CMD ["/bin/bash"]

2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)

ENV NVARCH=x86_64

2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_REQUIRE_CUDA=cuda>=12.4 brand=tesla,driver>=470,driver<471 brand=unknown,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=geforce,driver>=470,driver<471 brand=geforcertx,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=titan,driver>=470,driver<471 brand=titanrtx,driver>=470,driver<471 brand=tesla,driver>=525,driver<526 brand=unknown,driver>=525,driver<526 brand=nvidia,driver>=525,driver<526 brand=nvidiartx,driver>=525,driver<526 brand=geforce,driver>=525,driver<526 brand=geforcertx,driver>=525,driver<526 brand=quadro,driver>=525,driver<526 brand=quadrortx,driver>=525,driver<526 brand=titan,driver>=525,driver<526 brand=titanrtx,driver>=525,driver<526 brand=tesla,driver>=535,driver<536 brand=unknown,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=geforce,driver>=535,driver<536 brand=geforcertx,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=titan,driver>=535,driver<536 brand=titanrtx,driver>=535,driver<536

2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_CUDART_VERSION=12.4.127-1

2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_COMPAT_PACKAGE=cuda-compat-12-4

2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSL https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2004/${NVARCH}/3bf863cc.pub | apt-key add - && echo "deb https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2004/${NVARCH} /" > /etc/apt/sources.list.d/cuda.list && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit

2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)

ENV CUDA_VERSION=12.4.1

2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-4=${NV_CUDA_CUDART_VERSION} ${NV_CUDA_COMPAT_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit

2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/nvidia/lib" >> /etc/ld.so.conf.d/nvidia.conf && echo "/usr/local/nvidia/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit

2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)

ENV PATH=/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)

ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib:/usr/local/nvidia/lib64

2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)

COPY NGC-DL-CONTAINER-LICENSE / # buildkit

2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_VISIBLE_DEVICES=all

2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility

2024-07-23 00:03:19 -0700 (buildkit.dockerfile.v0)

ARG CUDA_VERSION=12.4.1

2024-07-23 00:03:19 -0700 (buildkit.dockerfile.v0)

ARG PYTHON_VERSION=3.10

2024-07-23 00:03:19 -0700 (buildkit.dockerfile.v0)

WORKDIR /vllm-workspace

2024-07-23 00:03:19 -0700 (buildkit.dockerfile.v0)

ENV DEBIAN_FRONTEND=noninteractive

2024-09-04 16:36:15 -0700 (buildkit.dockerfile.v0)

RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.10 /bin/sh -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit

2024-09-04 16:39:00 -0700 (buildkit.dockerfile.v0)

RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.10 /bin/sh -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y ccache software-properties-common git curl sudo vim python3-pip && add-apt-repository ppa:deadsnakes/ppa && apt-get update -y && apt-get install -y python${PYTHON_VERSION} python${PYTHON_VERSION}-dev python${PYTHON_VERSION}-venv libibverbs-dev && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PYTHON_VERSION} 1 && update-alternatives --set python3 /usr/bin/python${PYTHON_VERSION} && ln -sf /usr/bin/python${PYTHON_VERSION}-config /usr/bin/python3-config && curl -sS https://bootstrap.pypa.io/get-pip.py | python${PYTHON_VERSION} && python3 --version && python3 -m pip --version # buildkit

2024-09-04 16:39:00 -0700 (buildkit.dockerfile.v0)

RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.10 /bin/sh -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit

2024-09-04 17:26:02 -0700 (buildkit.dockerfile.v0)

RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.10 /bin/sh -c python3 -m pip install dist/*.whl --verbose # buildkit

2024-09-04 17:26:55 -0700 (buildkit.dockerfile.v0)

RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.10 /bin/sh -c . /etc/environment && python3 -m pip install https://github.com/flashinfer-ai/flashinfer/releases/download/v0.1.6/flashinfer-0.1.6+cu121torch2.4-cp${PYTHON_VERSION_STR}-cp${PYTHON_VERSION_STR}-linux_x86_64.whl # buildkit

2024-09-04 17:27:15 -0700 (buildkit.dockerfile.v0)

RUN /bin/sh -c pip install accelerate hf_transfer 'modelscope!=1.15.0' # buildkit

2024-09-04 17:27:15 -0700 (buildkit.dockerfile.v0)

ENV VLLM_USAGE_SOURCE=production-docker-image

2024-09-04 17:27:15 -0700 (buildkit.dockerfile.v0)

ENTRYPOINT ["python3" "-m" "vllm.entrypoints.openai.api_server"]

2025-06-13 17:27:12 UTC

/bin/sh -c #(nop) COPY dir:015665f89cdf45967938f7012458c48c75ab4196899ffa302bc6788ef46bf86f in /opt/inference

2025-06-13 17:27:15 UTC

/bin/sh -c #(nop) WORKDIR /opt/inference

2025-06-13 17:27:15 UTC

/bin/sh -c #(nop) ENV NVM_DIR=/usr/local/nvm

2025-06-13 17:27:15 UTC

/bin/sh -c #(nop) ENV NODE_VERSION=14.21.1

2025-06-13 17:28:13 UTC

/bin/sh -c apt-get -y update && apt install -y wget curl procps git libgl1 && printf "\ndeb https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ jammy main restricted universe multiverse" >> /etc/apt/sources.list && apt-get -y update && apt-get install -y --only-upgrade libstdc++6 && apt install -y libc6 && mkdir -p $NVM_DIR && curl -o- https://raw.githubusercontent.com/nvm-sh/nvm/v0.39.7/install.sh | bash && . $NVM_DIR/nvm.sh && nvm install $NODE_VERSION && nvm alias default $NODE_VERSION && nvm use default && apt-get -yq clean

2025-06-13 17:28:16 UTC

/bin/sh -c #(nop) ENV PATH=/usr/local/nvm/versions/node/v14.21.1/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

2025-06-13 17:28:16 UTC

/bin/sh -c #(nop) ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib:/usr/local/nvidia/lib64:/usr/local/lib/python3.10/dist-packages/nvidia/cublas/lib

2025-06-13 17:28:17 UTC

/bin/sh -c #(nop) ENV FLASH_ATTENTION_SKIP_CUDA_BUILD=TRUE

2025-06-13 17:28:17 UTC

/bin/sh -c #(nop) ARG PIP_INDEX=https://pypi.org/simple

2025-06-13 17:47:03 UTC

|1 PIP_INDEX=https://pypi.org/simple /bin/sh -c pip install --upgrade -i "$PIP_INDEX" pip setuptools wheel&& pip install -i "$PIP_INDEX" "diskcache>=5.6.1" "jinja2>=2.11.3" && pip install flash-attn --no-build-isolation && pip install -i "$PIP_INDEX" --upgrade-strategy only-if-needed -r /opt/inference/xinference/deploy/docker/requirements-base.txt && pip install -i "$PIP_INDEX" --upgrade-strategy only-if-needed -r /opt/inference/xinference/deploy/docker/requirements-ml.txt && pip install -i "$PIP_INDEX" --upgrade-strategy only-if-needed -r /opt/inference/xinference/deploy/docker/requirements-models.txt && pip install -i "$PIP_INDEX" transformers>=4.51.3 && pip install -i "$PIP_INDEX" --no-deps sglang && pip uninstall flashinfer -y && pip install flashinfer-python -i https://flashinfer.ai/whl/cu124/torch2.6 && cd /opt/inference && python3 setup.py build_web && git restore . && pip install -i "$PIP_INDEX" --no-deps "." && pip uninstall xllamacpp -y && pip install "xllamacpp>=0.1.18" --index-url https://xorbitsai.github.io/xllamacpp/whl/cu124 && pip cache purge

2025-06-13 17:47:32 UTC

|1 PIP_INDEX=https://pypi.org/simple /bin/sh -c wget -O Miniforge3.sh "https://github.com/conda-forge/miniforge/releases/latest/download/Miniforge3-$(uname)-$(uname -m).sh" && bash Miniforge3.sh -b -p /opt/conda && rm Miniforge3.sh

2025-06-13 17:48:04 UTC

|1 PIP_INDEX=https://pypi.org/simple /bin/sh -c /opt/conda/bin/conda create -n ffmpeg-env -c conda-forge 'ffmpeg<7' -y && ln -s /opt/conda/envs/ffmpeg-env/bin/ffmpeg /usr/local/bin/ffmpeg && ln -s /opt/conda/envs/ffmpeg-env/bin/ffprobe /usr/local/bin/ffprobe && /opt/conda/bin/conda clean --all -y

2025-06-13 17:48:07 UTC

/bin/sh -c #(nop) ENTRYPOINT []

2025-06-13 17:48:07 UTC

/bin/sh -c #(nop) CMD ["/bin/bash"]

Danger Zone
Delete Tag

Please be careful: this will delete not just the tag reference but also the actual image content!

For example, if latest and v1.2.3 both point to the same image,
deleting latest will also permanently remove v1.2.3.

Delete