2025-06-13 17:48:07 UTC
11.5 GB
12.4.1
DEBIAN_FRONTENDnoninteractive
FLASH_ATTENTION_SKIP_CUDA_BUILDTRUE
LD_LIBRARY_PATH/usr/local/nvidia/lib:/usr/local/nvidia/lib64:/usr/local/lib/python3.10/dist-packages/nvidia/cublas/lib
NODE_VERSION14.21.1
NVARCHx86_64
NVIDIA_DRIVER_CAPABILITIEScompute,utility
NVIDIA_REQUIRE_CUDAcuda>=12.4 brand=tesla,driver>=470,driver<471 brand=unknown,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=geforce,driver>=470,driver<471 brand=geforcertx,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=titan,driver>=470,driver<471 brand=titanrtx,driver>=470,driver<471 brand=tesla,driver>=525,driver<526 brand=unknown,driver>=525,driver<526 brand=nvidia,driver>=525,driver<526 brand=nvidiartx,driver>=525,driver<526 brand=geforce,driver>=525,driver<526 brand=geforcertx,driver>=525,driver<526 brand=quadro,driver>=525,driver<526 brand=quadrortx,driver>=525,driver<526 brand=titan,driver>=525,driver<526 brand=titanrtx,driver>=525,driver<526 brand=tesla,driver>=535,driver<536 brand=unknown,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=geforce,driver>=535,driver<536 brand=geforcertx,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=titan,driver>=535,driver<536 brand=titanrtx,driver>=535,driver<536
NVIDIA_VISIBLE_DEVICESall
NVM_DIR/usr/local/nvm
NV_CUDA_COMPAT_PACKAGEcuda-compat-12-4
NV_CUDA_CUDART_VERSION12.4.127-1
PATH/usr/local/nvm/versions/node/v14.21.1/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
VLLM_USAGE_SOURCEproduction-docker-image
[#000] sha256:43cfb69dbb464ebad014cd4687bf02ee4f5011d540916c658af36faafbfd3481 - 0.22% (26.2 MB)
[#001] sha256:fbcd35dc5bc3a7bda41926aadd083020f942b001ebac6f1d30480f0f065394c0 - 0.06% (7.58 MB)
[#002] sha256:c7232af9ae05f7de83f8d6171bd0c35a4dd0a85ebafb15b950dbc08f89ea5fb5 - 0.47% (54.9 MB)
[#003] sha256:db6cdef1932a0d9ca6ef9a539e08d491f66d1b1ed81926ae1525375bdd8100cc - 0.0% (185 Bytes)
[#004] sha256:56dc8550293751a1604e97ac949cfae82ba20cb2a28e034737bafd7382559609 - 0.0% (6.72 KB)
[#005] sha256:9f61b3db38d69dddb7c6f05c299c875b3c7b6d97869e2f96bf128865bb80bd73 - 0.0% (104 Bytes)
[#006] sha256:0bd39d0469a8457b392113410f3125a0859d6e5f6d48ad8582bd4fa69650c458 - 0.0% (230 Bytes)
[#007] sha256:d22ff5f4aac61b315f6054a8a18ecbe9dcd3afad842ea601397dd9f728312da4 - 1.87% (220 MB)
[#008] sha256:d866993704f54dbc8fb066ffc01f4e0e0645617600bba305452c241dcedb7c11 - 0.0% (6.74 KB)
[#009] sha256:b4918d864665c1c0b4ab2df2c6951e0b7ec94e90b425d1586ef70aa05f2a6321 - 28.62% (3.3 GB)
[#010] sha256:e93cc01aab8b268f0f4cc7c62ca1401d317824b9c76b99c5dafb6e43981af2c5 - 10.82% (1.25 GB)
[#011] sha256:fd30840e514de4a28db901cf841543e45fc262213c5eb1dea29b38901020c9bd - 0.12% (14.4 MB)
[#012] sha256:e9730b1a006ea6204ab007ea6e4d6543b9d5b4d3603975eb80f249baae0d736e - 0.88% (103 MB)
[#013] sha256:15094d73c48ca9de90901a20c450a6a76b3b41405948e23d0fd095b19dd3dd99 - 1.56% (183 MB)
[#014] sha256:aa4522bf0b02abd3aed9a62efa5e3f27c58e0b08850ead5a29bc9ad9d3da892a - 52.24% (6.02 GB)
[#015] sha256:20820024388145c224eae52945ea7e0af2356e0dcad2c153c2a1b1ac366ec4e3 - 1.86% (220 MB)
[#016] sha256:01472ed2757640da87c42b19b2ce975367fdb4be0bd7244fba5a4ada3704263e - 1.28% (151 MB)
/bin/sh -c #(nop) ARG RELEASE
2024-04-10 18:50:35 UTC/bin/sh -c #(nop) ARG LAUNCHPAD_BUILD_ARCH
2024-04-10 18:50:35 UTC/bin/sh -c #(nop) LABEL org.opencontainers.image.ref.name=ubuntu
2024-04-10 18:50:35 UTC/bin/sh -c #(nop) LABEL org.opencontainers.image.version=20.04
2024-04-10 18:50:37 UTC/bin/sh -c #(nop) ADD file:ea2128e23dce0162557abadd80656bd5ae047d573095d1d4323eb4154490dfdc in /
2024-04-10 18:50:37 UTC/bin/sh -c #(nop) CMD ["/bin/bash"]
2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)ENV NVARCH=x86_64
2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)ENV NVIDIA_REQUIRE_CUDA=cuda>=12.4 brand=tesla,driver>=470,driver<471 brand=unknown,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=geforce,driver>=470,driver<471 brand=geforcertx,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=titan,driver>=470,driver<471 brand=titanrtx,driver>=470,driver<471 brand=tesla,driver>=525,driver<526 brand=unknown,driver>=525,driver<526 brand=nvidia,driver>=525,driver<526 brand=nvidiartx,driver>=525,driver<526 brand=geforce,driver>=525,driver<526 brand=geforcertx,driver>=525,driver<526 brand=quadro,driver>=525,driver<526 brand=quadrortx,driver>=525,driver<526 brand=titan,driver>=525,driver<526 brand=titanrtx,driver>=525,driver<526 brand=tesla,driver>=535,driver<536 brand=unknown,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=geforce,driver>=535,driver<536 brand=geforcertx,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=titan,driver>=535,driver<536 brand=titanrtx,driver>=535,driver<536
2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_CUDART_VERSION=12.4.127-1
2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)ENV NV_CUDA_COMPAT_PACKAGE=cuda-compat-12-4
2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)ARG TARGETARCH
2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)LABEL maintainer=NVIDIA CORPORATION <[email protected]>
2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSL https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2004/${NVARCH}/3bf863cc.pub | apt-key add - && echo "deb https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2004/${NVARCH} /" > /etc/apt/sources.list.d/cuda.list && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit
2024-04-22 23:42:24 UTC (buildkit.dockerfile.v0)ENV CUDA_VERSION=12.4.1
2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-4=${NV_CUDA_CUDART_VERSION} ${NV_CUDA_COMPAT_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit
2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/nvidia/lib" >> /etc/ld.so.conf.d/nvidia.conf && echo "/usr/local/nvidia/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit
2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)ENV PATH=/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib:/usr/local/nvidia/lib64
2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)COPY NGC-DL-CONTAINER-LICENSE / # buildkit
2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)ENV NVIDIA_VISIBLE_DEVICES=all
2024-04-22 23:42:36 UTC (buildkit.dockerfile.v0)ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility
2024-07-23 00:03:19 -0700 (buildkit.dockerfile.v0)ARG CUDA_VERSION=12.4.1
2024-07-23 00:03:19 -0700 (buildkit.dockerfile.v0)ARG PYTHON_VERSION=3.10
2024-07-23 00:03:19 -0700 (buildkit.dockerfile.v0)WORKDIR /vllm-workspace
2024-07-23 00:03:19 -0700 (buildkit.dockerfile.v0)ENV DEBIAN_FRONTEND=noninteractive
2024-09-04 16:36:15 -0700 (buildkit.dockerfile.v0)RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.10 /bin/sh -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit
2024-09-04 16:39:00 -0700 (buildkit.dockerfile.v0)RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.10 /bin/sh -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y ccache software-properties-common git curl sudo vim python3-pip && add-apt-repository ppa:deadsnakes/ppa && apt-get update -y && apt-get install -y python${PYTHON_VERSION} python${PYTHON_VERSION}-dev python${PYTHON_VERSION}-venv libibverbs-dev && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PYTHON_VERSION} 1 && update-alternatives --set python3 /usr/bin/python${PYTHON_VERSION} && ln -sf /usr/bin/python${PYTHON_VERSION}-config /usr/bin/python3-config && curl -sS https://bootstrap.pypa.io/get-pip.py | python${PYTHON_VERSION} && python3 --version && python3 -m pip --version # buildkit
2024-09-04 16:39:00 -0700 (buildkit.dockerfile.v0)RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.10 /bin/sh -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit
2024-09-04 17:26:02 -0700 (buildkit.dockerfile.v0)RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.10 /bin/sh -c python3 -m pip install dist/*.whl --verbose # buildkit
2024-09-04 17:26:55 -0700 (buildkit.dockerfile.v0)RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.10 /bin/sh -c . /etc/environment && python3 -m pip install https://github.com/flashinfer-ai/flashinfer/releases/download/v0.1.6/flashinfer-0.1.6+cu121torch2.4-cp${PYTHON_VERSION_STR}-cp${PYTHON_VERSION_STR}-linux_x86_64.whl # buildkit
2024-09-04 17:27:15 -0700 (buildkit.dockerfile.v0)RUN /bin/sh -c pip install accelerate hf_transfer 'modelscope!=1.15.0' # buildkit
2024-09-04 17:27:15 -0700 (buildkit.dockerfile.v0)ENV VLLM_USAGE_SOURCE=production-docker-image
2024-09-04 17:27:15 -0700 (buildkit.dockerfile.v0)ENTRYPOINT ["python3" "-m" "vllm.entrypoints.openai.api_server"]
2025-06-13 17:27:12 UTC/bin/sh -c #(nop) COPY dir:015665f89cdf45967938f7012458c48c75ab4196899ffa302bc6788ef46bf86f in /opt/inference
2025-06-13 17:27:15 UTC/bin/sh -c #(nop) WORKDIR /opt/inference
2025-06-13 17:27:15 UTC/bin/sh -c #(nop) ENV NVM_DIR=/usr/local/nvm
2025-06-13 17:27:15 UTC/bin/sh -c #(nop) ENV NODE_VERSION=14.21.1
2025-06-13 17:28:13 UTC/bin/sh -c apt-get -y update && apt install -y wget curl procps git libgl1 && printf "\ndeb https://mirrors.tuna.tsinghua.edu.cn/ubuntu/ jammy main restricted universe multiverse" >> /etc/apt/sources.list && apt-get -y update && apt-get install -y --only-upgrade libstdc++6 && apt install -y libc6 && mkdir -p $NVM_DIR && curl -o- https://raw.githubusercontent.com/nvm-sh/nvm/v0.39.7/install.sh | bash && . $NVM_DIR/nvm.sh && nvm install $NODE_VERSION && nvm alias default $NODE_VERSION && nvm use default && apt-get -yq clean
2025-06-13 17:28:16 UTC/bin/sh -c #(nop) ENV PATH=/usr/local/nvm/versions/node/v14.21.1/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
2025-06-13 17:28:16 UTC/bin/sh -c #(nop) ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib:/usr/local/nvidia/lib64:/usr/local/lib/python3.10/dist-packages/nvidia/cublas/lib
2025-06-13 17:28:17 UTC/bin/sh -c #(nop) ENV FLASH_ATTENTION_SKIP_CUDA_BUILD=TRUE
2025-06-13 17:28:17 UTC/bin/sh -c #(nop) ARG PIP_INDEX=https://pypi.org/simple
2025-06-13 17:47:03 UTC|1 PIP_INDEX=https://pypi.org/simple /bin/sh -c pip install --upgrade -i "$PIP_INDEX" pip setuptools wheel&& pip install -i "$PIP_INDEX" "diskcache>=5.6.1" "jinja2>=2.11.3" && pip install flash-attn --no-build-isolation && pip install -i "$PIP_INDEX" --upgrade-strategy only-if-needed -r /opt/inference/xinference/deploy/docker/requirements-base.txt && pip install -i "$PIP_INDEX" --upgrade-strategy only-if-needed -r /opt/inference/xinference/deploy/docker/requirements-ml.txt && pip install -i "$PIP_INDEX" --upgrade-strategy only-if-needed -r /opt/inference/xinference/deploy/docker/requirements-models.txt && pip install -i "$PIP_INDEX" transformers>=4.51.3 && pip install -i "$PIP_INDEX" --no-deps sglang && pip uninstall flashinfer -y && pip install flashinfer-python -i https://flashinfer.ai/whl/cu124/torch2.6 && cd /opt/inference && python3 setup.py build_web && git restore . && pip install -i "$PIP_INDEX" --no-deps "." && pip uninstall xllamacpp -y && pip install "xllamacpp>=0.1.18" --index-url https://xorbitsai.github.io/xllamacpp/whl/cu124 && pip cache purge
2025-06-13 17:47:32 UTC|1 PIP_INDEX=https://pypi.org/simple /bin/sh -c wget -O Miniforge3.sh "https://github.com/conda-forge/miniforge/releases/latest/download/Miniforge3-$(uname)-$(uname -m).sh" && bash Miniforge3.sh -b -p /opt/conda && rm Miniforge3.sh
2025-06-13 17:48:04 UTC|1 PIP_INDEX=https://pypi.org/simple /bin/sh -c /opt/conda/bin/conda create -n ffmpeg-env -c conda-forge 'ffmpeg<7' -y && ln -s /opt/conda/envs/ffmpeg-env/bin/ffmpeg /usr/local/bin/ffmpeg && ln -s /opt/conda/envs/ffmpeg-env/bin/ffprobe /usr/local/bin/ffprobe && /opt/conda/bin/conda clean --all -y
2025-06-13 17:48:07 UTC/bin/sh -c #(nop) ENTRYPOINT []
2025-06-13 17:48:07 UTC/bin/sh -c #(nop) CMD ["/bin/bash"]
Please be careful: deleting a tag does not just delete the reference, it also deletes the actual image content!
For example, when latest and v1.2.3 both point to the same image,
deleting latest will also permanently remove v1.2.3.