llama-swap-build-vllm (sha256:368b7d468c7d15e57c62704f41d11e5603a7a85659a2bf43e5d593e9fea805d2)
Installation
docker pull gitea.simcop2387.info/simcop2387/llama-swap-build-vllm@sha256:368b7d468c7d15e57c62704f41d11e5603a7a85659a2bf43e5d593e9fea805d2
sha256:368b7d468c7d15e57c62704f41d11e5603a7a85659a2bf43e5d593e9fea805d2
Image layers
| ARG RELEASE |
| ARG LAUNCHPAD_BUILD_ARCH |
| LABEL org.opencontainers.image.ref.name=ubuntu |
| LABEL org.opencontainers.image.version=24.04 |
| ADD file:6df775300d76441aa33f31b22c1afce8dfe35c8ffbc14ef27c27009235b12a95 in / |
| CMD ["/bin/bash"] |
| ENV NVARCH=x86_64 |
| ENV NVIDIA_REQUIRE_CUDA=cuda>=12.8 brand=unknown,driver>=470,driver<471 brand=grid,driver>=470,driver<471 brand=tesla,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=vapps,driver>=470,driver<471 brand=vpc,driver>=470,driver<471 brand=vcs,driver>=470,driver<471 brand=vws,driver>=470,driver<471 brand=cloudgaming,driver>=470,driver<471 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 
brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566 |
| ENV NV_CUDA_CUDART_VERSION=12.8.90-1 |
| ARG TARGETARCH |
| LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com> |
| RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSL https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2404/${NVARCH}/3bf863cc.pub | apt-key add - && echo "deb https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2404/${NVARCH} /" > /etc/apt/sources.list.d/cuda.list && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit |
| ENV CUDA_VERSION=12.8.1 |
| RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-8=${NV_CUDA_CUDART_VERSION} cuda-compat-12-8 && rm -rf /var/lib/apt/lists/* # buildkit |
| RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/cuda/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit |
| ENV PATH=/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin |
| ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64 |
| COPY NGC-DL-CONTAINER-LICENSE / # buildkit |
| ENV NVIDIA_VISIBLE_DEVICES=all |
| ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility |
| ENV NV_CUDA_LIB_VERSION=12.8.1-1 |
| ENV NV_NVTX_VERSION=12.8.90-1 |
| ENV NV_LIBNPP_VERSION=12.3.3.100-1 |
| ENV NV_LIBNPP_PACKAGE=libnpp-12-8=12.3.3.100-1 |
| ENV NV_LIBCUSPARSE_VERSION=12.5.8.93-1 |
| ENV NV_LIBCUBLAS_PACKAGE_NAME=libcublas-12-8 |
| ENV NV_LIBCUBLAS_VERSION=12.8.4.1-1 |
| ENV NV_LIBCUBLAS_PACKAGE=libcublas-12-8=12.8.4.1-1 |
| ENV NV_LIBNCCL_PACKAGE_NAME=libnccl2 |
| ENV NV_LIBNCCL_PACKAGE_VERSION=2.25.1-1 |
| ENV NCCL_VERSION=2.25.1-1 |
| ENV NV_LIBNCCL_PACKAGE=libnccl2=2.25.1-1+cuda12.8 |
| ARG TARGETARCH |
| LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com> |
| RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-libraries-12-8=${NV_CUDA_LIB_VERSION} ${NV_LIBNPP_PACKAGE} cuda-nvtx-12-8=${NV_NVTX_VERSION} libcusparse-12-8=${NV_LIBCUSPARSE_VERSION} ${NV_LIBCUBLAS_PACKAGE} ${NV_LIBNCCL_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit |
| RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_PACKAGE_NAME} ${NV_LIBNCCL_PACKAGE_NAME} # buildkit |
| COPY entrypoint.d/ /opt/nvidia/entrypoint.d/ # buildkit |
| COPY nvidia_entrypoint.sh /opt/nvidia/ # buildkit |
| ENV NVIDIA_PRODUCT_NAME=CUDA |
| ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"] |
| ENV NV_CUDA_LIB_VERSION=12.8.1-1 |
| ENV NV_CUDA_CUDART_DEV_VERSION=12.8.90-1 |
| ENV NV_NVML_DEV_VERSION=12.8.90-1 |
| ENV NV_LIBCUSPARSE_DEV_VERSION=12.5.8.93-1 |
| ENV NV_LIBNPP_DEV_VERSION=12.3.3.100-1 |
| ENV NV_LIBNPP_DEV_PACKAGE=libnpp-dev-12-8=12.3.3.100-1 |
| ENV NV_LIBCUBLAS_DEV_VERSION=12.8.4.1-1 |
| ENV NV_LIBCUBLAS_DEV_PACKAGE_NAME=libcublas-dev-12-8 |
| ENV NV_LIBCUBLAS_DEV_PACKAGE=libcublas-dev-12-8=12.8.4.1-1 |
| ENV NV_CUDA_NSIGHT_COMPUTE_VERSION=12.8.1-1 |
| ENV NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE=cuda-nsight-compute-12-8=12.8.1-1 |
| ENV NV_NVPROF_VERSION=12.8.90-1 |
| ENV NV_NVPROF_DEV_PACKAGE=cuda-nvprof-12-8=12.8.90-1 |
| ENV NV_LIBNCCL_DEV_PACKAGE_NAME=libnccl-dev |
| ENV NV_LIBNCCL_DEV_PACKAGE_VERSION=2.25.1-1 |
| ENV NCCL_VERSION=2.25.1-1 |
| ENV NV_LIBNCCL_DEV_PACKAGE=libnccl-dev=2.25.1-1+cuda12.8 |
| ARG TARGETARCH |
| LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com> |
| RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-dev-12-8=${NV_CUDA_CUDART_DEV_VERSION} cuda-command-line-tools-12-8=${NV_CUDA_LIB_VERSION} cuda-minimal-build-12-8=${NV_CUDA_LIB_VERSION} cuda-libraries-dev-12-8=${NV_CUDA_LIB_VERSION} cuda-nvml-dev-12-8=${NV_NVML_DEV_VERSION} ${NV_NVPROF_DEV_PACKAGE} ${NV_LIBNPP_DEV_PACKAGE} libcusparse-dev-12-8=${NV_LIBCUSPARSE_DEV_VERSION} ${NV_LIBCUBLAS_DEV_PACKAGE} ${NV_LIBNCCL_DEV_PACKAGE} ${NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit |
| RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_DEV_PACKAGE_NAME} ${NV_LIBNCCL_DEV_PACKAGE_NAME} # buildkit |
| ENV LIBRARY_PATH=/usr/local/cuda/lib64/stubs |
| ENV NV_CUDNN_VERSION=9.8.0.87-1 |
| ENV NV_CUDNN_PACKAGE_NAME=libcudnn9-cuda-12 |
| ENV NV_CUDNN_PACKAGE=libcudnn9-cuda-12=9.8.0.87-1 |
| ENV NV_CUDNN_PACKAGE_DEV=libcudnn9-dev-cuda-12=9.8.0.87-1 |
| ARG TARGETARCH |
| LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com> |
| LABEL com.nvidia.cudnn.version=9.8.0.87-1 |
| RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends ${NV_CUDNN_PACKAGE} ${NV_CUDNN_PACKAGE_DEV} && apt-mark hold ${NV_CUDNN_PACKAGE_NAME} && rm -rf /var/lib/apt/lists/* # buildkit |
| ARG PYTHON_VER=3.10 |
| ARG CUDA_DOCKER_ARCH=61;70;75;80;86;89 |
| RUN |2 PYTHON_VER=3.10 CUDA_DOCKER_ARCH=61;70;75;80;86;89 /bin/sh -c apt-get update && apt-get install -y git python3 build-essential git cmake libcurl4-openssl-dev curl ccache pkg-config make build-essential libssl-dev zlib1g-dev libbz2-dev libreadline-dev libsqlite3-dev curl git golang ninja-build libncursesw5-dev xz-utils tk-dev libxml2-dev libxmlsec1-dev libffi-dev liblzma-dev libzstd-dev libgomp1 && apt autoremove -y && apt clean -y && rm -rf /tmp/* /var/tmp/* && find /var/cache/apt/archives /var/lib/apt/lists -not -name lock -type f -delete && find /var/cache -type f -delete # buildkit |
| ARG PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl |
| ARG PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly |
| ENV PYENV_ROOT=/.pyenv |
| ENV PATH=/.pyenv/shims:/.pyenv/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin |
| RUN |4 PYTHON_VER=3.10 CUDA_DOCKER_ARCH=61;70;75;80;86;89 PYTORCH_CUDA_INDEX_BASE_URL=https://download.pytorch.org/whl PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL=https://download.pytorch.org/whl/nightly /bin/sh -c curl -fsSL https://pyenv.run | bash && pyenv install --verbose $PYTHON_VER && pyenv global $PYTHON_VER && pyenv rehash && pip install --upgrade setuptools wheel pip # buildkit |
| COPY ./vllm-mirror /build/vllm/ # buildkit |
| WORKDIR /build/vllm/ |
| ARG PYTORCH_CUDA_INDEX_BASE_URL |
| ARG PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL |
| RUN |2 PYTORCH_CUDA_INDEX_BASE_URL= PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL= /bin/sh -c pip install -r requirements/build.txt # buildkit |
| RUN |2 PYTORCH_CUDA_INDEX_BASE_URL= PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL= /bin/sh -c pip install -v -r requirements/cuda.txt # buildkit |
| RUN |2 PYTORCH_CUDA_INDEX_BASE_URL= PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL= /bin/sh -c SETUPTOOLS_SCM_PRETEND_VERSION=v0.11.0 VLLM_TARGET_DEVICE=cuda python3 setup.py bdist_wheel # buildkit |
| RUN |2 PYTORCH_CUDA_INDEX_BASE_URL= PYTORCH_CUDA_NIGHTLY_INDEX_BASE_URL= /bin/sh -c sh -c 'ls /build/vllm -la; ls -la /build/vllm/dist; /bin/true' # buildkit |
Labels
| Key | Value |
|---|---|
| com.nvidia.cudnn.version | 9.8.0.87-1 |
| maintainer | NVIDIA CORPORATION <cudatools@nvidia.com> |
| org.opencontainers.image.created | 2025-12-01T17:32:59.901Z |
| org.opencontainers.image.description | |
| org.opencontainers.image.licenses | |
| org.opencontainers.image.ref.name | ubuntu |
| org.opencontainers.image.revision | 4968efd5fe6fb6a06adc15e17d62c832c8f00b2d |
| org.opencontainers.image.source | https://gitea.simcop2387.info/simcop2387/llama-swap-infra |
| org.opencontainers.image.title | llama-swap-infra |
| org.opencontainers.image.url | https://gitea.simcop2387.info/simcop2387/llama-swap-infra |
| org.opencontainers.image.version | main |
Details
2025-12-01 12:33:51 -05:00
Versions (9)
View all
Container
0
OCI / Docker
linux/amd64
20 GiB
main
2025-12-02
latest
2025-12-02
413-2025-12-02
2025-12-02
411-2025-12-01
2025-12-01
409-2025-12-01
2025-12-01