Namespace
gptbasesparticle
Image / Tag
gb_llmapi:v656
Content Digest
sha256:baa975e426d451af9087b748d70aaad37d22a55d1f1eba881568aec6b7d8d9e3
Details
Created

2025-08-23 02:36:46 UTC

Size

16.5 GB

Content Digest
Labels
  • maintainer
    NVIDIA CORPORATION <cudatools@nvidia.com>
  • org.opencontainers.image.authors
    sparticle
  • org.opencontainers.image.description
    vLLM server optimized for OpenAI GPT-OSS models on Ada Lovelace GPUs
  • org.opencontainers.image.ref.name
    ubuntu
  • org.opencontainers.image.title
    vLLM GPT-OSS Server for Ada GPUs
  • org.opencontainers.image.vendor
    gptbasesparticle
  • org.opencontainers.image.version
    v655

Environment
CUDA_VERSION

12.8.1

CUDA_VISIBLE_DEVICES

all

DEBIAN_FRONTEND

noninteractive

HF_HUB_ENABLE_HF_TRANSFER

1

LD_LIBRARY_PATH

/usr/local/cuda/lib64

LIBRARY_PATH

/usr/local/cuda/lib64/stubs

NCCL_VERSION

2.25.1-1

NVARCH

x86_64

NVIDIA_DRIVER_CAPABILITIES

compute,utility

NVIDIA_PRODUCT_NAME

CUDA

NVIDIA_REQUIRE_CUDA

cuda>=12.8 brand=unknown,driver>=470,driver<471 brand=grid,driver>=470,driver<471 brand=tesla,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=vapps,driver>=470,driver<471 brand=vpc,driver>=470,driver<471 brand=vcs,driver>=470,driver<471 brand=vws,driver>=470,driver<471 brand=cloudgaming,driver>=470,driver<471 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 brand=nvidiartx,driver>=565,driver<566 
brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566

NVIDIA_VISIBLE_DEVICES

all

NV_CUDA_CUDART_DEV_VERSION

12.8.90-1

NV_CUDA_CUDART_VERSION

12.8.90-1

NV_CUDA_LIB_VERSION

12.8.1-1

NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE

cuda-nsight-compute-12-8=12.8.1-1

NV_CUDA_NSIGHT_COMPUTE_VERSION

12.8.1-1

NV_LIBCUBLAS_DEV_PACKAGE

libcublas-dev-12-8=12.8.4.1-1

NV_LIBCUBLAS_DEV_PACKAGE_NAME

libcublas-dev-12-8

NV_LIBCUBLAS_DEV_VERSION

12.8.4.1-1

NV_LIBCUBLAS_PACKAGE

libcublas-12-8=12.8.4.1-1

NV_LIBCUBLAS_PACKAGE_NAME

libcublas-12-8

NV_LIBCUBLAS_VERSION

12.8.4.1-1

NV_LIBCUSPARSE_DEV_VERSION

12.5.8.93-1

NV_LIBCUSPARSE_VERSION

12.5.8.93-1

NV_LIBNCCL_DEV_PACKAGE

libnccl-dev=2.25.1-1+cuda12.8

NV_LIBNCCL_DEV_PACKAGE_NAME

libnccl-dev

NV_LIBNCCL_DEV_PACKAGE_VERSION

2.25.1-1

NV_LIBNCCL_PACKAGE

libnccl2=2.25.1-1+cuda12.8

NV_LIBNCCL_PACKAGE_NAME

libnccl2

NV_LIBNCCL_PACKAGE_VERSION

2.25.1-1

NV_LIBNPP_DEV_PACKAGE

libnpp-dev-12-8=12.3.3.100-1

NV_LIBNPP_DEV_VERSION

12.3.3.100-1

NV_LIBNPP_PACKAGE

libnpp-12-8=12.3.3.100-1

NV_LIBNPP_VERSION

12.3.3.100-1

NV_NVML_DEV_VERSION

12.8.90-1

NV_NVPROF_DEV_PACKAGE

cuda-nvprof-12-8=12.8.90-1

NV_NVPROF_VERSION

12.8.90-1

NV_NVTX_VERSION

12.8.90-1

PATH

/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

PYTHON_EXECUTION_BACKEND

uv

TIKTOKEN_CACHE_DIR

/tiktoken_cache

UV_HTTP_TIMEOUT

500

UV_INDEX_STRATEGY

unsafe-best-match

VLLM_ATTENTION_BACKEND

TRITON_ATTN_VLLM_V1

VLLM_USAGE_SOURCE

production-docker-image


Layers

[#000] sha256:8f84a9f2102e97a4a6bf673b150fc9894df5acc9618ad3484c6c36f768c1caa0 - 0.17% (29 MB)

[#001] sha256:b95112eaf2836b9c7193858419f6d17933a873c4a2c9227dc497f5e090ea9c87 - 0.03% (4.42 MB)

[#002] sha256:030ef82509363afebdc78482e6f8c07f2bc8b65a45caf082c2a9a621c7deae63 - 0.36% (61.3 MB)

[#003] sha256:72ac9ccfda38d144ef8e3aadbd5851e7fa9aacd261f8e15d7365db0f816d3433 - 0.0% (186 Bytes)

[#004] sha256:73389fbd088f5ed5d9fd258baced59de092978b4f483920ea6d074522a105119 - 0.0% (6.72 KB)

[#005] sha256:0264850675f7464ed6385d030d281ffb0f2037323c73511a5372948c1c69d92c - 11.62% (1.92 GB)

[#006] sha256:de1d03310308c2871217cf179589d5e7fcd8eee31d8f331b61041347f50404a0 - 0.0% (62.6 KB)

[#007] sha256:c1d2af7fad0f1c6cdaf09c568c086019e834bc6523c30aa9b2b0b24c4b782086 - 0.0% (1.64 KB)

[#008] sha256:5601308b3ac642f7df8b1dc62b9582abdd34857eec6190bcb50162abc5719226 - 0.0% (1.49 KB)

[#009] sha256:6b2035e8b73ed2b018995a7b2c8d607d5527daf948d41964f02cc3ce7ed0699a - 16.87% (2.78 GB)

[#010] sha256:ed71f8f81b33b96e7112757f6828a6dcb0861026aa63c5edc672d13e11045f6d - 0.0% (86.8 KB)

[#011] sha256:ae8e0ca9a3b398fba06d5f6b82a9c0d7a82c6aa13f51d4a8ce36a9b634c8803c - 0.0% (104 Bytes)

[#012] sha256:dd1de8147c9526d7113acab63e5e5b2c1aa1fba6ccbb0bb7f035031cb71ad3ed - 0.0% (230 Bytes)

[#013] sha256:0ec7e06d28f4003e10926c3e5e1b8528b9570e17a5a3cce95391862be7749f97 - 1.7% (288 MB)

[#014] sha256:3991ad70924c78b270b42b9ada9a8bcad5b6d8941a312416b38005cf33627724 - 0.19% (31.9 MB)

[#015] sha256:c02a399570135e8face5b05ef40799dc2e1d30baa80ce5fce9d19688ebc89e8f - 0.22% (37.6 MB)

[#016] sha256:40ba384cef6ccf65e2ee6a6b68da628805c698bdf521df2265e1b1f828806db5 - 0.0% (12.8 KB)

[#017] sha256:8e46657044706f6ce782fea091848ba645f2c3bd0c0f1b30664a74a56375c9b1 - 37.1% (6.12 GB)

[#018] sha256:88268b66a2256bf95a8f28e939ac626620d3e5274d18344751a47c5b901e3a18 - 31.72% (5.23 GB)

[#019] sha256:943b7d8b6c677c588984bf135c7b352f10426d4d148b120607c2ce2a0f89fa73 - 0.0% (104 Bytes)

[#020] sha256:3321dbe153ce451120963376f2229513bc84ddcdc0dccc3c9321499da33f4ade - 0.01% (1.64 MB)

[#021] sha256:c86ecc563b2976be7b605b999c798301b065c172ff213930c441271025792831 - 0.0% (767 KB)

[#022] sha256:9bb007225627b24ab46b40b1e10c525d816a4a419164acc999c3a1e05e790f9b - 0.0% (99 Bytes)

[#023] sha256:5ba1d81b53622e56d1081da688a565eb9215c7f0a8f9093676ddb2e5629e1f32 - 0.0% (610 Bytes)

[#024] sha256:4f000add097c3625f7db62f9c487b97763ed2680b2bf035e22565327c1dac920 - 0.0% (609 Bytes)


History
2025-01-26 05:31:07 UTC

/bin/sh -c #(nop) ARG RELEASE

2025-01-26 05:31:07 UTC

/bin/sh -c #(nop) ARG LAUNCHPAD_BUILD_ARCH

2025-01-26 05:31:07 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.ref.name=ubuntu

2025-01-26 05:31:07 UTC

/bin/sh -c #(nop) LABEL org.opencontainers.image.version=22.04

2025-01-26 05:31:10 UTC

/bin/sh -c #(nop) ADD file:1b6c8c9518be42fa2afe5e241ca31677fce58d27cdfa88baa91a65a259be3637 in /

2025-01-26 05:31:11 UTC

/bin/sh -c #(nop) CMD ["/bin/bash"]

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

ENV NVARCH=x86_64

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_REQUIRE_CUDA=cuda>=12.8 brand=unknown,driver>=470,driver<471 brand=grid,driver>=470,driver<471 brand=tesla,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=vapps,driver>=470,driver<471 brand=vpc,driver>=470,driver<471 brand=vcs,driver>=470,driver<471 brand=vws,driver>=470,driver<471 brand=cloudgaming,driver>=470,driver<471 brand=unknown,driver>=535,driver<536 brand=grid,driver>=535,driver<536 brand=tesla,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=vapps,driver>=535,driver<536 brand=vpc,driver>=535,driver<536 brand=vcs,driver>=535,driver<536 brand=vws,driver>=535,driver<536 brand=cloudgaming,driver>=535,driver<536 brand=unknown,driver>=550,driver<551 brand=grid,driver>=550,driver<551 brand=tesla,driver>=550,driver<551 brand=nvidia,driver>=550,driver<551 brand=quadro,driver>=550,driver<551 brand=quadrortx,driver>=550,driver<551 brand=nvidiartx,driver>=550,driver<551 brand=vapps,driver>=550,driver<551 brand=vpc,driver>=550,driver<551 brand=vcs,driver>=550,driver<551 brand=vws,driver>=550,driver<551 brand=cloudgaming,driver>=550,driver<551 brand=unknown,driver>=560,driver<561 brand=grid,driver>=560,driver<561 brand=tesla,driver>=560,driver<561 brand=nvidia,driver>=560,driver<561 brand=quadro,driver>=560,driver<561 brand=quadrortx,driver>=560,driver<561 brand=nvidiartx,driver>=560,driver<561 brand=vapps,driver>=560,driver<561 brand=vpc,driver>=560,driver<561 brand=vcs,driver>=560,driver<561 brand=vws,driver>=560,driver<561 brand=cloudgaming,driver>=560,driver<561 brand=unknown,driver>=565,driver<566 brand=grid,driver>=565,driver<566 brand=tesla,driver>=565,driver<566 brand=nvidia,driver>=565,driver<566 brand=quadro,driver>=565,driver<566 brand=quadrortx,driver>=565,driver<566 
brand=nvidiartx,driver>=565,driver<566 brand=vapps,driver>=565,driver<566 brand=vpc,driver>=565,driver<566 brand=vcs,driver>=565,driver<566 brand=vws,driver>=565,driver<566 brand=cloudgaming,driver>=565,driver<566

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_CUDART_VERSION=12.8.90-1

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.1-1_all.deb && dpkg -i cuda-keyring_1.1-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit

2025-03-10 22:19:05 UTC (buildkit.dockerfile.v0)

ENV CUDA_VERSION=12.8.1

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-8=${NV_CUDA_CUDART_VERSION} cuda-compat-12-8 && rm -rf /var/lib/apt/lists/* # buildkit

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/cuda/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

ENV PATH=/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

ENV LD_LIBRARY_PATH=/usr/local/cuda/lib64

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

COPY NGC-DL-CONTAINER-LICENSE / # buildkit

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_VISIBLE_DEVICES=all

2025-03-10 22:19:20 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_LIB_VERSION=12.8.1-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_NVTX_VERSION=12.8.90-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_VERSION=12.3.3.100-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_PACKAGE=libnpp-12-8=12.3.3.100-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUSPARSE_VERSION=12.5.8.93-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_PACKAGE_NAME=libcublas-12-8

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_VERSION=12.8.4.1-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_PACKAGE=libcublas-12-8=12.8.4.1-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_PACKAGE_NAME=libnccl2

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_PACKAGE_VERSION=2.25.1-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NCCL_VERSION=2.25.1-1

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_PACKAGE=libnccl2=2.25.1-1+cuda12.8

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-libraries-12-8=${NV_CUDA_LIB_VERSION} ${NV_LIBNPP_PACKAGE} cuda-nvtx-12-8=${NV_NVTX_VERSION} libcusparse-12-8=${NV_LIBCUSPARSE_VERSION} ${NV_LIBCUBLAS_PACKAGE} ${NV_LIBNCCL_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_PACKAGE_NAME} ${NV_LIBNCCL_PACKAGE_NAME} # buildkit

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

COPY entrypoint.d/ /opt/nvidia/entrypoint.d/ # buildkit

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

COPY nvidia_entrypoint.sh /opt/nvidia/ # buildkit

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENV NVIDIA_PRODUCT_NAME=CUDA

2025-03-10 22:24:31 UTC (buildkit.dockerfile.v0)

ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"]

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_LIB_VERSION=12.8.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_CUDART_DEV_VERSION=12.8.90-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_NVML_DEV_VERSION=12.8.90-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUSPARSE_DEV_VERSION=12.5.8.93-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_DEV_VERSION=12.3.3.100-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNPP_DEV_PACKAGE=libnpp-dev-12-8=12.3.3.100-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_DEV_VERSION=12.8.4.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_DEV_PACKAGE_NAME=libcublas-dev-12-8

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBCUBLAS_DEV_PACKAGE=libcublas-dev-12-8=12.8.4.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_NSIGHT_COMPUTE_VERSION=12.8.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE=cuda-nsight-compute-12-8=12.8.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_NVPROF_VERSION=12.8.90-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_NVPROF_DEV_PACKAGE=cuda-nvprof-12-8=12.8.90-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_DEV_PACKAGE_NAME=libnccl-dev

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_DEV_PACKAGE_VERSION=2.25.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NCCL_VERSION=2.25.1-1

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV NV_LIBNCCL_DEV_PACKAGE=libnccl-dev=2.25.1-1+cuda12.8

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ARG TARGETARCH

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

LABEL maintainer=NVIDIA CORPORATION <cudatools@nvidia.com>

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-dev-12-8=${NV_CUDA_CUDART_DEV_VERSION} cuda-command-line-tools-12-8=${NV_CUDA_LIB_VERSION} cuda-minimal-build-12-8=${NV_CUDA_LIB_VERSION} cuda-libraries-dev-12-8=${NV_CUDA_LIB_VERSION} cuda-nvml-dev-12-8=${NV_NVML_DEV_VERSION} ${NV_NVPROF_DEV_PACKAGE} ${NV_LIBNPP_DEV_PACKAGE} libcusparse-dev-12-8=${NV_LIBCUSPARSE_DEV_VERSION} ${NV_LIBCUBLAS_DEV_PACKAGE} ${NV_LIBNCCL_DEV_PACKAGE} ${NV_CUDA_NSIGHT_COMPUTE_DEV_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

RUN |1 TARGETARCH=amd64 /bin/sh -c apt-mark hold ${NV_LIBCUBLAS_DEV_PACKAGE_NAME} ${NV_LIBNCCL_DEV_PACKAGE_NAME} # buildkit

2025-03-10 22:36:52 UTC (buildkit.dockerfile.v0)

ENV LIBRARY_PATH=/usr/local/cuda/lib64/stubs

2025-08-08 15:14:04 -0700 (buildkit.dockerfile.v0)

WORKDIR /vllm-workspace

2025-08-08 15:14:05 -0700 (buildkit.dockerfile.v0)

ENV DEBIAN_FRONTEND=noninteractive

2025-08-08 15:14:05 -0700 (buildkit.dockerfile.v0)

SHELL ["/bin/bash", "-c"]

2025-08-08 15:14:05 -0700 (buildkit.dockerfile.v0)

RUN /bin/bash -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION:-3.12} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit

2025-08-08 15:15:24 -0700 (buildkit.dockerfile.v0)

RUN /bin/bash -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y ccache software-properties-common git curl wget sudo vim python3-pip && apt-get install -y ffmpeg libsm6 libxext6 libgl1 # buildkit

2025-08-08 15:16:42 -0700 (buildkit.dockerfile.v0)

RUN /bin/bash -c add-apt-repository -y ppa:deadsnakes/ppa && apt-get update -y && apt-get install -y python3.12 python3.12-dev python3.12-venv libibverbs-dev && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.12 1 && update-alternatives --set python3 /usr/bin/python3.12 && ln -sf /usr/bin/python3.12-config /usr/bin/python3-config && curl -sS "https://bootstrap.pypa.io/get-pip.py" | python3.12 && python3 --version && python3 -m pip --version # buildkit

2025-08-08 15:17:07 -0700 (buildkit.dockerfile.v0)

RUN /bin/bash -c python3 -m pip install uv # buildkit

2025-08-08 15:17:07 -0700 (buildkit.dockerfile.v0)

ENV UV_HTTP_TIMEOUT=500

2025-08-08 15:17:07 -0700 (buildkit.dockerfile.v0)

ENV UV_INDEX_STRATEGY=unsafe-best-match

2025-08-08 15:17:08 -0700 (buildkit.dockerfile.v0)

RUN /bin/bash -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit

2025-08-08 15:52:19 -0700 (buildkit.dockerfile.v0)

COPY . . # buildkit

2025-08-08 15:52:49 -0700 (buildkit.dockerfile.v0)

RUN /bin/bash -c . /etc/environment && uv pip install --system *.whl torch==2.9.0.dev20250804 --extra-index-url https://download.pytorch.org/whl/nightly/cu128 --index-strategy unsafe-best-match && uv pip uninstall --system torch-triton && uv pip install --system accelerate hf_transfer modelscope "bitsandbytes" 'timm==0.9.10' boto3 runai-model-streamer runai-model-streamer[s3] && uv pip list # buildkit

2025-08-08 15:52:49 -0700 (buildkit.dockerfile.v0)

ENV VLLM_USAGE_SOURCE=production-docker-image

2025-08-08 15:52:49 -0700 (buildkit.dockerfile.v0)

ENV PYTHON_EXECUTION_BACKEND=uv

2025-08-08 15:52:49 -0700 (buildkit.dockerfile.v0)

ENTRYPOINT ["python3", "-m", "vllm.entrypoints.openai.api_server"]

2025-08-23 02:36:00 UTC (buildkit.dockerfile.v0)

LABEL org.opencontainers.image.title=vLLM GPT-OSS Server for Ada GPUs

2025-08-23 02:36:00 UTC (buildkit.dockerfile.v0)

LABEL org.opencontainers.image.description=vLLM server optimized for OpenAI GPT-OSS models on Ada Lovelace GPUs

2025-08-23 02:36:00 UTC (buildkit.dockerfile.v0)

LABEL org.opencontainers.image.version=v655

2025-08-23 02:36:00 UTC (buildkit.dockerfile.v0)

LABEL org.opencontainers.image.vendor=gptbasesparticle

2025-08-23 02:36:00 UTC (buildkit.dockerfile.v0)

LABEL org.opencontainers.image.authors=sparticle

2025-08-23 02:36:00 UTC (buildkit.dockerfile.v0)

RUN /bin/bash -c mkdir -p /tiktoken_cache # buildkit

2025-08-23 02:36:45 UTC (buildkit.dockerfile.v0)

COPY tiktoken_files/o200k_base.tiktoken /tiktoken_cache/ # buildkit

2025-08-23 02:36:45 UTC (buildkit.dockerfile.v0)

COPY tiktoken_files/cl100k_base.tiktoken /tiktoken_cache/ # buildkit

2025-08-23 02:36:45 UTC (buildkit.dockerfile.v0)

ENV VLLM_ATTENTION_BACKEND=TRITON_ATTN_VLLM_V1

2025-08-23 02:36:45 UTC (buildkit.dockerfile.v0)

ENV TIKTOKEN_CACHE_DIR=/tiktoken_cache

2025-08-23 02:36:45 UTC (buildkit.dockerfile.v0)

ENV VLLM_USAGE_SOURCE=production-docker-image

2025-08-23 02:36:45 UTC (buildkit.dockerfile.v0)

ENV HF_HUB_ENABLE_HF_TRANSFER=1

2025-08-23 02:36:45 UTC (buildkit.dockerfile.v0)

ENV CUDA_VISIBLE_DEVICES=all

2025-08-23 02:36:45 UTC (buildkit.dockerfile.v0)

WORKDIR /workspace

2025-08-23 02:36:45 UTC (buildkit.dockerfile.v0)

RUN /bin/bash -c cat > /start.sh << 'EOF'
#!/bin/bash
# vLLM GPT-OSS startup script.
#
# Usage: /start.sh <model-path> [additional-args]
#   <model-path>       passed to the API server as --model
#   [additional-args]  appended after the default arguments, so they can
#                      add to or repeat the defaults below

# Require a model path as the first argument.
if [ -z "$1" ]; then
    echo "Usage: /start.sh <model-path> [additional-args]"
    echo "Example: /start.sh /model --port 8000"
    exit 1
fi

MODEL_PATH="$1"
shift  # drop the first argument; whatever remains is forwarded as extra arguments

# Default arguments. Kept in an array so each option stays a separate word
# without relying on unquoted word splitting.
DEFAULT_ARGS=(--host 0.0.0.0 --port 8000 --trust-remote-code)

# Start the vLLM server.
echo "Starting vLLM with model: $MODEL_PATH"
echo "Environment:"
echo " VLLM_ATTENTION_BACKEND=$VLLM_ATTENTION_BACKEND"
echo " TIKTOKEN_CACHE_DIR=$TIKTOKEN_CACHE_DIR"
# NOTE(review): the image sets CUDA_VISIBLE_DEVICES=all; CUDA documents this
# variable as a list of device indices/UUIDs ("all" is the NVIDIA_VISIBLE_DEVICES
# convention) - confirm GPUs are actually visible with this value.
echo " CUDA_VISIBLE_DEVICES=$CUDA_VISIBLE_DEVICES"
echo ""

# Quote every expansion so model paths and forwarded arguments containing
# spaces or glob characters reach the server unchanged.
exec python3 -m vllm.entrypoints.openai.api_server \
    --model "$MODEL_PATH" \
    "${DEFAULT_ARGS[@]}" \
    "$@"
EOF
# buildkit

2025-08-23 02:36:46 UTC (buildkit.dockerfile.v0)

RUN /bin/bash -c chmod +x /start.sh # buildkit

2025-08-23 02:36:46 UTC (buildkit.dockerfile.v0)

HEALTHCHECK --interval=30s --timeout=10s --start-period=2m0s --start-interval=0s --retries=3 CMD curl -f http://localhost:8000/health || exit 1

2025-08-23 02:36:46 UTC (buildkit.dockerfile.v0)

ENTRYPOINT ["/start.sh"]

2025-08-23 02:36:46 UTC (buildkit.dockerfile.v0)

CMD ["/model"]

Danger Zone
Delete Tag

Please be careful: this deletes not just the tag reference but also the actual image content!

For example, if latest and v1.2.3 both point to the same image,
deleting latest will also permanently remove v1.2.3.

Delete