vllm (v0.6.3.post1)
Published 2024-10-21 05:19:37 +00:00 by ivampiresp
Installation
docker pull leafdev.top/packaged/vllm:v0.6.3.post1
sha256:76db50934cbaa4e7f78b2bea6b52e9f6d189ec51f3121dcac7afa404468d48f1
Image Layers
ARG RELEASE |
ARG LAUNCHPAD_BUILD_ARCH |
LABEL org.opencontainers.image.ref.name=ubuntu |
LABEL org.opencontainers.image.version=22.04 |
ADD file:3bd10da0673e2e72cb06a1f64a9df49a36341df39b0f762e3d1b38ee4de296fa in / |
CMD ["/bin/bash"] |
ENV NVARCH=x86_64 |
ENV NVIDIA_REQUIRE_CUDA=cuda>=12.4 brand=tesla,driver>=470,driver<471 brand=unknown,driver>=470,driver<471 brand=nvidia,driver>=470,driver<471 brand=nvidiartx,driver>=470,driver<471 brand=geforce,driver>=470,driver<471 brand=geforcertx,driver>=470,driver<471 brand=quadro,driver>=470,driver<471 brand=quadrortx,driver>=470,driver<471 brand=titan,driver>=470,driver<471 brand=titanrtx,driver>=470,driver<471 brand=tesla,driver>=525,driver<526 brand=unknown,driver>=525,driver<526 brand=nvidia,driver>=525,driver<526 brand=nvidiartx,driver>=525,driver<526 brand=geforce,driver>=525,driver<526 brand=geforcertx,driver>=525,driver<526 brand=quadro,driver>=525,driver<526 brand=quadrortx,driver>=525,driver<526 brand=titan,driver>=525,driver<526 brand=titanrtx,driver>=525,driver<526 brand=tesla,driver>=535,driver<536 brand=unknown,driver>=535,driver<536 brand=nvidia,driver>=535,driver<536 brand=nvidiartx,driver>=535,driver<536 brand=geforce,driver>=535,driver<536 brand=geforcertx,driver>=535,driver<536 brand=quadro,driver>=535,driver<536 brand=quadrortx,driver>=535,driver<536 brand=titan,driver>=535,driver<536 brand=titanrtx,driver>=535,driver<536 |
ENV NV_CUDA_CUDART_VERSION=12.4.127-1 |
ENV NV_CUDA_COMPAT_PACKAGE=cuda-compat-12-4 |
ARG TARGETARCH |
LABEL maintainer="NVIDIA CORPORATION <cudatools@nvidia.com>" |
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends gnupg2 curl ca-certificates && curl -fsSLO https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/${NVARCH}/cuda-keyring_1.1-1_all.deb && dpkg -i cuda-keyring_1.1-1_all.deb && apt-get purge --autoremove -y curl && rm -rf /var/lib/apt/lists/* # buildkit |
ENV CUDA_VERSION=12.4.1 |
RUN |1 TARGETARCH=amd64 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends cuda-cudart-12-4=${NV_CUDA_CUDART_VERSION} ${NV_CUDA_COMPAT_PACKAGE} && rm -rf /var/lib/apt/lists/* # buildkit |
RUN |1 TARGETARCH=amd64 /bin/sh -c echo "/usr/local/nvidia/lib" >> /etc/ld.so.conf.d/nvidia.conf && echo "/usr/local/nvidia/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit |
ENV PATH=/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin |
ENV LD_LIBRARY_PATH=/usr/local/nvidia/lib:/usr/local/nvidia/lib64 |
COPY NGC-DL-CONTAINER-LICENSE / # buildkit |
ENV NVIDIA_VISIBLE_DEVICES=all |
ENV NVIDIA_DRIVER_CAPABILITIES=compute,utility |
ARG CUDA_VERSION=12.4.1 |
ARG PYTHON_VERSION=3.12 |
WORKDIR /vllm-workspace |
ENV DEBIAN_FRONTEND=noninteractive |
RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.12 /bin/sh -c PYTHON_VERSION_STR=$(echo ${PYTHON_VERSION} | sed 's/\.//g') && echo "export PYTHON_VERSION_STR=${PYTHON_VERSION_STR}" >> /etc/environment # buildkit |
RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.12 /bin/sh -c echo 'tzdata tzdata/Areas select America' | debconf-set-selections && echo 'tzdata tzdata/Zones/America select Los_Angeles' | debconf-set-selections && apt-get update -y && apt-get install -y ccache software-properties-common git curl sudo vim python3-pip && apt-get install -y ffmpeg libsm6 libxext6 libgl1 && add-apt-repository ppa:deadsnakes/ppa && apt-get update -y && apt-get install -y python${PYTHON_VERSION} python${PYTHON_VERSION}-dev python${PYTHON_VERSION}-venv libibverbs-dev && update-alternatives --install /usr/bin/python3 python3 /usr/bin/python${PYTHON_VERSION} 1 && update-alternatives --set python3 /usr/bin/python${PYTHON_VERSION} && ln -sf /usr/bin/python${PYTHON_VERSION}-config /usr/bin/python3-config && curl -sS https://bootstrap.pypa.io/get-pip.py | python${PYTHON_VERSION} && python3 --version && python3 -m pip --version # buildkit |
RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.12 /bin/sh -c ldconfig /usr/local/cuda-$(echo $CUDA_VERSION | cut -d. -f1,2)/compat/ # buildkit |
RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.12 /bin/sh -c python3 -m pip install dist/*.whl --verbose # buildkit |
RUN |2 CUDA_VERSION=12.4.1 PYTHON_VERSION=3.12 /bin/sh -c . /etc/environment && python3 -m pip install https://github.com/flashinfer-ai/flashinfer/releases/download/v0.1.6/flashinfer-0.1.6+cu121torch2.4-cp${PYTHON_VERSION_STR}-cp${PYTHON_VERSION_STR}-linux_x86_64.whl # buildkit |
COPY examples examples # buildkit |
RUN /bin/sh -c pip install accelerate hf_transfer 'modelscope!=1.15.0' bitsandbytes>=0.44.0 timm==0.9.10 # buildkit |
ENV VLLM_USAGE_SOURCE=production-docker-image |
ENTRYPOINT ["python3", "-m", "vllm.entrypoints.openai.api_server"] |
Labels
Key | Value |
---|---|
maintainer | NVIDIA CORPORATION <cudatools@nvidia.com> |
org.opencontainers.image.ref.name | ubuntu |
org.opencontainers.image.version | 22.04 |
Details
2024-10-21 05:19:37 +00:00
Versions (2)
View all
Container
0
OCI / Docker
linux/amd64
5.1 GiB
v0.6.3.post1
2024-10-21
v0.6.3.post1-cpu
2024-10-21