You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
gpustack/Dockerfile

45 lines
1012 B

ARG CUDA_VERSION=12.4.1
ARG CUDA_TAG_SUFFIX=-cudnn-runtime-ubuntu22.04
FROM nvidia/cuda:${CUDA_VERSION}${CUDA_TAG_SUFFIX}
ARG TARGETPLATFORM
ENV DEBIAN_FRONTEND=noninteractive
RUN apt-get update && apt-get install -y \
git \
curl \
wget \
tzdata \
iproute2 \
python3 \
python3-pip \
python3-venv \
tini \
&& rm -rf /var/lib/apt/lists/*
COPY . /workspace/gpustack
RUN cd /workspace/gpustack && \
make build
ARG VLLM_VERSION=0.8.5.post1
RUN <<EOF
if [ "$TARGETPLATFORM" = "linux/amd64" ]; then
# Install vllm dependencies for x86_64
WHEEL_PACKAGE="$(ls /workspace/gpustack/dist/*.whl)[all]";
else
WHEEL_PACKAGE="$(ls /workspace/gpustack/dist/*.whl)[audio]";
fi
pip install pipx
pip install $WHEEL_PACKAGE
pip cache purge
rm -rf /workspace/gpustack
EOF
RUN gpustack download-tools
# Download dac weights used by audio models like Dia
RUN python3 -m dac download
ENTRYPOINT [ "tini", "--", "gpustack", "start" ]