# text-generation-webui/docker/Dockerfile

# Stage "builder": CUDA devel image in which the GPTQ-for-LLaMa wheel is compiled.
FROM nvidia/cuda:12.1.0-devel-ubuntu22.04 AS builder

# Toolchain for cloning the sources and compiling the CUDA extension.
# No interactive editor is installed: no build step in this stage uses one.
# The apt package cache lives in a BuildKit cache mount; the package lists are
# removed in the same layer so they do not end up in the image.
RUN --mount=type=cache,target=/var/cache/apt,sharing=locked,rw apt-get update && \
    apt-get install --no-install-recommends -y \
        build-essential \
        git \
        python3-dev \
        python3-venv && \
    rm -rf /var/lib/apt/lists/*

# All remaining steps of this stage run from /build (WORKDIR creates it).
WORKDIR /build

# Shallow clone: only the most recent commit of GPTQ-for-LLaMa is fetched.
RUN git clone --depth=1 https://github.com/oobabooga/GPTQ-for-LLaMa /build

# Build-time virtualenv holding the packaging tools, the CUDA 12.1 PyTorch
# wheels and the project's own requirements. pip downloads are kept in a
# BuildKit cache mount rather than in the layer.
RUN --mount=type=cache,target=/root/.cache/pip,rw \
    python3 -m venv /build/venv \
    && . /build/venv/bin/activate \
    && pip3 install --upgrade pip setuptools wheel ninja \
    && pip3 install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121 \
    && pip3 install -r requirements.txt

# https://developer.nvidia.com/cuda-gpus
# for a rtx 2060: ARG TORCH_CUDA_ARCH_LIST="7.5"
#
# Compute capabilities the CUDA kernels are compiled for. Override with
#   --build-arg TORCH_CUDA_ARCH_LIST="<list>"
# The value is exposed to the RUN below as an environment variable
# (presumably consumed by PyTorch's extension build invoked from setup_cuda.py).
# The default starts at 5.0: the CUDA 12 toolkit shipped in this base image no
# longer supports Kepler (3.5) targets, so listing 3.5 breaks the default build.
ARG TORCH_CUDA_ARCH_LIST="5.0;6.0;6.1;7.0;7.5;8.0;8.6+PTX"

# Compile the extension and drop the resulting wheel into /build itself.
RUN . /build/venv/bin/activate && \
    python3 setup_cuda.py bdist_wheel -d .

# Final stage: CUDA runtime image that the web UI is installed into.
FROM nvidia/cuda:12.1.0-runtime-ubuntu22.04

LABEL maintainer="Your Name <your.email@example.com>" \
      description="Docker image for GPTQ-for-LLaMa and Text Generation WebUI"

# System packages: Python with headers and pip, a C/C++ toolchain (make, g++),
# git, the audio libraries and ffmpeg. The package lists are deleted in the
# same layer.
RUN --mount=type=cache,target=/var/cache/apt,sharing=locked,rw \
    apt-get update \
    && apt-get install --no-install-recommends -y \
        ffmpeg \
        g++ \
        git \
        libasound-dev \
        libportaudio2 \
        make \
        python3 \
        python3-dev \
        python3-pip \
    && rm -rf /var/lib/apt/lists/*

# virtualenv goes into the system Python; it is used later to create /app/venv.
RUN --mount=type=cache,target=/root/.cache/pip,rw \
    pip3 install virtualenv

# Application root. WORKDIR creates /app when it does not exist yet, so no
# separate mkdir step is required.
WORKDIR /app

# Optional git revision for the web UI sources.
ARG WEBUI_VERSION
# When WEBUI_VERSION is non-empty, try to hard-reset the checkout in /app to it;
# if it is empty or the reset fails, print a notice and carry on (the step
# never fails the build).
# NOTE(review): nothing has been copied or cloned into /app at this point of
# the stage, so the reset appears to have no repository to act on and
# WEBUI_VERSION looks like a no-op here - confirm the intended behaviour.
RUN if test -n "${WEBUI_VERSION}" && git reset --hard ${WEBUI_VERSION}; then \
        :; \
    else \
        echo "Using provided webui source"; \
    fi

# Create virtualenv
# /app/venv is created and seeded in a single step: packaging tools first,
# then torch from the CUDA 12.1 wheel index, then the remaining packages from
# the default index.
RUN --mount=type=cache,target=/root/.cache/pip,rw \
    virtualenv /app/venv \
    && . /app/venv/bin/activate \
    && pip3 install --upgrade pip setuptools wheel ninja \
    && pip3 install torch --index-url https://download.pytorch.org/whl/cu121 \
    && pip3 install torchvision torchaudio sentence_transformers xformers

# Copy and install GPTQ-for-LLaMa
# The builder's /build tree contains the sources, the compiled wheel and
# /build/venv, the throwaway virtualenv (with its own torch install) that was
# only needed to compile the wheel. A plain COPY of /build would bake that
# venv into a runtime layer, so the stage is bind-mounted read-only instead and
# every top-level entry except `venv` is copied into place before the wheel is
# installed into /app/venv.
RUN --mount=type=bind,from=builder,source=/build,target=/mnt/gptq \
    --mount=type=cache,target=/root/.cache/pip,rw \
    mkdir -p /app/repositories/GPTQ-for-LLaMa && \
    find /mnt/gptq -mindepth 1 -maxdepth 1 ! -name venv \
        -exec cp -a {} /app/repositories/GPTQ-for-LLaMa/ \; && \
    . /app/venv/bin/activate && \
    pip3 install /app/repositories/GPTQ-for-LLaMa/*.whl

# Install main requirements
# Only requirements.txt is copied before the install, so this layer stays
# cached until that file changes, no matter what else changes in the sources.
COPY requirements.txt /app/requirements.txt
RUN --mount=type=cache,target=/root/.cache/pip,rw \
    . /app/venv/bin/activate \
    && pip3 install -r requirements.txt

# Bring the rest of the build context into /app.
COPY . /app/

# Overwrite bitsandbytes' CPU library with a copy of its CUDA 12.1 build.
# NOTE(review): presumably a workaround so the CUDA binary is used even when
# bitsandbytes picks the CPU library name - confirm it is still needed.
# The path is tied to Python 3.10.
RUN BNB_DIR=/app/venv/lib/python3.10/site-packages/bitsandbytes && \
    cp "${BNB_DIR}/libbitsandbytes_cuda121.so" "${BNB_DIR}/libbitsandbytes_cpu.so"

# Install extension requirements
# Visit each extension directory that ships a requirements.txt and install it
# from inside that directory. The loop body is joined with `;`, so a failing
# install does not stop the loop: only the exit status of the last iteration
# decides whether this step succeeds.
RUN --mount=type=cache,target=/root/.cache/pip,rw \
    . /app/venv/bin/activate && \
    for req_file in /app/extensions/*/requirements.txt; do \
        cd "${req_file%/*}"; \
        pip3 install -r requirements.txt; \
    done

# Extra command-line flags appended to server.py at container start; empty by
# default and meant to be overridden at run time.
ENV CLI_ARGS=""

# Declare the port build arguments so that --build-arg can actually change the
# EXPOSE metadata. Without these declarations the variables are always unset
# and only the defaults apply; the defaults themselves are unchanged.
ARG CONTAINER_PORT
ARG CONTAINER_API_PORT
ARG CONTAINER_API_STREAM_PORT
EXPOSE ${CONTAINER_PORT:-7860} ${CONTAINER_API_PORT:-5000} ${CONTAINER_API_STREAM_PORT:-5005}

# Shell form is kept so that ${CLI_ARGS} is expanded and word-split at start-up.
# `exec` makes python3 replace the wrapper shell, so the server itself is the
# container's main process and is the one that receives signals sent to the
# container.
CMD . /app/venv/bin/activate && exec python3 server.py ${CLI_ARGS}
Add flash-attention 2 for windows (#4235) 2023-10-21 02:46:23 -04:00			`FROM nvidia/cuda:12.1.0-devel-ubuntu22.04 as builder`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00
improve docker builds (#3715) 2023-09-11 11:22:00 -04:00			`RUN --mount=type=cache,target=/var/cache/apt,sharing=locked,rw apt-get update && \`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00			`apt-get install --no-install-recommends -y git vim build-essential python3-dev python3-venv && \`
			`rm -rf /var/lib/apt/lists/*`

improve docker builds (#3715) 2023-09-11 11:22:00 -04:00			`RUN git clone --depth=1 https://github.com/oobabooga/GPTQ-for-LLaMa /build`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00
			`WORKDIR /build`

improve docker builds (#3715) 2023-09-11 11:22:00 -04:00			`RUN --mount=type=cache,target=/root/.cache/pip,rw \`
			`python3 -m venv /build/venv && \`
			`. /build/venv/bin/activate && \`
Fix for using Torch with CUDA 11.8 (#4298) 2023-10-15 18:27:19 -04:00			`pip3 install --upgrade pip setuptools wheel ninja && \`
Docker: Remove explicit CUDA 11.8 Reference (#4343) 2023-10-21 14:09:34 -04:00			`pip3 install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121 && \`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00			`pip3 install -r requirements.txt`

			`# https://developer.nvidia.com/cuda-gpus`
			`# for a rtx 2060: ARG TORCH_CUDA_ARCH_LIST="7.5"`
Make dockerfile respect specified cuda version (#3474) 2023-08-07 09:19:16 -04:00			`ARG TORCH_CUDA_ARCH_LIST="${TORCH_CUDA_ARCH_LIST:-3.5;5.0;6.0;6.1;7.0;7.5;8.0;8.6+PTX}"`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00			`RUN . /build/venv/bin/activate && \`
			`python3 setup_cuda.py bdist_wheel -d .`

Add flash-attention 2 for windows (#4235) 2023-10-21 02:46:23 -04:00			`FROM nvidia/cuda:12.1.0-runtime-ubuntu22.04`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00
			`LABEL maintainer="Your Name <your.email@example.com>"`
			`LABEL description="Docker image for GPTQ-for-LLaMa and Text Generation WebUI"`

improve docker builds (#3715) 2023-09-11 11:22:00 -04:00			`RUN --mount=type=cache,target=/var/cache/apt,sharing=locked,rw apt-get update && \`
Add ffmpeg to the Docker image (#3664) 2023-08-27 11:29:00 -04:00			`apt-get install --no-install-recommends -y python3-dev libportaudio2 libasound-dev git python3 python3-pip make g++ ffmpeg && \`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00			`rm -rf /var/lib/apt/lists/*`

improve docker builds (#3715) 2023-09-11 11:22:00 -04:00			`RUN --mount=type=cache,target=/root/.cache/pip,rw pip3 install virtualenv`
Fix for using Torch with CUDA 11.8 (#4298) 2023-10-15 18:27:19 -04:00
Tweak COPY order in Dockerfile (#863) 2023-04-06 23:56:44 -04:00			`RUN mkdir /app`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00
			`WORKDIR /app`

			`ARG WEBUI_VERSION`
			`RUN test -n "${WEBUI_VERSION}" && git reset --hard ${WEBUI_VERSION} \|\| echo "Using provided webui source"`

improve docker builds (#3715) 2023-09-11 11:22:00 -04:00			`# Create virtualenv`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00			`RUN virtualenv /app/venv`
improve docker builds (#3715) 2023-09-11 11:22:00 -04:00			`RUN --mount=type=cache,target=/root/.cache/pip,rw \`
			`. /app/venv/bin/activate && \`
Fix for using Torch with CUDA 11.8 (#4298) 2023-10-15 18:27:19 -04:00			`pip3 install --upgrade pip setuptools wheel ninja && \`
Docker: Remove explicit CUDA 11.8 Reference (#4343) 2023-10-21 14:09:34 -04:00			`pip3 install torch --index-url https://download.pytorch.org/whl/cu121 && \`
Fix for using Torch with CUDA 11.8 (#4298) 2023-10-15 18:27:19 -04:00			`pip3 install torchvision torchaudio sentence_transformers xformers`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00
improve docker builds (#3715) 2023-09-11 11:22:00 -04:00			`# Copy and install GPTQ-for-LLaMa`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00			`COPY --from=builder /build /app/repositories/GPTQ-for-LLaMa`
improve docker builds (#3715) 2023-09-11 11:22:00 -04:00			`RUN --mount=type=cache,target=/root/.cache/pip,rw \`
			`. /app/venv/bin/activate && \`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00			`pip3 install /app/repositories/GPTQ-for-LLaMa/*.whl`

improve docker builds (#3715) 2023-09-11 11:22:00 -04:00			`# Install main requirements`
Tweak COPY order in Dockerfile (#863) 2023-04-06 23:56:44 -04:00			`COPY requirements.txt /app/requirements.txt`
improve docker builds (#3715) 2023-09-11 11:22:00 -04:00			`RUN --mount=type=cache,target=/root/.cache/pip,rw \`
			`. /app/venv/bin/activate && \`
Tweak COPY order in Dockerfile (#863) 2023-04-06 23:56:44 -04:00			`pip3 install -r requirements.txt`

improve docker builds (#3715) 2023-09-11 11:22:00 -04:00			`COPY . /app/`

Docker: Remove explicit CUDA 11.8 Reference (#4343) 2023-10-21 14:09:34 -04:00			`RUN cp /app/venv/lib/python3.10/site-packages/bitsandbytes/libbitsandbytes_cuda121.so /app/venv/lib/python3.10/site-packages/bitsandbytes/libbitsandbytes_cpu.so`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00
improve docker builds (#3715) 2023-09-11 11:22:00 -04:00			`# Install extension requirements`
			`RUN --mount=type=cache,target=/root/.cache/pip,rw \`
			`. /app/venv/bin/activate && \`
			`for ext in /app/extensions/*/requirements.txt; do \`
			`cd "$(dirname "$ext")"; \`
			`pip3 install -r requirements.txt; \`
			`done`

Tweak COPY order in Dockerfile (#863) 2023-04-06 23:56:44 -04:00			`ENV CLI_ARGS=""`
improve docker builds (#3715) 2023-09-11 11:22:00 -04:00
			`EXPOSE ${CONTAINER_PORT:-7860} ${CONTAINER_API_PORT:-5000} ${CONTAINER_API_STREAM_PORT:-5005}`
creating a layer with Docker/docker-compose (#633) 2023-04-06 21:46:04 -04:00			`CMD . /app/venv/bin/activate && python3 server.py ${CLI_ARGS}`