turbopilot/Dockerfile.cuda

31 lines
603 B
Docker
Raw Normal View History

2023-05-08 06:38:25 -04:00
# Build stage: compiles the turbopilot binary inside the CUDA development
# image. Nothing from this stage reaches the final image except what a later
# stage copies out of it explicitly.
FROM nvidia/cuda:11.7.1-devel-ubuntu22.04 AS build

# Toolchain and header packages used by the cmake/make steps below.
# DEBIAN_FRONTEND is set inline (not via ENV) so a package configuration
# prompt cannot stall the build and the setting does not persist in the image.
# The apt lists are removed in the same layer that downloaded them.
RUN apt-get update \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y \
        build-essential \
        cmake \
        libasio-dev \
        libboost-dev \
    && rm -rf /var/lib/apt/lists/*

# Plain local copy of the build context: COPY is the explicit instruction for
# this; ADD's extra behaviours (archive extraction, URL fetch) are not needed.
COPY ./ /turbopilot

# WORKDIR creates the directory when it is missing, so no separate mkdir is
# required, and the build no longer fails if the context already has build/.
WORKDIR /turbopilot/build

# Configure with GGML_CUBLAS=ON and point CMake at the nvcc compiler path
# under /usr/local/cuda, then build only the turbopilot target.
RUN cmake -DGGML_CUBLAS=ON -DCMAKE_CUDA_COMPILER=/usr/local/cuda/bin/nvcc ..
RUN make turbopilot
2023-04-10 03:51:48 -04:00
2023-05-08 06:38:25 -04:00
# Runtime stage: carries only the compiled binary and its launcher script on
# top of the CUDA runtime image.
FROM nvidia/cuda:11.7.1-cudnn8-runtime-ubuntu22.04 AS runtime

WORKDIR /app

# Binary produced by the build stage.
COPY --from=build /turbopilot/build/bin/turbopilot /app/turbopilot

# Default settings; override at run time with `docker run -e NAME=value`.
# NOTE(review): presumably read by run.sh, which is not visible here - confirm.
ENV THREADS=4 \
    MODEL="/models/codegen-2B-multi-ggml-4bit-quant.bin" \
    BATCHSIZE=64

COPY ./run.sh /app/

# Documentation only; publish the port with `docker run -p`.
EXPOSE 18080

# Exec (JSON) form. The script is still started through /bin/sh, exactly as the
# previous shell-form CMD did, but the explicit `exec` replaces that shell with
# the script so no wrapper process sits between the container runtime and it.
CMD ["/bin/sh", "-c", "exec /app/run.sh"]