update batch size arg in run.sh

This commit is contained in:
James Ravenscroft 2023-05-08 14:24:49 +01:00
parent ed3b40d643
commit 78c989076f
3 changed files with 5 additions and 1 deletion

View File

@@ -22,6 +22,8 @@ ENV THREADS=4
ENV MODEL="/models/codegen-2B-multi-ggml-4bit-quant.bin"
ENV BATCHSIZE=64
COPY ./run.sh /app/
EXPOSE 18080

View File

@@ -22,6 +22,8 @@ ENV THREADS=4
ENV MODEL="/models/codegen-2B-multi-ggml-4bit-quant.bin"
ENV BATCHSIZE=8
COPY ./run.sh /app/
EXPOSE 18080

2
run.sh
View File

@@ -1,3 +1,3 @@
 #!/bin/sh
-/app/codegen-serve -t $THREADS -m $MODEL
+/app/codegen-serve -t $THREADS -m $MODEL -b $BATCHSIZE