File size: 923 Bytes
2c0eedc
e449931
1dbb897
1c97e32
1dbb897
a1992ae
015004d
a82a39b
 
 
 
8a48d19
541084a
a8a3c1a
 
 
1c97e32
 
a82a39b
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
# KoboldCpp server image, compiled from source on top of the CUDA 12.1 devel
# base. The server listens on port 7860.
#
# Build arguments (all optional):
#   MODEL         URL of the text model,          saved as model.ggml
#   IMGMODEL      URL of the image model,         saved as imgmodel.ggml
#   MMPROJ        URL of the multimodal projector, saved as mmproj.ggml
#   WHISPERMODEL  URL of the Whisper model,       saved as whispermodel.ggml
#   MODEL_NAME    value handed to --hordemodelname
#   ADDITIONAL    extra koboldcpp.py flags, appended verbatim to the command
#
# The ARG declarations live next to the steps that consume them: every RUN
# that follows an ARG implicitly depends on its value, so declaring them at the
# top would rebuild the apt and compile layers whenever a model URL changes.
FROM nvidia/cuda:12.1.1-devel-ubuntu22.04

# Toolchain, BLAS headers, Python and download tools. Recommended packages are
# kept on purpose so the installed set matches what plain `apt install` gave.
# The package lists are removed in the same layer so they never reach the image.
RUN apt-get update \
 && DEBIAN_FRONTEND=noninteractive apt-get install -y \
        build-essential \
        git \
        libopenblas-dev \
        python3-pip \
        wget \
 && rm -rf /var/lib/apt/lists/*

# git creates the target directory itself; history is not needed for the build.
RUN git clone --depth 1 https://github.com/lostruins/koboldcpp /opt/koboldcpp
WORKDIR /opt/koboldcpp
RUN make -j"$(nproc)" LLAMA_OPENBLAS=1 LLAMA_CUBLAS=1 LLAMA_PORTABLE=1 LLAMA_COLAB=1

# Copied after the compile so editing the story file does not force a rebuild.
COPY default.json /opt/koboldcpp/default.json

# Optional model downloads. Each one stays best-effort: an unset URL is skipped,
# and a failed download is reported and its partial file removed instead of
# leaving an empty/truncated file behind (presumably what --ignoremissing
# expects to be able to skip -- confirm against koboldcpp's handling).
ARG MODEL
RUN if [ -n "$MODEL" ]; then \
        wget -O model.ggml "$MODEL" \
        || { echo "warning: MODEL download failed" >&2; rm -f model.ggml; }; \
    fi
ARG IMGMODEL
RUN if [ -n "$IMGMODEL" ]; then \
        wget -O imgmodel.ggml "$IMGMODEL" \
        || { echo "warning: IMGMODEL download failed" >&2; rm -f imgmodel.ggml; }; \
    fi
ARG MMPROJ
RUN if [ -n "$MMPROJ" ]; then \
        wget -O mmproj.ggml "$MMPROJ" \
        || { echo "warning: MMPROJ download failed" >&2; rm -f mmproj.ggml; }; \
    fi
ARG WHISPERMODEL
RUN if [ -n "$WHISPERMODEL" ]; then \
        wget -O whispermodel.ggml "$WHISPERMODEL" \
        || { echo "warning: WHISPERMODEL download failed" >&2; rm -f whispermodel.ggml; }; \
    fi

# ARG values do not exist at container runtime, but the start command reads
# these two. Persist the build-time values as defaults; a runtime environment
# variable of the same name (e.g. `docker run -e`) still overrides them.
# NOTE(review): this stores ADDITIONAL in the image config -- do not pass
# secrets (API keys) through it at build time.
ARG MODEL_NAME
ARG ADDITIONAL
ENV MODEL_NAME="${MODEL_NAME}" \
    ADDITIONAL="${ADDITIONAL}"

EXPOSE 7860

# A shell is required to expand the variables; `exec` replaces it so Python
# runs as PID 1 and receives stop signals directly.
# $ADDITIONAL is intentionally unquoted so it splits into separate flags.
# "$MODEL_NAME" is quoted so an empty value is passed as an empty string
# rather than letting --hordemodelname consume the following flag.
CMD ["/bin/sh", "-c", "exec /bin/python3 ./koboldcpp.py --model model.ggml --whispermodel whispermodel.ggml --sdmodel imgmodel.ggml --sdthreads 4 --sdquant --sdclamped --mmproj mmproj.ggml $ADDITIONAL --port 7860 --hordemodelname \"$MODEL_NAME\" --hordemaxctx 1 --hordegenlen 1 --preloadstory default.json --ignoremissing"]