Henk717 committed on
Commit
1708639
·
verified ·
1 Parent(s): 7c47ec5

Upgrade to the upstream fixes

Browse files
Files changed (1) hide show
  1. Dockerfile +12 -7
Dockerfile CHANGED
@@ -1,13 +1,18 @@
1
- FROM nvidia/cuda:11.8.0-devel-ubuntu22.04
2
  ARG MODEL
 
 
 
3
  ARG MODEL_NAME
4
  ARG ADDITIONAL
5
  RUN mkdir /opt/koboldcpp
6
- RUN apt update && apt install git build-essential libopenblas-dev wget python3-pip -y
7
- RUN git clone https://github.com/lostruins/koboldcpp /opt/koboldcpp
8
  WORKDIR /opt/koboldcpp
9
  COPY default.json /opt/koboldcpp/default.json
10
- RUN make LLAMA_OPENBLAS=1 LLAMA_CUBLAS=1 LLAMA_PORTABLE=1
11
- RUN wget -O model.ggml $MODEL
12
- CMD /bin/python3 ./koboldcpp.py --model model.ggml $ADDITIONAL --port 7860 --hordeconfig $MODEL_NAME 1 1 --preloadstory default.json
13
-
 
 
 
 
# KoboldCpp server image: downloads the prebuilt CUDA 12 KoboldCpp binary plus
# any models named by build arguments, then serves on port 7860.
FROM nvidia/cuda:12.1.1-devel-ubuntu22.04

# Download URLs for the optional model files fetched below. Each may be left
# unset; the matching download is best-effort.
ARG MODEL
ARG IMGMODEL
ARG WHISPERMODEL
ARG MMPROJ

# NOTE: MODEL_NAME and ADDITIONAL are expanded by the shell-form CMD when the
# container starts. Build ARGs are not persisted into the image environment,
# so both must also be supplied as runtime environment variables.
ARG MODEL_NAME
ARG ADDITIONAL

# curl is the only tool the build needs. ca-certificates is listed explicitly
# because --no-install-recommends would otherwise not guarantee it for HTTPS.
# Update, install and list cleanup share one layer to avoid a stale apt cache
# and to keep the package lists out of the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        ca-certificates \
        curl \
    && rm -rf /var/lib/apt/lists/*

# WORKDIR creates the directory if it is missing, so no separate mkdir is needed.
WORKDIR /opt/koboldcpp
COPY default.json /opt/koboldcpp/default.json

# Use lowercase -o <file> to choose the output name. Uppercase -O takes no
# argument, so "curl -fLO koboldcpp <url>" would treat "koboldcpp" as another
# URL and never save the binary under that name.
RUN curl -fLo koboldcpp https://koboldai.org/cpplinuxcu12 \
    && chmod +x ./koboldcpp

# Optional model downloads. "|| true" keeps the build going when a URL is unset
# or unreachable; the CMD below passes --ignoremissing, presumably so KoboldCpp
# skips model files that are absent (confirm against the KoboldCpp docs).
RUN curl -fLo model.ggml "$MODEL" || true
RUN curl -fLo imgmodel.ggml "$IMGMODEL" || true
RUN curl -fLo mmproj.ggml "$MMPROJ" || true
RUN curl -fLo whispermodel.ggml "$WHISPERMODEL" || true

# Shell form is intentional: $ADDITIONAL must be word-split into separate flags
# and $MODEL_NAME expanded when the container starts.
CMD ./koboldcpp --model model.ggml --whispermodel whispermodel.ggml --sdmodel imgmodel.ggml --sdthreads 4 --sdquant --sdclamped --mmproj mmproj.ggml $ADDITIONAL --port 7860 --hordemodelname $MODEL_NAME --hordemaxctx 1 --hordegenlen 1 --preloadstory default.json --ignoremissing