goliath-120b-GGUF

Paused

gfjiogopdfgdfs committed on Jan 31

Commit

592d153

•

1 Parent(s): e8787df

Update Dockerfile

Files changed (1) hide show

Dockerfile CHANGED Viewed

@@ -1,5 +1,19 @@
-FROM nvidia/cuda:12.1.1-devel-ubuntu22.04
-RUN apt update && apt install git python3-pip -y
-ARG ENGINE_ARGS
-RUN pip3 install aphrodite-engine
-CMD /bin/python3 -m aphrodite.endpoints.kobold.api_server $ENGINE_ARGS --port 7860

+# Builds koboldcpp from source on a CUDA 11.8 devel base and bakes a two-part
+# GGUF model into the image, then serves it on port 7860.
+#
+# Build args:
+#   MODEL_PART_A, MODEL_PART_B  URLs of the two halves of the model file;
+#                               they are concatenated (A then B) into model.gguf.
+#   MODEL_NAME                  value passed to koboldcpp's --hordeconfig.
+#   ADDITIONAL                  extra koboldcpp.py flags (word-split by the shell).
+FROM nvidia/cuda:11.8.0-devel-ubuntu22.04
+
+# Install every OS package in a single layer (the package set is unchanged) and
+# drop the apt lists in that same layer so they do not persist in the image.
+RUN apt-get update \
+    && apt-get install -y \
+        build-essential \
+        git \
+        libopenblas-dev \
+        python3-pip \
+        wget \
+    && rm -rf /var/lib/apt/lists/*
+
+# git clone creates the target directory itself; a shallow clone is enough
+# because only the working tree is needed for the build.
+RUN git clone --depth 1 https://github.com/lostruins/koboldcpp /opt/koboldcpp
+WORKDIR /opt/koboldcpp
+RUN make LLAMA_OPENBLAS=1 LLAMA_CUBLAS=1 LLAMA_PORTABLE=1
+
+# Copied after the build so editing default.json does not force a recompile.
+COPY default.json /opt/koboldcpp/default.json
+
+# The model args are declared only now: every RUN after an ARG implicitly
+# depends on its value, so declaring them earlier would rebuild koboldcpp
+# whenever a model URL changes.
+ARG MODEL_PART_A
+ARG MODEL_PART_B
+# Download and join both halves in ONE layer. Part B is streamed straight onto
+# the end of part A, so no temporary part files are ever written to a layer
+# (deleting them in a later RUN would not shrink the image). URLs are quoted so
+# characters such as '?' or '&' are not interpreted by the shell.
+RUN : "${MODEL_PART_A:?MODEL_PART_A build arg is required}" \
+      "${MODEL_PART_B:?MODEL_PART_B build arg is required}" \
+    && wget -O model.gguf "$MODEL_PART_A" \
+    && wget -O - "$MODEL_PART_B" >> model.gguf
+
+# ARG values exist only at build time, but CMD expands these two at container
+# start. Persist them as ENV defaults; a runtime environment variable with the
+# same name still overrides them.
+ARG MODEL_NAME
+ARG ADDITIONAL
+ENV MODEL_NAME="${MODEL_NAME}" \
+    ADDITIONAL="${ADDITIONAL}"
+
+# Documentation only: the server listens on 7860 (see --port below).
+EXPOSE 7860
+
+# Exec form with an explicit shell: the shell is still needed to expand and
+# word-split $ADDITIONAL / $MODEL_NAME, and `exec` replaces it with python so
+# the server runs as PID 1 and receives SIGTERM from `docker stop`.
+CMD ["/bin/sh", "-c", "exec /bin/python3 ./koboldcpp.py --model model.gguf $ADDITIONAL --port 7860 --hordeconfig $MODEL_NAME 1 1 --preloadstory default.json"]