# MidnightMiquHost / Dockerfile
# Henk717's picture
# GPU Edition
# 9a38c06
# raw
# history blame
# 503 Bytes
# Builds koboldcpp with OpenBLAS + cuBLAS support, downloads a model at build
# time, and serves it on port 7860.
#
# Required build argument:
#   MODEL  URL of the model file to download (saved as model.ggml).

# The packages below are installed with apt and use Debian/Ubuntu names, so the
# base must be an Ubuntu flavour of the CUDA devel image (the UBI8 flavour has
# no apt).
FROM nvidia/cuda:11.0.3-devel-ubuntu20.04

# Toolchain and runtime dependencies. DEBIAN_FRONTEND is set inline so package
# configuration prompts cannot stall an unattended build and the setting does
# not leak into the runtime environment. The apt lists are removed in the same
# layer to keep it small.
RUN apt-get update \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y \
        build-essential \
        git \
        libopenblas-dev \
        python3-pip \
        wget \
    && rm -rf /var/lib/apt/lists/*

# git clone creates the target directory itself; no separate mkdir is needed.
RUN git clone https://github.com/lostruins/koboldcpp /opt/koboldcpp
WORKDIR /opt/koboldcpp

# Compile with both the OpenBLAS and cuBLAS backends enabled.
RUN make LLAMA_OPENBLAS=1 LLAMA_CUBLAS=1

# MODEL has to be declared as a build argument to be visible inside RUN;
# without the declaration it expands to an empty string. Fail early with a
# clear message when it is missing instead of letting wget fail obscurely.
ARG MODEL
RUN test -n "$MODEL" || { echo "MODEL build argument is required" >&2; exit 1; } \
    && wget -O model.ggml "$MODEL"

# Documents the port passed to koboldcpp via --port below.
EXPOSE 7860

# python3 is resolved through PATH rather than a hard-coded /bin location.
CMD ["python3", "./koboldcpp.py", "--model", "model.ggml", "--usecublas", "mmq", "--multiuser", "--contextsize", "4096", "--port", "7860", "--hordeconfig", "HF_SPACE_Tiefighter", "1", "1"]