File size: 552 Bytes
092a975 495083b 092a975 8ae6c69 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 |
# Image that serves a local GGUF model through llama.cpp's `llama-server`
# on port 7860.
FROM python:3.12

# Unprivileged account (UID 1000) that the server runs as; see USER below.
RUN useradd -m -u 1000 app
WORKDIR /home/app

# Refresh the package index and install in the SAME layer so a cached, stale
# index is never paired with a newer install step; drop the index afterwards
# so it does not persist in the image.
# NOTE(review): socat and clang are not referenced by any later instruction in
# this file; they are kept only to preserve the original package set.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        clang \
        cmake \
        g++ \
        git \
        make \
        socat \
        wget \
    && rm -rf /var/lib/apt/lists/*

# Download the model weights to /home/app/model.gguf.
# The URL is quoted because it contains `?`, which the shell would otherwise
# treat as a glob character. `--progress=dot:giga` keeps the build log short
# for a multi-gigabyte download.
RUN wget --progress=dot:giga -O model.gguf \
    "https://huggingface.co/neph1/llama-3.1-instruct-bellman-8b-swedish/resolve/main/gguf/llama-3.1-instruct-bellman-8b-swedish-Q8.gguf?download=true"

# Fetch and compile llama.cpp. The build tree is /home/app/build, so the server
# binary ends up at /home/app/build/bin/llama-server (the path CMD runs).
# A bare `cmake` invocation configures nothing, so both the configure step
# (-S/-B) and the build step (--build) are spelled out explicitly.
# NOTE(review): -DLLAMA_CURL=OFF is passed because libcurl headers are not
# installed here and the model is loaded from a local file; confirm the option
# is still meaningful for the llama.cpp revision being built (CMake only warns
# about unused variables).
RUN git clone --depth 1 https://github.com/ggerganov/llama.cpp \
    && cmake -S llama.cpp -B build -DCMAKE_BUILD_TYPE=Release -DLLAMA_CURL=OFF \
    && cmake --build build --config Release --target llama-server -j "$(nproc)"

# All root-only steps are done; run the server as the unprivileged user.
USER app

EXPOSE 7860

# Exec form without a wrapping shell: llama-server is PID 1 and receives
# SIGTERM from `docker stop` directly.
CMD ["/home/app/build/bin/llama-server", "-m", "/home/app/model.gguf", "-c", "8192", "--host", "0.0.0.0", "--port", "7860"]