server_cpp / Dockerfile
CreativeWorks's picture
Create Dockerfile
6202702 verified
raw
history blame contribute delete
633 Bytes
# Builds the llama.cpp HTTP server from source, downloads the
# CreativeWorks Llama-3-8B-BR-8K Q4_K_M GGUF model, and serves it on port 7860.
FROM python:3.9-slim-bookworm

# Branch or tag of llama.cpp to build. Defaults to master (what a plain
# `git clone` fetched before).
# NOTE(review): the chosen ref must still provide the `server` make target;
# pin this to a known-good tag for reproducible builds.
ARG LLAMA_CPP_REF=master

# Toolchain and download tools. update + install share one layer so the package
# index is never stale, and the apt lists are removed in that same layer so
# they do not end up in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        curl \
        gcc \
        git \
        make \
    && rm -rf /var/lib/apt/lists/*

# Unprivileged user that owns the build tree. This replaces the former
# `chmod -R 777 /llama.cpp`, which rewrote every file (including the multi-GB
# model) into a second layer and left the tree world-writable.
# NOTE(review): uid 1000 is chosen on the assumption that this image targets
# Hugging Face Docker Spaces (port 7860) — adjust if deploying elsewhere.
RUN useradd --create-home --uid 1000 user \
    && install -d -o user -g user /llama.cpp
USER user
WORKDIR /llama.cpp

# Shallow clone: only the selected ref is needed to build.
RUN git clone --depth 1 --branch "${LLAMA_CPP_REF}" https://github.com/ggerganov/llama.cpp .

# Build only the server target. No `-i`: a compile error must fail the image
# build instead of producing an image without a binary. Parallelism is bounded
# to the number of available CPUs rather than an unlimited `-j`.
RUN make -j"$(nproc)" server

# Fetch the model weights. --fail makes an HTTP error abort the build instead
# of saving the error page as the .gguf file.
RUN curl --fail --location --create-dirs \
        --output models/CreativeWorks_Llama-3-8B-BR-8Kunsloth.Q4_K_M.gguf \
        "https://huggingface.co/CreativeWorks/CreativeWorks_Llama-3-8B-BR-8K/resolve/main/CreativeWorks_Llama-3-8B-BR-8Kunsloth.Q4_K_M.gguf?download=true"

EXPOSE 7860

# Exec form so the server runs as PID 1 and receives SIGTERM from `docker stop`.
CMD ["./server", "--host", "0.0.0.0", "--port", "7860", "-t", "3", "-m", "./models/CreativeWorks_Llama-3-8B-BR-8Kunsloth.Q4_K_M.gguf", "--parallel", "2"]