# Builds the llama.cpp HTTP server from source, downloads the
# Meta-Llama-3-8B-Instruct Q4_K_M GGUF weights into the image, and serves
# them on port 7860.
FROM python:3.9-slim-bookworm

# Branch or tag of llama.cpp to build (passed to `git clone --branch`, so a raw
# commit SHA will not work). Defaults to upstream's default branch.
# NOTE(review): this recipe relies on the Makefile `server` target and a
# resulting ./server binary; confirm that both still exist at the chosen ref
# and pin a known-good tag via --build-arg LLAMA_CPP_REF=<tag> if they do not.
ARG LLAMA_CPP_REF=master

# Package installation and the build need root; privileges are dropped below.
USER root

# Toolchain and download tools. update + install share one layer so the
# package index can never be stale, and the index is removed in that same
# layer so it does not end up in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        curl \
        gcc \
        git \
        make \
    && rm -rf /var/lib/apt/lists/*

# Shallow clone: only the working tree at the requested ref is needed to build.
RUN git clone --depth 1 --branch "${LLAMA_CPP_REF}" \
        https://github.com/ggerganov/llama.cpp /llama.cpp

WORKDIR /llama.cpp

# Parallelism is bounded by the CPU count, and compile errors abort the image
# build instead of being ignored and surfacing later as a missing binary.
RUN make -j"$(nproc)" server

# Unprivileged runtime account that owns the tree. Ownership is handed over
# BEFORE the multi-gigabyte model is downloaded so that the weights are written
# once, by their final owner, instead of being rewritten into a second layer
# by a recursive permission change.
RUN useradd --uid 1000 --no-create-home --home-dir /llama.cpp \
        --shell /usr/sbin/nologin llama \
    && mkdir -p /llama.cpp/models \
    && chown -R llama:llama /llama.cpp

USER llama

WORKDIR /llama.cpp/models

# --fail turns an HTTP error into a build failure rather than saving the error
# page under the model's filename.
RUN curl --fail --location --retry 3 \
        "https://huggingface.co/NousResearch/Meta-Llama-3-8B-Instruct-GGUF/resolve/main/Meta-Llama-3-8B-Instruct-Q4_K_M.gguf?download=true" \
        --output Meta-Llama-3-8B-Instruct-Q4_K_M.gguf

WORKDIR /llama.cpp

# Documentation of the listening port; must match --port in CMD.
EXPOSE 7860

# Exec form: the server runs as PID 1 and receives stop signals directly.
# The relative model path is resolved against WORKDIR (/llama.cpp).
CMD ["/llama.cpp/server", "--host", "0.0.0.0", "--port", "7860", "-t", "3", "-m", "./models/Meta-Llama-3-8B-Instruct-Q4_K_M.gguf"]