# server.cpp / Dockerfile
# Last change: "Update Dockerfile" (commit 8cdfd69) by iAkashPaul
# Builds the llama.cpp HTTP server from source, downloads the Gemma 7B
# instruct model (Q4_0 GGUF) and serves it on port 8080.
FROM python:3.9-slim-bookworm

# Package installation and user creation need root; the image drops to an
# unprivileged user further down.
USER root

# Toolchain for compiling llama.cpp plus curl/git for fetching sources and the
# model. update + install + list cleanup share one layer so the package index
# is never stale and never shipped in the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        curl \
        gcc \
        git \
        make \
    && rm -rf /var/lib/apt/lists/*

# Dedicated unprivileged user with a stable numeric UID. It owns the build tree
# from the start, so no recursive chmod/chown is needed afterwards (a later
# `chmod -R` would copy the multi-GB model file into an extra layer).
# /.cache and /.config are created explicitly because the build must not
# depend on them already existing in the base image.
# NOTE(review): presumably the deployment target runs the container as an
# unprivileged user (the original made these paths world-writable) - confirm
# that UID 1000 matches it.
RUN useradd --create-home --uid 1000 user \
    && mkdir -p /.cache /.config /llama.cpp \
    && chown user:user /.cache /.config /llama.cpp

USER user

# Branch or tag of llama.cpp to build. Defaults to the tip of master; pass
# `--build-arg LLAMA_CPP_REF=<tag>` for a reproducible build.
# NOTE(review): this Dockerfile relies on the `make server` target and on the
# resulting `./server` binary - pin a ref that still provides both.
ARG LLAMA_CPP_REF=master

# Shallow clone: only the selected revision is needed to compile.
RUN git clone --depth 1 --branch "${LLAMA_CPP_REF}" \
        https://github.com/ggerganov/llama.cpp /llama.cpp

WORKDIR /llama.cpp

# No `-i`: a compile error must fail the image build instead of producing an
# image without the server binary. Parallelism is bounded by the CPU count.
RUN make -j"$(nproc)" server

# --fail makes an HTTP error abort the build rather than saving the error page
# as the model file.
RUN curl --fail --location --retry 3 --create-dirs \
        --output /llama.cpp/models/gemma-7b-it-Q4_0.gguf \
        "https://huggingface.co/iAkashPaul/gemma-7b-it-gguf/resolve/main/gemma-7b-it-Q4_0.gguf?download=true"

EXPOSE 8080

# Exec form: the server is the container's main process, receives stop signals
# directly, and the container exits when the server exits (no masking
# `sleep infinity`). --host 0.0.0.0 is required for the exposed port to be
# reachable from outside the container; llama.cpp's server listens on
# 127.0.0.1 unless told otherwise.
CMD ["./server", "-t", "4", "-m", "./models/gemma-7b-it-Q4_0.gguf", "--host", "0.0.0.0", "--port", "8080"]