File size: 569 Bytes
6fdf93a
 
 
 
7cadd44
6fdf93a
7cadd44
a8e13c6
7cadd44
3939046
8cdfd69
1dc1589
0630f9d
1
2
3
4
5
6
7
8
9
10
11
12
13
# Builds the llama.cpp HTTP server from source and serves the
# Phi-3-mini-4k-instruct (q4 GGUF) model on port 7860.
FROM python:3.9-slim-bookworm

# Upstream branch or tag to build (`git clone --branch` does not accept a bare
# commit SHA). Defaults to `master`, i.e. the same moving target as before.
# NOTE(review): newer upstream revisions may no longer provide a `server` make
# target -- confirm, and pass a known-good tag via
# `--build-arg LLAMA_CPP_REF=<tag>` for reproducible builds.
ARG LLAMA_CPP_REF=master

# Toolchain and fetch tools. `build-essential` already depends on gcc and make.
# `ca-certificates` is listed explicitly because recommended packages are
# skipped and both git and curl talk HTTPS. The apt lists are removed in the
# same layer so they never reach the image.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        curl \
        git \
    && rm -rf /var/lib/apt/lists/*

# Unprivileged user that owns the checkout. Building as this user replaces the
# former `chmod -R 777`, which was world-writable and rewrote every file
# (including the multi-GB model) into an extra layer.
RUN groupadd --gid 1000 llama \
    && useradd --uid 1000 --gid 1000 --create-home llama \
    && install -d -o 1000 -g 1000 /llama.cpp
USER 1000:1000

WORKDIR /llama.cpp
# Shallow clone into the pre-created, user-owned directory.
RUN git clone --depth 1 --branch "${LLAMA_CPP_REF}" https://github.com/ggerganov/llama.cpp .

# Bounded parallelism, and no `-i`: a failed compile must fail the image build
# instead of yielding an image whose CMD cannot start.
RUN make -j"$(nproc)" server

WORKDIR /llama.cpp/models
# `--fail` aborts on HTTP errors rather than saving an error page as the model.
RUN curl -fL "https://huggingface.co/microsoft/Phi-3-mini-4k-instruct-gguf/resolve/main/Phi-3-mini-4k-instruct-q4.gguf?download=true" --output Phi-3-mini-4k-instruct-q4.gguf

WORKDIR /llama.cpp
EXPOSE 7860

# Exec form so the server runs as PID 1 and receives SIGTERM from `docker stop`.
CMD ["./server", "--host", "0.0.0.0", "--port", "7860", "-t", "3", "-m", "./models/Phi-3-mini-4k-instruct-q4.gguf", "--parallel", "2"]