# litellm / Dockerfile
# Author: zhengr - commit 3e7b48f ("Create Dockerfile")
# Dockerfile
#
# Builds an image on top of the LocalAI base image with the
# Mistral-7B-Instruct v0.2 (Q4_0 GGUF) weights downloaded into /app/models.

# Tag of the base image. The default stays "latest" so existing builds behave
# as before; for reproducible builds pin a release with
#   docker build --build-arg LOCALAI_TAG=<release tag> .
ARG LOCALAI_TAG=latest
FROM quay.io/go-skynet/local-ai:${LOCALAI_TAG}

# Relative paths below (models/...) resolve against /app.
WORKDIR /app

# Download the model weights at build time. Directory creation and download
# share one layer, and `mkdir -p` keeps the build from failing if the base
# image already provides /app/models.
RUN mkdir -p models \
    && wget -q "https://huggingface.co/TheBloke/Mistral-7B-Instruct-v0.2-GGUF/resolve/main/mistral-7b-instruct-v0.2.Q4_0.gguf" \
        -O models/mistral-7b-instruct-v0.2.Q4_0.gguf

# Add any files from the build context's models/ directory next to the
# downloaded weights (a file with the same name overwrites the download).
# NOTE(review): this relies on the build context containing models/ - confirm
# it is still needed now that the weights are fetched above.
COPY models/* models/

# Documents the service port; it does not publish it.
# NOTE(review): presumably the port the base image's server listens on - confirm.
EXPOSE 8080

# No executable is named here: these are default arguments handed to the
# ENTRYPOINT inherited from the base image, and can be overridden at
# `docker run`.
# NOTE(review): a context size of 4090 looks like it may be meant to be 4096 -
# confirm before changing.
CMD ["--models-path", "/app/models", "--context-size", "4090", "--threads", "4"]