# llama_2_api / Dockerfile
# Latest commit by amancod: "Update Dockerfile" (225b6ed, verified)
# Image that serves the ASGI app `main:app` with uvicorn on port 7860 and
# bundles a local GGUF model file next to the application code.
#
# NOTE(review): the full (non-slim) Python base is kept on purpose; packages in
# requirements.txt may need a compiler toolchain at install time — confirm
# before switching to a -slim variant.
FROM python:3.9

WORKDIR /code

# Create an unprivileged account so the server does not run as root, and give
# it ownership of the working directory in case the app writes there.
# NOTE(review): UID 1000 follows the Hugging Face Docker Spaces guidance —
# adjust if the deployment target expects a different UID.
RUN useradd --create-home --uid 1000 user \
    && chown user:user /code

# Copy the dependency manifest on its own so the install layer stays cached
# until requirements.txt changes.
COPY ./requirements.txt /code/requirements.txt
RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt

# Model file first, application code last: an edit to main.py then does not
# invalidate the layer holding the model.
COPY --chown=user:user ./llama-2-7b-chat.Q4_K_S.gguf /code/llama-2-7b-chat.Q4_K_S.gguf
COPY --chown=user:user ./main.py /code/main.py

# Drop root privileges for runtime; all root-only build steps are done.
USER user

# Documentation only: the port uvicorn binds to below.
EXPOSE 7860

# Exec form so uvicorn is PID 1 and receives stop signals directly.
CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]