matthoffner committed on
Commit
857e31a
·
verified ·
1 Parent(s): 1f7d2e2

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +7 -18
Dockerfile CHANGED
@@ -1,30 +1,19 @@
1
  FROM ghcr.io/ggerganov/llama.cpp:full
2
 
3
- ENV DEBIAN_FRONTEND=noninteractive
 
4
 
5
- # Update and install necessary dependencies
6
- RUN apt update && \
7
- apt install --no-install-recommends -y \
8
- build-essential \
9
- python3 \
10
- python3-pip \
11
- wget \
12
- curl \
13
- git \
14
- cmake \
15
- zlib1g-dev \
16
- libblas-dev && \
17
- apt clean && \
18
- rm -rf /var/lib/apt/lists/*
19
 
20
  WORKDIR /app
21
 
22
- RUN wget https://huggingface.co/matthoffner/Magicoder-S-DS-6.7B-GGUF/resolve/main/Magicoder-S-DS-6.7B_Q4_K_M.gguf
 
23
 
24
  RUN make
25
 
26
  # Expose the port
27
  EXPOSE 8080
28
 
29
- # Start the llava-server with models
30
- CMD ["--server", "--model", "Magicoder-S-DS-6.7B_Q4_K_M.gguf", "--threads", "6", "--host", "0.0.0.0", "-ngl", "33"]
 
# Image that downloads a GGUF model at build time and starts the llama.cpp
# server on port 8080.
#
# Build arguments (override with --build-arg):
#   MODEL_URL   Base URL of the directory that hosts the model file.
#   MODEL_NAME  File name of the GGUF model to fetch from MODEL_URL.
#
# NOTE(review): ":full" is a moving tag; pin a digest for reproducible builds.
FROM ghcr.io/ggerganov/llama.cpp:full

# Build-time only: declared as ARG so it is visible to RUN steps without
# leaking into the environment of the running container.
ARG DEBIAN_FRONTEND=noninteractive

WORKDIR /app

# Build before fetching the model: the two steps are independent, so switching
# models via --build-arg no longer invalidates the cached build layer.
# NOTE(review): presumably the base image already ships the llama.cpp sources
# (and possibly a finished build) in /app — confirm this step is still needed.
RUN make

# Declared late so that changing them only invalidates the download layer.
ARG MODEL_URL=https://huggingface.co/Nan-Do/Truthful_DPO_TomGrc_FusionNet_7Bx2_MoE_13B-GGUF/resolve/main
ARG MODEL_NAME=Truthful_DPO_TomGrc_FusionNet_7Bx2_MoE_13B-Q4_0.gguf

# Download the model under its original file name and add a fixed-name symlink
# next to it. ARG values do not exist at container runtime and exec-form CMD
# performs no variable expansion, so CMD needs a path that is known statically.
# NOTE(review): assumes wget is available in the base image — confirm.
RUN wget "${MODEL_URL}/${MODEL_NAME}" \
    && ln -s "${MODEL_NAME}" /app/model.gguf

# Expose the port (documentation only; publish it with -p at run time)
EXPOSE 8080

# Default arguments; the leading "--server" is presumably consumed by the base
# image's ENTRYPOINT — verify against the base image. The model is referenced
# through the stable symlink because "${MODEL_NAME}" would be passed literally.
CMD ["--server", "--model", "/app/model.gguf", "--threads", "10", "--host", "0.0.0.0"]