matthoffner committed on
Commit
2c4789e
·
verified ·
1 Parent(s): 526c573

Update Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +2 -4
Dockerfile CHANGED
@@ -1,5 +1,4 @@
1
- # Base image
2
- FROM nvidia/cuda:11.8.0-devel-ubuntu22.04
3
 
4
  ENV DEBIAN_FRONTEND=noninteractive
5
 
@@ -7,7 +6,6 @@ ENV DEBIAN_FRONTEND=noninteractive
7
  RUN apt update && \
8
  apt install --no-install-recommends -y \
9
  build-essential \
10
- nvidia-cuda-toolkit \
11
  python3 \
12
  python3-pip \
13
  wget \
@@ -55,4 +53,4 @@ WORKDIR $HOME/app
55
  EXPOSE 8080
56
 
57
  # Start the llava-server with models
58
- CMD ["/app/llama.cpp/server", "--model", "ggml-model-q4_k.gguf", "--mmproj", "mmproj-model-f16.gguf", "--host", "0.0.0.0", "--threads", "4", "-ngl", "30", "-ts", "100,0"]
 
1
+ FROM nvidia/cuda:12.2.0-devel-ubuntu22.04
 
2
 
3
  ENV DEBIAN_FRONTEND=noninteractive
4
 
 
6
  RUN apt update && \
7
  apt install --no-install-recommends -y \
8
  build-essential \
 
9
  python3 \
10
  python3-pip \
11
  wget \
 
53
  EXPOSE 8080
54
 
55
  # Start the llava-server with models
56
+ CMD ["/app/llama.cpp/server", "--model", "ggml-model-q4_k.gguf", "--mmproj", "mmproj-model-f16.gguf", "--host", "0.0.0.0", "--threads", "10"]