Spaces:

matthoffner
/

ggml-mllm

Paused

matthoffner committed on Feb 2, 2024

Commit

2c4789e

verified ·

1 Parent(s): 526c573

Update Dockerfile

Files changed (1) hide show

Dockerfile CHANGED Viewed

@@ -1,5 +1,4 @@
-# Base image
-FROM nvidia/cuda:11.8.0-devel-ubuntu22.04
 ENV DEBIAN_FRONTEND=noninteractive
@@ -7,7 +6,6 @@ ENV DEBIAN_FRONTEND=noninteractive
 RUN apt update && \
     apt install --no-install-recommends -y \
         build-essential \
-        nvidia-cuda-toolkit \
         python3 \
         python3-pip \
         wget \
@@ -55,4 +53,4 @@ WORKDIR $HOME/app
 EXPOSE 8080
 # Start the llava-server with models
-CMD ["/app/llama.cpp/server", "--model", "ggml-model-q4_k.gguf", "--mmproj", "mmproj-model-f16.gguf", "--host", "0.0.0.0", "--threads", "4", "-ngl", "30", "-ts", "100,0"]

+FROM nvidia/cuda:12.2.0-devel-ubuntu22.04
 ENV DEBIAN_FRONTEND=noninteractive
 RUN apt update && \
     apt install --no-install-recommends -y \
         build-essential \
         python3 \
         python3-pip \
         wget \
 EXPOSE 8080
 # Start the llava-server with models
+CMD ["/app/llama.cpp/server", "--model", "ggml-model-q4_k.gguf", "--mmproj", "mmproj-model-f16.gguf", "--host", "0.0.0.0", "--threads", "10"]