Create Dockerfile
Browse files- Dockerfile +13 -0
Dockerfile
ADDED
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# Base image: the llama.cpp server image tagged `server-cuda`.
# NOTE(review): this tag carries no version or digest, so rebuilds may pick up
# a different upstream image — consider pinning once a known-good build is found.
FROM ghcr.io/ggerganov/llama.cpp:server-cuda
|
2 |
+
|
3 |
+
# Presumably the number of model layers to offload to the GPU; 9999 looks like
# an "offload everything" sentinel — confirm against the llama.cpp server docs.
ENV LLAMA_ARG_N_GPU_LAYERS=9999
|
4 |
+
# Context size passed to the server (presumably in tokens — TODO confirm).
# NOTE(review): may be shared across parallel slots rather than per slot.
ENV LLAMA_ARG_CTX_SIZE=10000
|
5 |
+
# Presumably enables flash attention in the server (1 = on) — confirm the
# accepted values for the llama.cpp version shipped in the base image.
ENV LLAMA_ARG_FLASH_ATTN=1
|
6 |
+
# Hugging Face repository the model is taken from (presumably downloaded by
# the server at startup, not at build time — verify).
ENV LLAMA_ARG_HF_REPO=AstroMLab/AstroSage-8B-GGUF
|
7 |
+
# GGUF file to use from the Hugging Face repository (a Q8_0 build, per the
# file name).
ENV LLAMA_ARG_HF_FILE=AstroSage-8B-Q8_0.gguf
|
8 |
+
# Presumably the number of requests the server handles in parallel — confirm
# against the llama.cpp server docs.
ENV LLAMA_ARG_N_PARALLEL=2
|
9 |
+
# Port the server is configured to listen on. EXPOSE does not publish the
# port; it records the container's port contract for operators and tooling.
ENV LLAMA_ARG_PORT=7860
EXPOSE 7860
|
10 |
+
# Bind address 0.0.0.0 (all interfaces) so the server is reachable from
# outside the container rather than only on loopback.
ENV LLAMA_ARG_HOST=0.0.0.0
|
11 |
+
|
12 |
+
# Ensure a non-root account named "user" with UID 1000 and a home directory.
# A plain `useradd -u 1000` aborts the build when the base image already ships
# an account with that UID, so reuse/rename that account instead of failing.
# The home directory is (re)asserted afterwards so the account always has a
# writable home (presumably needed for the server's model download cache).
RUN existing="$(id -nu 1000 2>/dev/null || true)" \
    && if [ -z "$existing" ]; then \
         useradd -m -u 1000 user; \
       elif [ "$existing" != "user" ]; then \
         usermod -l user -d /home/user -m "$existing"; \
       fi \
    && mkdir -p /home/user \
    && chown 1000 /home/user
|
13 |
+
# Drop root: everything from here on, including the container's main process,
# runs as the unprivileged "user" account.
USER user
|