Tijmen2 committed on
Commit
4984c66
·
verified ·
1 Parent(s): dd699aa

Create Dockerfile

Browse files
Files changed (1) hide show
  1. Dockerfile +13 -0
Dockerfile ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
# Serves the AstroSage-8B GGUF model with the llama.cpp HTTP server (CUDA build).
#
# NOTE(review): `server-cuda` is a floating tag; pin a specific release tag or
# an image digest once a known-good build is identified, so rebuilds are
# reproducible.
FROM ghcr.io/ggerganov/llama.cpp:server-cuda

# llama-server configuration. The LLAMA_ARG_* variables are read by the server
# as environment equivalents of its command-line options (see the llama.cpp
# server README for the authoritative list).
#   N_GPU_LAYERS - 9999 is presumably "more layers than the model has", i.e.
#                  offload everything to the GPU; confirm against the README.
#   HF_REPO/FILE - model repository and file to load.
#   PORT/HOST    - listen on every interface, port 7860.
ENV LLAMA_ARG_N_GPU_LAYERS=9999 \
    LLAMA_ARG_CTX_SIZE=10000 \
    LLAMA_ARG_FLASH_ATTN=1 \
    LLAMA_ARG_HF_REPO=AstroMLab/AstroSage-8B-GGUF \
    LLAMA_ARG_HF_FILE=AstroSage-8B-Q8_0.gguf \
    LLAMA_ARG_N_PARALLEL=2 \
    LLAMA_ARG_PORT=7860 \
    LLAMA_ARG_HOST=0.0.0.0

# Documentation only: records the port the server is configured to listen on.
EXPOSE 7860

# The server no longer listens on its default port, so any health probe
# inherited from the base image (upstream probes localhost:8080 - verify) would
# report the container as unhealthy. Probe the configured port instead.
# Assumes `curl` is available in the base image - TODO confirm.
# The long start period leaves room for the initial model load.
HEALTHCHECK --interval=30s --timeout=5s --start-period=10m --retries=3 \
    CMD ["curl", "-f", "http://localhost:7860/health"]

# Run as an unprivileged user with a fixed UID and a home directory (-m).
# NOTE(review): UID 1000 and port 7860 look chosen for Hugging Face Spaces -
# confirm before changing either.
RUN useradd -m -u 1000 user
USER user