Spaces:
Running
Running
Update Dockerfile
Browse files- Dockerfile +2 -7
Dockerfile
CHANGED
@@ -3,11 +3,7 @@ FROM nvidia/cuda:12.5.1-cudnn-devel-ubuntu20.04
|
|
3 |
|
4 |
# Set environment variables for non-interactive installation and timezone
|
5 |
ENV DEBIAN_FRONTEND=noninteractive \
|
6 |
-
TZ=Europe/Paris
|
7 |
-
VLLM_CPU_KVCACHE_SPACE=40 \
|
8 |
-
VLLM_CPU_OMP_THREADS_BIND=29 \
|
9 |
-
OMP_NUM_THREADS=4 \
|
10 |
-
MKL_NUM_THREADS=4
|
11 |
|
12 |
# Remove third-party apt sources to avoid issues with expiring keys
|
13 |
# Install basic utilities
|
@@ -90,9 +86,8 @@ RUN pip install --upgrade pip && \
|
|
90 |
RUN pip install vllm && \
|
91 |
pip install huggingface-hub[cli]
|
92 |
|
93 |
-
|
94 |
# Expose port for the model server
|
95 |
-
EXPOSE
|
96 |
|
97 |
# Set the working directory to /app and set the model directory
|
98 |
WORKDIR $HOME/app
|
|
|
3 |
|
4 |
# Set environment variables for non-interactive installation and timezone
|
5 |
ENV DEBIAN_FRONTEND=noninteractive \
|
6 |
+
TZ=Europe/Paris
|
|
|
|
|
|
|
|
|
7 |
|
8 |
# Remove third-party apt sources to avoid issues with expiring keys
|
9 |
# Install basic utilities
|
|
|
86 |
RUN pip install vllm && \
|
87 |
pip install huggingface-hub[cli]
|
88 |
|
|
|
89 |
# Expose port for the model server
|
90 |
+
EXPOSE 8007
|
91 |
|
92 |
# Set the working directory to /app and set the model directory
|
93 |
WORKDIR $HOME/app
|