Update Dockerfile
Dockerfile  +34 -14
CHANGED
@@ -1,19 +1,39 @@
-# Use
-FROM

-#
-
-python3 \
-python3-pip

-#
-

-#
-RUN

-#
-

-#
-
+# Use a base image with Python and necessary tools
+FROM python:3.10-slim

+# Set environment variables for non-interactive installations
+ENV DEBIAN_FRONTEND=noninteractive

+# Update and install system dependencies
+RUN apt-get update -y && \
+    apt-get install -y --no-install-recommends \
+    gcc-12 g++-12 libnuma-dev libtcmalloc-minimal4 && \
+    apt-get clean && \
+    rm -rf /var/lib/apt/lists/*

+# Configure gcc and g++ alternatives
+RUN update-alternatives --install /usr/bin/gcc gcc /usr/bin/gcc-12 10 --slave /usr/bin/g++ g++ /usr/bin/g++-12

+# Upgrade pip and install Python dependencies
+RUN pip install --upgrade pip && \
+    pip install "cmake>=3.26" wheel packaging ninja "setuptools-scm>=8" numpy && \
+    pip install vllm && \
+    pip install --upgrade numba scipy "huggingface-hub[cli]" && \
+    pip install "numpy<2" && \
+    pip uninstall torch -y && \
+    pip install --no-cache-dir --pre torch==2.6.0.dev20241122 --index-url https://download.pytorch.org/whl/nightly/rocm6.2

+# Find the dynamic link library path and set LD_PRELOAD
+RUN LD_PATH=$(find / -name "*libtcmalloc*.so.4" 2>/dev/null | head -n 1) && \
+    echo "export LD_PRELOAD=$LD_PATH:\$LD_PRELOAD" >> /etc/profile && \
+    export LD_PRELOAD=$LD_PATH:$LD_PRELOAD
+
+# Set additional environment variables
+ENV VLLM_CPU_KVCACHE_SPACE=40
+ENV VLLM_CPU_OMP_THREADS_BIND=0-29
+
+# Expose the port for the model server
+EXPOSE 8007
+
+# Command to run the model server
+CMD ["vllm", "serve", "--device", "cpu", "--port", "8007", "Hjgugugjhuhjggg/mergekit-ties-tzamfyy", "--max-model-len", "100"]
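A minimal sketch of building and running this image locally with the Docker CLI, assuming Docker is installed; the tag vllm-cpu-space is a placeholder, and on Hugging Face Spaces the build and launch happen automatically:

docker build -t vllm-cpu-space .
docker run -p 8007:8007 vllm-cpu-space

The exposed port matches the --port 8007 passed to vllm serve, so the OpenAI-compatible API should be reachable at http://localhost:8007 once the model has finished loading.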