Shawn732 commited on
Commit
8aa15e7
·
1 Parent(s): 6445214
Files changed (1) hide show
  1. Dockerfile +15 -28
Dockerfile CHANGED
@@ -1,17 +1,9 @@
1
- # Use an NVIDIA CUDA base image
2
- ARG CUDA_IMAGE="12.3.1-base-ubuntu22.04"
3
  FROM nvidia/cuda:${CUDA_IMAGE}
4
 
 
5
  ENV HOST 0.0.0.0
6
 
7
- # Set the working directory in the container to /app
8
- #WORKDIR /app
9
-
10
- RUN mkdir -p /app/cache && chmod -R 777 /app/cache
11
-
12
- ENV HF_HOME=/app/cache
13
-
14
- # Install Python and pip
15
  RUN apt-get update && apt-get upgrade -y \
16
  && apt-get install -y git build-essential \
17
  python3 python3-pip gcc wget \
@@ -19,28 +11,23 @@ RUN apt-get update && apt-get upgrade -y \
19
  libclblast-dev libopenblas-dev \
20
  && mkdir -p /etc/OpenCL/vendors && echo "libnvidia-opencl.so.1" > /etc/OpenCL/vendors/nvidia.icd
21
 
 
 
 
22
  ENV CUDA_DOCKER_ARCH=all
23
  ENV LLAMA_CUBLAS=1
24
 
25
- # Copy the current directory contents into the container at /app
26
- COPY . /app
 
 
27
 
28
- # Install required packages from requirements.txt
29
- COPY ./requirements.txt /app/requirements.txt
30
- RUN pip3 install --no-cache-dir -r /app/requirements.txt
31
-
32
- # Expose the ports for FastAPI and Streamlit
33
- EXPOSE 8000
34
- EXPOSE 8501
35
-
36
- # Copy and give execute permissions to the start script
37
- COPY start_server.sh /app/start_server.sh
38
- RUN chmod +x /app/start_server.sh
39
 
40
  RUN useradd -m -u 1000 user
41
  # Switch to the "user" user
42
  USER user
43
- WORKDIR /home/user/app
44
  # Set home to the user's home directory
45
  ENV HOME=/home/user \
46
  PATH=/home/user/.local/bin:$PATH \
@@ -52,9 +39,9 @@ ENV HOME=/home/user \
52
  GRADIO_THEME=huggingface \
53
  SYSTEM=spaces
54
 
 
 
55
  # Copy the current directory contents into the container at $HOME/app setting the owner to the user
56
- COPY --chown=user . /home/user/app
57
 
58
- # Run the start script
59
- #CMD ["/app/start_server.sh"]
60
- CMD ["uvicorn", "main:app", "--host", "0.0.0.0", "--port", "8000"]
 
1
+ ARG CUDA_IMAGE="12.1.1-devel-ubuntu22.04"
 
2
  FROM nvidia/cuda:${CUDA_IMAGE}
3
 
4
+ # We need to set the host to 0.0.0.0 to allow outside access
5
  ENV HOST 0.0.0.0
6
 
 
 
 
 
 
 
 
 
7
  RUN apt-get update && apt-get upgrade -y \
8
  && apt-get install -y git build-essential \
9
  python3 python3-pip gcc wget \
 
11
  libclblast-dev libopenblas-dev \
12
  && mkdir -p /etc/OpenCL/vendors && echo "libnvidia-opencl.so.1" > /etc/OpenCL/vendors/nvidia.icd
13
 
14
+ COPY . .
15
+
16
+ # setting build related env vars
17
  ENV CUDA_DOCKER_ARCH=all
18
  ENV LLAMA_CUBLAS=1
19
 
20
+ # Install depencencies
21
+ RUN python3 -m pip install --upgrade pip pytest cmake \
22
+ scikit-build setuptools fastapi uvicorn sse-starlette \
23
+ pydantic-settings starlette-context gradio huggingface_hub hf_transfer
24
 
25
+ # Install llama-cpp-python (build with cuda)
26
+ RUN CMAKE_ARGS="-DLLAMA_CUBLAS=on" pip install llama-cpp-python
 
 
 
 
 
 
 
 
 
27
 
28
  RUN useradd -m -u 1000 user
29
  # Switch to the "user" user
30
  USER user
 
31
  # Set home to the user's home directory
32
  ENV HOME=/home/user \
33
  PATH=/home/user/.local/bin:$PATH \
 
39
  GRADIO_THEME=huggingface \
40
  SYSTEM=spaces
41
 
42
+ WORKDIR $HOME/app
43
+
44
  # Copy the current directory contents into the container at $HOME/app setting the owner to the user
45
+ COPY --chown=user . $HOME/app
46
 
47
+ CMD ["python3", "app.py"]