none committed on
Commit
731bd50
·
1 Parent(s): ebb4897
Files changed (6) hide show
  1. .gitattributes +1 -0
  2. .gitignore +1 -0
  3. Dockerfile +11 -6
  4. kaggle.json.enc +2 -0
  5. libbitsandbytes_cuda124.so +3 -0
  6. start.sh +8 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ *.so filter=lfs diff=lfs merge=lfs -text
.gitignore CHANGED
@@ -1 +1,2 @@
1
  apps.json
 
 
1
  apps.json
2
+ kaggle.json
Dockerfile CHANGED
@@ -1,13 +1,13 @@
1
- # build with: docker build . --tag sctg/roco-idefics3:0.0.15 --tag sctg/roco-idefics3:latest --push
2
  # run with
3
- # docker run --gpus all --user=42420:42420 -p 7000-8000:7000-8000 -p 8080:8080 -e HF_TOKEN=hf_TOKEN -it sctg/roco-idefics3:0.0.15 bash -i /start.sh sleep infinity
4
- # docker run --gpus all --user=42420:42420 -p 7000-8000:7000-8000 -p 8080:8080 -it sctg/roco-idefics3:0.0.15 bash -i /start.sh python /learn.py hf_...
5
  FROM cloudflare/cloudflared:latest as cloudflared
6
- FROM nvidia/cuda:12.6.2-devel-ubuntu22.04
7
  ARG NODE_MAJOR="20"
8
  RUN /usr/sbin/addgroup --gid 42420 ovh
9
  RUN /usr/sbin/useradd -u 42420 --gid 42420 -m -d /workspace -s /bin/bash ovh
10
- RUN apt update -y && apt-get install -y curl git git-lfs screen sudo \
11
  && mkdir -p /etc/apt/keyrings \
12
  && curl -fsSL https://deb.nodesource.com/gpgkey/nodesource-repo.gpg.key | gpg --dearmor -o /etc/apt/keyrings/nodesource.gpg \
13
  && echo "deb [signed-by=/etc/apt/keyrings/nodesource.gpg] https://deb.nodesource.com/node_$NODE_MAJOR.x nodistro main" | tee /etc/apt/sources.list.d/nodesource.list \
@@ -27,6 +27,7 @@ RUN . /workspace/.miniconda3/bin/activate && conda init --all
27
  RUN . /workspace/.miniconda3/bin/activate \
28
  && pip install -U "safetensors>=0.4.5" \
29
  && pip install -U tensorflow \
 
30
  && pip install -U 'https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release_multi-backend-refactor/bitsandbytes-0.44.1.dev0-py3-none-manylinux_2_24_x86_64.whl' \
31
  && pip install -U git+https://github.com/huggingface/transformers.git\
32
  && pip install huggingface_hub[cli] accelerate datasets peft\
@@ -39,12 +40,16 @@ RUN . /workspace/.miniconda3/bin/activate \
39
  && pip install unsloth\
40
  && pip install gradio \
41
  && pip uninstall unsloth -y \
42
- && pip install --upgrade --no-cache-dir --no-deps git+https://github.com/unslothai/unsloth.git
 
 
 
43
 
44
  RUN . /workspace/.miniconda3/bin/activate && conda install -y jupyter
45
  RUN rm -f /workspace/miniconda.sh
46
  RUN mkdir -p /workspace/.config/github-copilot/
47
  COPY apps.json.enc /workspace/.config/github-copilot/apps.json.enc
 
48
  COPY CFTOKEN.enc /workspace/.config/CFTOKEN.enc
49
  # Mandatory to run the jobs in rootless mode
50
  # USER root
 
1
+ # build with: docker build . --tag sctg/roco-idefics3:0.0.17 --tag sctg/roco-idefics3:latest --push
2
  # run with
3
+ # docker run --gpus all --user=42420:42420 -p 7000-8000:7000-8000 -p 8080:8080 -e WANDB_API_KEY=wdkfjzfjz -e HF_TOKEN=hf_TOKEN -it sctg/roco-idefics3:0.0.17 bash -i /start.sh sleep infinity
4
+ # docker run --gpus all --user=42420:42420 -p 7000-8000:7000-8000 -p 8080:8080 -it sctg/roco-idefics3:0.0.17 bash -i /start.sh python /learn.py hf_...
5
  FROM cloudflare/cloudflared:latest as cloudflared
6
+ FROM nvidia/cuda:12.6.2-cudnn-devel-ubuntu22.04
7
  ARG NODE_MAJOR="20"
8
  RUN /usr/sbin/addgroup --gid 42420 ovh
9
  RUN /usr/sbin/useradd -u 42420 --gid 42420 -m -d /workspace -s /bin/bash ovh
10
+ RUN apt update -y && apt-get install -y cmake curl git git-lfs screen sudo \
11
  && mkdir -p /etc/apt/keyrings \
12
  && curl -fsSL https://deb.nodesource.com/gpgkey/nodesource-repo.gpg.key | gpg --dearmor -o /etc/apt/keyrings/nodesource.gpg \
13
  && echo "deb [signed-by=/etc/apt/keyrings/nodesource.gpg] https://deb.nodesource.com/node_$NODE_MAJOR.x nodistro main" | tee /etc/apt/sources.list.d/nodesource.list \
 
27
  RUN . /workspace/.miniconda3/bin/activate \
28
  && pip install -U "safetensors>=0.4.5" \
29
  && pip install -U tensorflow \
30
+ && pip install -U tf-keras \
31
  && pip install -U 'https://github.com/bitsandbytes-foundation/bitsandbytes/releases/download/continuous-release_multi-backend-refactor/bitsandbytes-0.44.1.dev0-py3-none-manylinux_2_24_x86_64.whl' \
32
  && pip install -U git+https://github.com/huggingface/transformers.git\
33
  && pip install huggingface_hub[cli] accelerate datasets peft\
 
40
  && pip install unsloth\
41
  && pip install gradio \
42
  && pip uninstall unsloth -y \
43
+ && pip install --upgrade --no-cache-dir --no-deps git+https://github.com/unslothai/unsloth.git \
44
+ && pip install wandb
45
+
46
+ # The shared library only has to be readable/executable to be loaded; 0755 avoids shipping a world-writable binary (was 0777).
+ COPY --chmod=755 libbitsandbytes_cuda124.so /workspace/.miniconda3/lib/python3.12/site-packages/bitsandbytes/libbitsandbytes_cuda124.so
47
 
48
  RUN . /workspace/.miniconda3/bin/activate && conda install -y jupyter
49
  RUN rm -f /workspace/miniconda.sh
50
  RUN mkdir -p /workspace/.config/github-copilot/
51
  COPY apps.json.enc /workspace/.config/github-copilot/apps.json.enc
52
+ COPY kaggle.json.enc /workspace/.config/kaggle.json.enc
53
  COPY CFTOKEN.enc /workspace/.config/CFTOKEN.enc
54
  # Mandatory to run the jobs in rootless mode
55
  # USER root
kaggle.json.enc ADDED
@@ -0,0 +1,2 @@
 
 
 
1
+ U2FsdGVkX1+XKfjZhSpObwI5HP7f0R/U/8Paum3H41R7B3HImmd1rUJNeG4x1zFJ
2
+ HqBGdGRcJiWwKkMVOCQyFQrNJTKKOFt/wDk1FWqEoQ8=
libbitsandbytes_cuda124.so ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41c9698af520efd7212d164e394aadb42d45b5fdee0b36ed31ae25422ac29c30
3
+ size 34242400
start.sh CHANGED
@@ -37,6 +37,14 @@ if [ -f /workspace/.config/CFTOKEN.enc ]; then
37
  /usr/local/bin/cloudflared --pidfile /tmp/cf.pid --autoupdate-freq 24h0m0s tunnel run --token $CFTOKEN &
38
  fi
39
 
 
 
 
 
 
 
 
 
40
  git clone https://huggingface.co/eltorio/IDEFICS3_ROCOv2
41
  git config --global user.email "[email protected]"
42
  git config --global user.name "[email protected]"
 
37
  /usr/local/bin/cloudflared --pidfile /tmp/cf.pid --autoupdate-freq 24h0m0s tunnel run --token $CFTOKEN &
38
  fi
39
 
40
+ # Decode kaggle.json.enc file
41
+ # encoded with: openssl aes-256-cbc -base64 -md sha256 -pass pass:"$HF_TOKEN" -in kaggle.json -out kaggle.json.enc
42
+ # decode with: openssl aes-256-cbc -a -d -md sha256 -pass pass:"$HF_TOKEN" -in kaggle.json.enc -out kaggle.json
43
+ if [ -f /workspace/.config/kaggle.json.enc ]; then
44
+ mkdir -p "$HOME/.kaggle"
45
+ openssl aes-256-cbc -a -d -md sha256 -pass pass:"$HF_TOKEN" -in /workspace/.config/kaggle.json.enc -out "$HOME/.kaggle/kaggle.json" # write into the directory created above (was hard-coded /workspace/.kaggle, which only exists when HOME=/workspace)
46
+ fi
47
+
48
  git clone https://huggingface.co/eltorio/IDEFICS3_ROCOv2
49
  git config --global user.email "[email protected]"
50
  git config --global user.name "[email protected]"