Spaces:

SDbiaseval
/

stablediffusionembeddings

No application file

App Files Files Community

cakiki committed on Oct 24, 2022

Commit

99cea46

1 Parent(s): 125e851

Upload 2 files

Browse files

Files changed (2) hide show

dataset.py +110 -0
vae_embeddings.ipynb +276 -0

dataset.py ADDED Viewed

	@@ -0,0 +1,110 @@

+# Copyright 2020 The HuggingFace Datasets Authors and the current dataset script contributor.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# TODO: Address all TODOs and remove all explanatory comments
+"""TODO: Add a description here."""
+import zipfile
+import os
+import datasets
+from PIL import Image
+from io import BytesIO
+# TODO: Name of the dataset usually match the script name with CamelCase instead of snake_case
+class sdbias(datasets.GeneratorBasedBuilder):
+    """TODO: Short description of my dataset."""
+    VERSION = datasets.Version("1.1.0")
+    # This is an example of a dataset with multiple configurations.
+    # If you don't want/need to define several sub-sets in your dataset,
+    # just remove the BUILDER_CONFIG_CLASS and the BUILDER_CONFIGS attributes.
+    # If you need to make complex sub-parts in the datasets with configurable options
+    # You can create your own builder configuration class to store attribute, inheriting from datasets.BuilderConfig
+    # BUILDER_CONFIG_CLASS = MyBuilderConfig
+    # You will be able to load one or the other configurations in the following list with
+    # data = datasets.load_dataset('my_dataset', 'first_domain')
+    # data = datasets.load_dataset('my_dataset', 'second_domain')
+    BUILDER_CONFIGS = [
+        datasets.BuilderConfig(name="first_domain", version=VERSION, description="This part of my dataset covers a first domain"),
+    ]
+    DEFAULT_CONFIG_NAME = "first_domain"  # It's not mandatory to have a default configuration. Just use one if it make sense.
+    def _info(self):
+        if self.config.name == "first_domain":  # This is the name of the configuration selected in BUILDER_CONFIGS above
+            features = datasets.Features(
+                {
+                    "adjective": datasets.Value("string"),
+                    "profession": datasets.Value("string"),
+                    "seed": datasets.Value("int32"),
+                    "image": datasets.Image()
+                    # These are the features of your dataset like images, labels ...
+                }
+            )
+        return datasets.DatasetInfo(
+            # This is the description that will appear on the datasets page.
+            description="bla",
+            # This defines the different columns of the dataset and their types
+            features=features,  # Here we define them above because they are different between the two configurations
+            # If there's a common (input, target) tuple from the features, uncomment supervised_keys line below and
+            # specify them. They'll be used if as_supervised=True in builder.as_dataset.
+            # supervised_keys=("sentence", "label"),
+            # Homepage of the dataset for documentation
+            homepage="bla",
+            # License for the dataset if available
+            license="bla",
+            # Citation for the dataset
+            citation="bli",
+        )
+    def _split_generators(self, dl_manager):
+        # TODO: This method is tasked with downloading/extracting the data and defining the splits depending on the configuration
+        # If several configurations are possible (listed in BUILDER_CONFIGS), the configuration selected by the user is in self.config.name
+        # dl_manager is a datasets.download.DownloadManager that can be used to download and extract URLS
+        # It can accept any type or nested list/dict and will give back the same structure with the url replaced with path to local files.
+        # By default the archives will be extracted and a path to a cached folder where they are extracted is returned instead of the archive
+        data_dir = "/mnt/1da05489-3812-4f15-a6e5-c8d3c57df39e/StableDiffusionBiasExplorer/zipped_images"
+        return [
+            datasets.SplitGenerator(
+                name=datasets.Split.TRAIN,
+                # These kwargs will be passed to _generate_examples
+                gen_kwargs={
+                    "filepath":data_dir,
+                    "split": "train",
+                },
+            ),
+        ]
+    # method parameters are unpacked from `gen_kwargs` as given in `_split_generators`
+    def _generate_examples(self, filepath, split):
+        zip_files = os.listdir(filepath)
+        key = 0
+        for zip_file in zip_files:
+            with zipfile.ZipFile(filepath + "/" + zip_file, "r") as zf:
+                for f in zf.filelist:
+                    if ".jpg" in f.filename:
+                        jpg_content = BytesIO(zf.read(f))
+                        with Image.open(jpg_content) as image:
+                            yield key, {
+                                "adjective": zip_file.split("_", 1)[0],
+                                "profession": zip_file.split("_", 1)[-1].replace(".zip",""),
+                                "seed": int(f.filename.split("Seed_")[-1].split("/")[0]),
+                                "image": image,
+                            }
+                        key+=1

vae_embeddings.ipynb ADDED Viewed

	@@ -0,0 +1,276 @@

+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "873b1354-b85f-4c5b-9163-95190f07b39a",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "import zipfile\n",
+    "from PIL import Image\n",
+    "from io import BytesIO\n",
+    "import numpy as np\n",
+    "from datasets import load_dataset\n",
+    "import torch\n",
+    "from diffusers import AutoencoderKL, UNet2DModel, UNet2DConditionModel\n",
+    "import pickle"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "35949720-3e01-43b0-8487-a1b2131d5a9e",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def preprocess_image(image):\n",
+    "    w, h = image.size\n",
+    "    w, h = map(lambda x: x - x % 32, (w, h))  # resize to integer multiple of 32\n",
+    "    image = image.resize((w, h), resample=Image.Resampling.LANCZOS)\n",
+    "    image = np.array(image).astype(np.float32) / 255.0\n",
+    "    image = image[None].transpose(0, 3, 1, 2)\n",
+    "    return 2.0 * image - 1.0\n",
+    "\n",
+    "def vae_embedding(preprocessed, num_samples=5, device=\"cuda\"):\n",
+    "    with torch.no_grad():\n",
+    "        processed_image = preprocessed.to(device=device)\n",
+    "        latent_dist = vae.encode(processed_image).latent_dist\n",
+    "        t = [0.18215*latent_dist.sample().to(\"cpu\").squeeze() for i in range(num_samples)] # sample num_samples latent vecs\n",
+    "        t = torch.stack(t) # stack them\n",
+    "        return torch.mean(t, axis=0).numpy() #average them. output shape: (4,64,64)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "id": "6ebd9d84-98f7-4883-ac4b-0ec875b86911",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "Using custom data configuration SDbiaseval--dataset-cc8e38e46c1acd54\n",
+      "Found cached dataset parquet (/mnt/1da05489-3812-4f15-a6e5-c8d3c57df39e/cache/huggingface/SDbiaseval___parquet/SDbiaseval--dataset-cc8e38e46c1acd54/0.0.0/2a3b91fbd88a2c90d1dbbb32b460cf621d31bd5b05b934492fdef7d8d6f236ec)\n"
+     ]
+    },
+    {
+     "data": {
+      "application/vnd.jupyter.widget-view+json": {
+       "model_id": "f184861d2e2749c9b7c1c1ea3910be27",
+       "version_major": 2,
+       "version_minor": 0
+      },
+      "text/plain": [
+       "  0%|          | 0/1 [00:00<?, ?it/s]"
+      ]
+     },
+     "metadata": {},
+     "output_type": "display_data"
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 196 ms, sys: 23.3 ms, total: 219 ms\n",
+      "Wall time: 2.51 s\n"
+     ]
+    }
+   ],
+   "source": [
+    "%%time\n",
+    "# dset = load_dataset(\"./dataset.py\", ignore_verifications=True) This uses the loading script and loads data from the zipped folders\n",
+    "dset = load_dataset(\"SDbiaseval/dataset\")\n",
+    "ds = dset[\"train\"]"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "fd832e2b-6ced-43ca-a4ca-fd54f523d22e",
+   "metadata": {
+    "tags": []
+   },
+   "outputs": [],
+   "source": [
+    "vae = AutoencoderKL.from_pretrained(\"CompVis/stable-diffusion-v1-4\", subfolder=\"vae\");\n",
+    "vae.eval()\n",
+    "vae.to(\"cuda\");"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "b2af2692-a372-4b96-8250-8c83c122457d",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "19554 batches of 16. Last batch of size 15.\n"
+     ]
+    }
+   ],
+   "source": [
+    "ix = np.arange(len(ds))\n",
+    "np.random.shuffle(ix)\n",
+    "batch_size = 16\n",
+    "batche_indices = np.array_split(ix, np.ceil(len(ix)/batch_size))\n",
+    "print(f\"{len(batche_indices)} batches of {batch_size}. Last batch of size {len(batche_indices[-1])}.\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
+   "id": "8a54fdf1-f0e5-487e-b53d-afc8dbcc989c",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 9h 52min 30s, sys: 2min 25s, total: 9h 54min 55s\n",
+      "Wall time: 7h 54min 48s\n"
+     ]
+    }
+   ],
+   "source": [
+    "%%time\n",
+    "embs = []\n",
+    "for i in batche_indices:\n",
+    "    imx = ds.select(i)[\"image\"]\n",
+    "    preprocessed = np.concatenate([preprocess_image(im) for im in imx])\n",
+    "    emb = vae_embedding(torch.from_numpy(preprocessed), num_samples=10)\n",
+    "    embs.append(emb)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 16,
+   "id": "06d9346c-912f-4e24-a0ff-d5386c1780a1",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "with open('embs.pkl', 'wb') as f:\n",
+    "    pickle.dump(embs, f)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "3d0cbe87-dfb2-4c59-adf5-b4d015e2d441",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "embeddings = np.concatenate(embs)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "a6e826a9-93e0-4298-813d-9c42d139ff96",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "with open(\"embs.pkl\", \"rb\") as f:\n",
+    "    embeddings = pickle.load(f)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "id": "0783bb60-5439-4a62-a4ac-15198688b331",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 3.82 s, sys: 4.34 s, total: 8.16 s\n",
+      "Wall time: 8.2 s\n"
+     ]
+    }
+   ],
+   "source": [
+    "%%time\n",
+    "embeddings = np.concatenate(embeddings)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "id": "50369f37-a4f1-4a7c-89dd-b4ef9a8ebf8b",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "(312860, 4, 64, 64)"
+      ]
+     },
+     "execution_count": 6,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "embeddings.shape"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "id": "93f1ea7b-cbcd-49c3-a7c7-4ea26012f9b3",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 0 ns, sys: 10.3 s, total: 10.3 s\n",
+      "Wall time: 10.3 s\n"
+     ]
+    }
+   ],
+   "source": [
+    "%%time\n",
+    "with open('vae_embeddings.npy', 'wb') as f:\n",
+    "    np.save(f, embeddings)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "2b316682-f5cc-44d7-a8ed-f1da9b6c3089",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.9.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}