Spaces: Running

Yang Gu committed · Commit 78e34bc · 1 Parent(s): 397aeb0

Refine SD turbo

Browse files
demo/sd-turbo/index.html
CHANGED
@@ -9,8 +9,8 @@
         window.AutoTokenizer = AutoTokenizer;
         env.localModelPath = 'models';
     </script>
-    <script src="https://cdn.jsdelivr.net/npm/onnxruntime-web@dev/dist/ort.webgpu.min.js">
-
+    <script src="https://cdn.jsdelivr.net/npm/onnxruntime-web@dev/dist/ort.webgpu.min.js"></script>
+    <script src="../../util.js"></script>

 <head>
     <title>Stable Diffusion Turbo</title>
@@ -57,6 +57,7 @@
         </canvas>
     </div>
     <p class="text-lg-start">
+        <text id="model-progress">Downloading model</text><br />
         <div id="status" style="font: 1em consolas;"></div>
     </p>
 </div>
@@ -226,26 +227,6 @@ fn main(@location(0) fragUV : vec2<f32>) -> @location(0) vec4<f32> {
     return data;
 }

-async function fetchAndCache(base_url, model_path) {
-    const url = `${base_url}/${model_path}`;
-    try {
-        const cache = await caches.open("onnx");
-        let cachedResponse = await cache.match(url);
-        if (cachedResponse == undefined) {
-            await cache.add(url);
-            cachedResponse = await cache.match(url);
-            log(`${model_path} (network)`);
-        } else {
-            log(`${model_path} (cached)`);
-        }
-        const data = await cachedResponse.arrayBuffer();
-        return data;
-    } catch (error) {
-        log(`${model_path} (network)`);
-        return await fetch(url).then(response => response.arrayBuffer());
-    }
-}
-
 function uploadToGPU(buffer, values, type) {

     const stagingBuffer = deviceWebgpu.createBuffer({
@@ -278,62 +259,37 @@ fn main(@location(0) fragUV : vec2<f32>) -> @location(0) vec4<f32> {
 }

 async function load_models(models) {
-    const cache = await caches.open("onnx");
-    let missing = 0;
-    for (const [name, model] of Object.entries(models)) {
-        const url = `${config.model}/${model.url}`;
-        let cachedResponse = await cache.match(url);
-        if (cachedResponse === undefined) {
-            missing += model.size;
-        }
-    }
-    if (missing > 0) {
-        log(`downloading ${missing} MB from network ... it might take a while`);
-    } else {
-        log("loading...");
-    }
     let loadedCount = 0;
     for (const [name, model] of Object.entries(models)) {
-
-
-
-
-
-        const model_bytes = await fetchAndCache(config.model, model.url);
-        const sess_opt = { ...opt, ...model.opt };
-        // profiling
-        //ort.env.webgpu.profiling = { mode: "default" };
-        models[name].sess = await ort.InferenceSession.create(model_bytes, sess_opt);
-        const stop = performance.now();
-        loadedCount++;
-        log(`${model.url} in ${(stop - start).toFixed(1)}ms`);
-        } catch (e) {
-            log(`${model.url} failed, ${e}`);
-        }
+        const model_bytes = await getModelOPFS(model.url, `models/${model.url}`, false);
+        const sess_opt = { ...opt, ...model.opt };
+        // profiling
+        //ort.env.webgpu.profiling = { mode: "default" };
+        models[name].sess = await ort.InferenceSession.create(model_bytes, sess_opt);
     }
+    document.getElementById('model-progress').innerHTML = 'Model download finished. You may now click "Send" button to generate a new image.';
+    webgpuResourceInitialize();
     const latent_shape = [1, 4, 64, 64];
     latentData = randn_latents(latent_shape, sigma);
     uploadToGPU(latentBuffer, latentData, "float32");
     submitComputeTask(prescaleLatentSpacePipeline, prescaleLatentSpaceBindGroup);
-
-    log("ready.");
 }

 const config = getConfig();

 const models = {
     "unet": {
-        url: "unet/model.onnx", size: 640,
+        url: "unet.onnx", size: 640,
         // should have 'steps: 1' but will fail to create the session
         opt: { freeDimensionOverrides: { batch_size: 1, num_channels: 4, height: 64, width: 64, sequence_length: 77, } }
     },
     "text_encoder": {
-        url: "text_encoder/model.onnx", size: 1700,
+        url: "text_encoder.onnx", size: 1700,
         // should have 'sequence_length: 77' but produces a bad image
         opt: { freeDimensionOverrides: { batch_size: 1, } },
     },
     "vae_decoder": {
-        url: "vae_decoder/model.onnx", size: 95,
+        url: "vae_decoder.onnx", size: 95,
         opt: { freeDimensionOverrides: { batch_size: 1, num_channels_latent: 4, height_latent: 64, width_latent: 64 } }
     }
 }
@@ -714,4 +670,4 @@ fn main(@location(0) fragUV : vec2<f32>) -> @location(0) vec4<f32> {
 }
 </script>

-</html>
+</html>
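Note on the change above: the Cache API based fetchAndCache helper is removed in favor of getModelOPFS from the new shared util.js, which persists model bytes in the browser's Origin Private File System so they survive page reloads, and reports download progress. A minimal sketch of that caching pattern, with an illustrative name (getCachedModel is hypothetical; the real helper is getModelOPFS in util.js):

    // Sketch of OPFS-backed model caching; getCachedModel is a hypothetical
    // name, the actual helper in util.js is getModelOPFS(name, url, updateModel).
    async function getCachedModel(name, url) {
        // The OPFS root is origin-scoped and survives page reloads.
        const root = await navigator.storage.getDirectory();
        try {
            // Cache hit: the model was stored by an earlier visit.
            const fileHandle = await root.getFileHandle(name);
            const file = await fileHandle.getFile();
            return await file.arrayBuffer();
        } catch (e) {
            // Cache miss: download, persist for next time, return the bytes.
            const response = await fetch(url);
            const buffer = await response.arrayBuffer();
            const fileHandle = await root.getFileHandle(name, { create: true });
            const writable = await fileHandle.createWritable();
            await writable.write(buffer);
            await writable.close();
            return buffer;
        }
    }

It would be called once per model, much like the diff's getModelOPFS(model.url, `models/${model.url}`, false), e.g. const bytes = await getCachedModel("unet.onnx", "models/unet.onnx");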
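The per-model opt entries pin the models' symbolic ONNX input dimensions through onnxruntime-web's freeDimensionOverrides session option, since the graphs declare free dimensions such as batch_size. A hedged sketch of how one such session is created, under the assumption that the page-level opt carries the WebGPU execution provider (the diff only shows sess_opt = { ...opt, ...model.opt }):

    // Sketch: create the vae_decoder session with its free dimensions pinned.
    // `modelBytes` would come from getModelOPFS; executionProviders is an
    // assumption about what the page-level `opt` contains.
    const sessionOptions = {
        executionProviders: ["webgpu"],
        freeDimensionOverrides: {
            batch_size: 1,
            num_channels_latent: 4,
            height_latent: 64,
            width_latent: 64,
        },
    };
    const session = await ort.InferenceSession.create(modelBytes, sessionOptions);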
demo/sd-turbo/models/{text_encoder/model.onnx → text_encoder.onnx}
RENAMED
File without changes

demo/sd-turbo/models/{unet/model.onnx → unet.onnx}
RENAMED
File without changes

demo/sd-turbo/models/{vae_decoder/model.onnx → vae_decoder.onnx}
RENAMED
File without changes
main.js
CHANGED
@@ -49,21 +49,23 @@ function createElem(tag, attrs = {}, children = []) {
     return elem;
 }

+// todo: Musicgen
+
 const pageCategories = [
   {
     title: `Computer Vision`,
     description: `Computer Vision`,
     demos: {
-      gemma: {
-        name: 'Stable Diffusion Turbo',
-        description: `Stable Diffusion Turbo from https://github.com/guschmue/ort-webgpu/tree/master/sd-turbo`,
-        filename: "sd-turbo",
-      },
       sam: {
         name: 'Segment Anything',
         description: `Segment Anything from https://github.com/guschmue/ort-webgpu/tree/master/segment-anything`,
         filename: "sam",
       },
+      sdturbo: {
+        name: 'Stable Diffusion Turbo',
+        description: `Stable Diffusion Turbo from https://github.com/guschmue/ort-webgpu/tree/master/sd-turbo`,
+        filename: "sd-turbo",
+      },
       yolo: {
         name: 'Yolo',
         description: `Yolo V9 from https://github.com/guschmue/ort-webgpu/tree/master/yolov9`,
util.js
CHANGED
@@ -1,7 +1,7 @@
-function updateGetModelProgress(loaded, total) {
+function updateGetModelProgress(name, loaded, total) {
   const progressElement = document.getElementById('model-progress');
   if (total === 0) {
-    progressElement.innerHTML =
+    progressElement.innerHTML = `Model ${name} is already in local cache`;
     return;
   }
   const percent = ((loaded / total) * 100).toFixed(2);
@@ -11,7 +11,7 @@ function updateGetModelProgress(loaded, total) {
   } else {
     progress = "Downloading";
   }
-  progressElement.innerHTML = `${progress} model: Total ${total} bytes, loaded ${loaded} bytes, ${percent}%`;
+  progressElement.innerHTML = `${progress} model ${name}: Total ${total} bytes, loaded ${loaded} bytes, ${percent}%`;
 }

 // Get model via Origin Private File System
@@ -21,7 +21,7 @@ async function getModelOPFS(name, url, updateModel) {

   async function updateFile() {
     const response = await fetch(url);
-    const buffer = await readResponse(response, updateGetModelProgress);
+    const buffer = await readResponse(name, response, updateGetModelProgress);
     fileHandle = await root.getFileHandle(name, {create: true});
     const writable = await fileHandle.createWritable();
     await writable.write(buffer);
@@ -36,14 +36,14 @@ async function getModelOPFS(name, url, updateModel) {
   try {
     fileHandle = await root.getFileHandle(name);
     const blob = await fileHandle.getFile();
-    updateGetModelProgress(0, 0);
+    updateGetModelProgress(name, 0, 0);
     return await blob.arrayBuffer();
   } catch (e) {
     return await updateFile();
   }
 }

-async function readResponse(response, progressCallback) {
+async function readResponse(name, response, progressCallback) {
   const contentLength = response.headers.get('Content-Length');
   let total = parseInt(contentLength ?? '0');
   let buffer = new Uint8Array(total);
@@ -65,7 +65,7 @@ async function readResponse(response, progressCallback) {
     loaded = newLoaded;

     if (progressCallback) {
-      progressCallback(loaded, total);
+      progressCallback(name, loaded, total);
     }

     return read();
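For context on the util.js changes: readResponse streams the response body chunk by chunk so updateGetModelProgress can render incremental download progress, and this commit threads the model name through that callback chain. A simplified, self-contained sketch of the streaming pattern (the real readResponse also handles a missing Content-Length by growing the buffer, omitted here):

    // Simplified sketch of streaming a fetch response with progress reporting.
    // Assumes the server sends a Content-Length header.
    async function readWithProgress(name, response, progressCallback) {
        const total = parseInt(response.headers.get('Content-Length') ?? '0');
        const buffer = new Uint8Array(total);
        const reader = response.body.getReader();
        let loaded = 0;
        while (true) {
            const { done, value } = await reader.read();
            if (done) break;
            buffer.set(value, loaded);  // append the chunk at the current offset
            loaded += value.length;
            if (progressCallback) progressCallback(name, loaded, total);
        }
        return buffer;
    }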