vettorazi commited on
Commit
a756e18
1 Parent(s): dff4a80

new dockerfile

Browse files
Files changed (5) hide show
  1. Dockerfile +54 -0
  2. entrypoint.sh +14 -0
  3. requirements.txt +23 -0
  4. wsj-api-rnd-v2.json +162 -0
  5. wsj-server.py +107 -0
Dockerfile ADDED
@@ -0,0 +1,54 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
FROM nvidia/cuda:11.8.0-cudnn8-runtime-ubuntu22.04

ENV DEBIAN_FRONTEND=noninteractive \
    TZ=America/Los_Angeles

# NOTE: wget added — the model-download step below uses it, but it was
# missing from the original package list, which broke the build.
RUN apt-get update && apt-get install -y \
    git \
    wget \
    python3 \
    python3-pip \
    ffmpeg \
    libsm6 \
    libxext6 \
    libgl1-mesa-glx \
    && rm -rf /var/lib/apt/lists/*

WORKDIR /code

COPY ./requirements.txt /code/requirements.txt

# Run as an unprivileged user; pip installs land in ~/.local (added to PATH).
RUN useradd -m -u 1000 user
USER user
ENV HOME=/home/user \
    PATH=/home/user/.local/bin:$PATH

RUN pip install --no-cache-dir --upgrade pip setuptools wheel
RUN pip install --no-cache-dir --upgrade -r /code/requirements.txt

WORKDIR $HOME/app

# Clone ComfyUI and install its own requirements.
RUN git clone https://github.com/comfyanonymous/ComfyUI.git . && \
    pip install --no-cache-dir -r requirements.txt

# Download the FLUX.1-dev models.
# NOTE(review): FLUX.1-dev is a gated Hugging Face repo — these downloads may
# require an auth header (e.g. --header="Authorization: Bearer $HF_TOKEN"); confirm.
# The VAE is saved under the exact filename the workflow JSON
# (wsj-api-rnd-v2.json, node "10") expects: diffusion_pytorch_model_flux.safetensors.
RUN mkdir -p ./models/unet ./models/vae ./models/clip && \
    wget -c https://huggingface.co/black-forest-labs/FLUX.1-dev/resolve/main/flux1-dev.safetensors -P ./models/unet/ && \
    wget -c https://huggingface.co/black-forest-labs/FLUX.1-dev/resolve/main/vae/diffusion_pytorch_model.safetensors -O ./models/vae/diffusion_pytorch_model_flux.safetensors && \
    wget -c https://huggingface.co/comfyanonymous/flux_text_encoders/resolve/main/clip_l.safetensors -P ./models/clip/ && \
    wget -c https://huggingface.co/comfyanonymous/flux_text_encoders/resolve/main/t5xxl_fp16.safetensors -P ./models/clip/ && \
    wget -c https://huggingface.co/comfyanonymous/flux_text_encoders/resolve/main/t5xxl_fp8_e4m3fn.safetensors -P ./models/clip/

# Copy the API server and the workflow template it opens at request time.
# (The JSON was never copied before, so /generate-image failed with
# FileNotFoundError inside the container.)
COPY --chown=user wsj-server.py .
COPY --chown=user wsj-api-rnd-v2.json .

# Expose ports for ComfyUI (8188) and the wsj-server FastAPI app (7860)
EXPOSE 8188 7860

# Create entrypoint script.  python3 is used because the base image provides
# no `python` binary; printf avoids echo's shell-dependent escape handling.
RUN printf '%s\n' \
    '#!/bin/bash' \
    'python3 main.py --listen 0.0.0.0 --port 8188 --use-split-cross-attention &' \
    'python3 wsj-server.py &' \
    'wait -n' > entrypoint.sh && chmod +x entrypoint.sh

CMD ["./entrypoint.sh"]
entrypoint.sh ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
#!/bin/bash
# Launch ComfyUI and the wsj-server FastAPI wrapper side by side, and exit
# as soon as either process dies so the container can restart cleanly.
set -e

# Start ComfyUI.  python3: the Docker image installs only the python3
# binary, so the original `python` invocation could not be found.
python3 main.py --listen &

# Start wsj-server
python3 wsj-server.py &

# Wait for any process to exit
wait -n

# Exit with status of process that exited first
exit $?
requirements.txt ADDED
@@ -0,0 +1,23 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ fastapi
2
+ uvicorn[standard]
3
+ pillow
4
+ torch
5
+ torchsde
6
+ torchvision
7
+ torchaudio
8
+ einops
9
+ transformers>=4.28.1
10
+ tokenizers>=0.13.3
11
+ sentencepiece
12
+ safetensors>=0.4.2
13
+ aiohttp
14
+ pyyaml
15
+ # Pillow removed here — duplicate of "pillow" already listed above
16
+ scipy
17
+ tqdm
18
+ psutil
19
+
20
+ #non essential dependencies:
21
+ kornia>=0.7.1
22
+ spandrel
23
+ soundfile
wsj-api-rnd-v2.json ADDED
@@ -0,0 +1,162 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "5": {
3
+ "inputs": {
4
+ "width": 1024,
5
+ "height": 1024,
6
+ "batch_size": 1
7
+ },
8
+ "class_type": "EmptyLatentImage",
9
+ "_meta": {
10
+ "title": "Empty Latent Image"
11
+ }
12
+ },
13
+ "6": {
14
+ "inputs": {
15
+ "text": "Create a painting in the style of American Realism or American Gothic, inspired by a political landscape reflecting the growing influence of evangelical movements in the U.S. Depict a large revival tent under a darkened sky, with a preacher, Lance Wallnau, standing among a crowd of around 2,000 people. The preacher's posture should convey urgency as he lays hands on those seeking prayer, emphasizing the idea of political and spiritual mobilization. In the distance, banners with slogans supporting Donald Trump are visible, alongside imagery evoking the tension between religion and politics, with Christian symbols intertwined with political messages. The atmosphere should evoke a somber, yet intense energy, blending realism with a sense of looming uncertainty and urgency. Include the presence of JD Vance addressing the crowd in the background, emphasizing the merging of faith and politics",
16
+ "clip": [
17
+ "11",
18
+ 0
19
+ ]
20
+ },
21
+ "class_type": "CLIPTextEncode",
22
+ "_meta": {
23
+ "title": "articlePrompt"
24
+ }
25
+ },
26
+ "8": {
27
+ "inputs": {
28
+ "samples": [
29
+ "13",
30
+ 0
31
+ ],
32
+ "vae": [
33
+ "10",
34
+ 0
35
+ ]
36
+ },
37
+ "class_type": "VAEDecode",
38
+ "_meta": {
39
+ "title": "VAE Decode"
40
+ }
41
+ },
42
+ "9": {
43
+ "inputs": {
44
+ "filename_prefix": "ComfyUI",
45
+ "images": [
46
+ "8",
47
+ 0
48
+ ]
49
+ },
50
+ "class_type": "SaveImage",
51
+ "_meta": {
52
+ "title": "Save Image"
53
+ }
54
+ },
55
+ "10": {
56
+ "inputs": {
57
+ "vae_name": "diffusion_pytorch_model_flux.safetensors"
58
+ },
59
+ "class_type": "VAELoader",
60
+ "_meta": {
61
+ "title": "Load VAE"
62
+ }
63
+ },
64
+ "11": {
65
+ "inputs": {
66
+ "clip_name1": "t5xxl_fp16.safetensors",
67
+ "clip_name2": "clip_l.safetensors",
68
+ "type": "flux"
69
+ },
70
+ "class_type": "DualCLIPLoader",
71
+ "_meta": {
72
+ "title": "DualCLIPLoader"
73
+ }
74
+ },
75
+ "12": {
76
+ "inputs": {
77
+ "unet_name": "flux1-dev.safetensors",
78
+ "weight_dtype": "default"
79
+ },
80
+ "class_type": "UNETLoader",
81
+ "_meta": {
82
+ "title": "Load Diffusion Model"
83
+ }
84
+ },
85
+ "13": {
86
+ "inputs": {
87
+ "noise": [
88
+ "25",
89
+ 0
90
+ ],
91
+ "guider": [
92
+ "22",
93
+ 0
94
+ ],
95
+ "sampler": [
96
+ "16",
97
+ 0
98
+ ],
99
+ "sigmas": [
100
+ "17",
101
+ 0
102
+ ],
103
+ "latent_image": [
104
+ "5",
105
+ 0
106
+ ]
107
+ },
108
+ "class_type": "SamplerCustomAdvanced",
109
+ "_meta": {
110
+ "title": "SamplerCustomAdvanced"
111
+ }
112
+ },
113
+ "16": {
114
+ "inputs": {
115
+ "sampler_name": "euler"
116
+ },
117
+ "class_type": "KSamplerSelect",
118
+ "_meta": {
119
+ "title": "KSamplerSelect"
120
+ }
121
+ },
122
+ "17": {
123
+ "inputs": {
124
+ "scheduler": "simple",
125
+ "steps": 20,
126
+ "denoise": 1,
127
+ "model": [
128
+ "12",
129
+ 0
130
+ ]
131
+ },
132
+ "class_type": "BasicScheduler",
133
+ "_meta": {
134
+ "title": "BasicScheduler"
135
+ }
136
+ },
137
+ "22": {
138
+ "inputs": {
139
+ "model": [
140
+ "12",
141
+ 0
142
+ ],
143
+ "conditioning": [
144
+ "6",
145
+ 0
146
+ ]
147
+ },
148
+ "class_type": "BasicGuider",
149
+ "_meta": {
150
+ "title": "BasicGuider"
151
+ }
152
+ },
153
+ "25": {
154
+ "inputs": {
155
+ "noise_seed": 533166222602070
156
+ },
157
+ "class_type": "RandomNoise",
158
+ "_meta": {
159
+ "title": "RandomNoise"
160
+ }
161
+ }
162
+ }
wsj-server.py ADDED
@@ -0,0 +1,107 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #This is an example that uses the websockets api to know when a prompt execution is done
2
+ #Once the prompt execution is done it downloads the images using the /history endpoint
3
+
4
+ import websocket #NOTE: websocket-client (https://github.com/websocket-client/websocket-client)
5
+ import uuid
6
+ import json
7
+ import urllib.request
8
+ import urllib.parse
9
+ import random
10
+ import io
11
+ from fastapi import FastAPI, Response
12
+ from pydantic import BaseModel
13
+ from PIL import Image
14
+
15
+ server_address = "127.0.0.1:8188"
16
+ client_id = str(uuid.uuid4())
17
+
18
+ def queue_prompt(prompt):
19
+ p = {"prompt": prompt, "client_id": client_id}
20
+ data = json.dumps(p).encode('utf-8')
21
+ req = urllib.request.Request("http://{}/prompt".format(server_address), data=data)
22
+ return json.loads(urllib.request.urlopen(req).read())
23
+
24
+ def get_image(filename, subfolder, folder_type):
25
+ data = {"filename": filename, "subfolder": subfolder, "type": folder_type}
26
+ url_values = urllib.parse.urlencode(data)
27
+ with urllib.request.urlopen("http://{}/view?{}".format(server_address, url_values)) as response:
28
+ return response.read()
29
+
30
+ def get_history(prompt_id):
31
+ with urllib.request.urlopen("http://{}/history/{}".format(server_address, prompt_id)) as response:
32
+ return json.loads(response.read())
33
+
34
+ def get_images(ws, prompt):
35
+ prompt_id = queue_prompt(prompt)['prompt_id']
36
+ output_images = {}
37
+ while True:
38
+ out = ws.recv()
39
+ if isinstance(out, str):
40
+ message = json.loads(out)
41
+ if message['type'] == 'executing':
42
+ data = message['data']
43
+ if data['node'] is None and data['prompt_id'] == prompt_id:
44
+ break #Execution is done
45
+ else:
46
+ # If you want to be able to decode the binary stream for latent previews, here is how you can do it:
47
+ # bytesIO = BytesIO(out[8:])
48
+ # preview_image = Image.open(bytesIO) # This is your preview in PIL image format, store it in a global
49
+ continue #previews are binary data
50
+
51
+ history = get_history(prompt_id)[prompt_id]
52
+ for node_id in history['outputs']:
53
+ node_output = history['outputs'][node_id]
54
+ images_output = []
55
+ if 'images' in node_output:
56
+ for image in node_output['images']:
57
+ image_data = get_image(image['filename'], image['subfolder'], image['type'])
58
+ images_output.append(image_data)
59
+ output_images[node_id] = images_output
60
+
61
+ return output_images
62
+
63
+ app = FastAPI()
64
+
65
+ class PromptRequest(BaseModel):
66
+ prompt: str
67
+
68
+ @app.post("/generate-image")
69
+ async def generate_image(prompt_request: PromptRequest):
70
+ # Load the workflow JSON
71
+ with open("wsj-api-rnd-v2.json", "r", encoding="utf-8") as f:
72
+ workflow_jsondata = f.read()
73
+
74
+ jsonwf = json.loads(workflow_jsondata)
75
+
76
+ # Set the text prompt
77
+ jsonwf["6"]["inputs"]["text"] = prompt_request.prompt
78
+
79
+ # Set a random seed
80
+ seednum = random.randint(0, 10000)
81
+ jsonwf["25"]["inputs"]["noise_seed"] = seednum
82
+
83
+ # Connect to WebSocket
84
+ ws = websocket.WebSocket()
85
+ ws.connect(f"ws://{server_address}/ws?clientId={client_id}")
86
+
87
+ # Generate images
88
+ images = get_images(ws, jsonwf)
89
+ ws.close()
90
+
91
+ # Assuming we want to return the first image from the first node
92
+ first_node = next(iter(images))
93
+ image_data = images[first_node][0]
94
+
95
+ # Convert image data to PIL Image
96
+ image = Image.open(io.BytesIO(image_data))
97
+
98
+ # Convert PIL Image to bytes
99
+ img_byte_arr = io.BytesIO()
100
+ image.save(img_byte_arr, format='PNG')
101
+ img_byte_arr = img_byte_arr.getvalue()
102
+
103
+ return Response(content=img_byte_arr, media_type="image/png")
104
+
105
if __name__ == "__main__":
    # Serve the FastAPI app on all interfaces; port 7860 matches the
    # Dockerfile's EXPOSE and is the conventional Hugging Face Spaces port.
    import uvicorn
    uvicorn.run(app, host="0.0.0.0", port=7860)