Spaces:
Configuration error
Configuration error
from diffusers import StableDiffusionPipeline | |
from lora_diffusion import monkeypatch_lora, tune_lora_scale | |
import torch | |
import os | |
import gradio as gr | |
import subprocess | |
MODEL_NAME="stabilityai/stable-diffusion-2-1-base" | |
INSTANCE_DIR="./data_example" | |
OUTPUT_DIR="./output_example" | |
model_id = "stabilityai/stable-diffusion-2-1-base" | |
pipe = StableDiffusionPipeline.from_pretrained(model_id, torch_dtype=torch.float16).to("cuda") | |
#prompt = "style of sks, baby lion" | |
torch.manual_seed(1) | |
#image = pipe(prompt, num_inference_steps=50, guidance_scale= 7).images[0] #no need | |
#image # nice. diffusers are cool. #no need | |
#finetuned_lora_weights = "./lora_weight.pt" | |
#global var | |
counter = 0 | |
#Getting Lora fine-tuned weights | |
def monkeypatching(alpha, in_prompt): #, prompt, pipe): finetuned_lora_weights | |
print("****** inside monkeypatching *******") | |
print(f"in_prompt is - {str(in_prompt)}") | |
global counter | |
if counter == 0 : | |
monkeypatch_lora(pipe.unet, torch.load("./output_example/lora_weight.pt")) #finetuned_lora_weights | |
tune_lora_scale(pipe.unet, alpha) #1.00) | |
counter +=1 | |
else : | |
tune_lora_scale(pipe.unet, alpha) #1.00) | |
prompt = "style of hclu, " + str(in_prompt) #"baby lion" | |
image = pipe(prompt, num_inference_steps=50, guidance_scale=7).images[0] | |
image.save("./illust_lora.jpg") #"./contents/illust_lora.jpg") | |
return image | |
def accelerate_train_lora(steps): | |
print("*********** inside accelerate_train_lora ***********") | |
#subprocess.run(accelerate launch {"./train_lora_dreambooth.py"} \ | |
#subprocess.Popen(f'accelerate launch {"./train_lora_dreambooth.py"} \ | |
os.system( f'accelerate launch {"./train_lora_dreambooth.py"} \ | |
--pretrained_model_name_or_path={MODEL_NAME} \ | |
--instance_data_dir={INSTANCE_DIR} \ | |
--output_dir={OUTPUT_DIR} \ | |
--instance_prompt="style of hclu" \ | |
--resolution=512 \ | |
--train_batch_size=1 \ | |
--gradient_accumulation_steps=1 \ | |
--learning_rate=1e-4 \ | |
--lr_scheduler="constant" \ | |
--lr_warmup_steps=0 \ | |
--max_train_steps={int(steps)}') #,shell=True) #30000 | |
print("*********** completing accelerate_train_lora ***********") | |
return "./output_example/lora_weight.pt" | |
with gr.Blocks() as demo: | |
gr.Markdown("""<h1><center>LORA - Low-rank Adaptation for Fast Text-to-Image Diffusion Fine-tuning</center></h1> | |
""") | |
gr.HTML("<p>You can skip the queue by duplicating this space and upgrading to gpu in settings: <a style='display:inline-block' href='https://huggingface.co/spaces/ysharma/Low-rank-Adaptation?duplicate=true'><img src='https://img.shields.io/badge/-Duplicate%20Space-blue?labelColor=white&style=flat&logo=&logoWidth=14' alt='Duplicate Space'></a></p>") | |
gr.Markdown( | |
"""**Main Features**<br>- Fine-tune Stable diffusion models twice as faster than dreambooth method, by Low-rank Adaptation.<br>- Get insanely small end result, easy to share and download.<br>- Easy to use, compatible with diffusers.<br>- Sometimes even better performance than full fine-tuning<br><br>Please refer to the GitHub repo this Space is based on, here - <a href = "https://github.com/cloneofsimo/lora">LORA</a>. You can also refer to this tweet by AK to quote/retweet/like here on <a href="https://twitter.com/_akhaliq/status/1601120767009513472">Twitter</a>.This Gradio Space is an attempt to explore this novel LORA approach to fine-tune Stable diffusion models, using the power and flexibility of Gradio! The higher number of steps results in longer training time and better fine-tuned SD models.<br><br><b>To use this Space well:</b><br>- First, upload your set of images (4-5), then enter the number of fine-tuning steps, and then press the 'Train LORA model' button. This will produce your fine-tuned model weights.<br>- Enter a prompt, set the alpha value using the Slider (nearer to 1 implies overfitting to the uploaded images), and then press the 'Inference' button. This will produce an image by the newly fine-tuned model.<br><b>Bonus:</b>You can download your fine-tuned model weights from the Gradio file component. The smaller size of LORA models (around 3-4 MB files) is the main highlight of this 'Low-rank Adaptation' approach of fine-tuning.""") | |
with gr.Row(): | |
in_images = gr.File(label="Upload images to fine-tune for LORA", file_count="multiple") | |
#in_prompt = gr.Textbox(label="Enter a ") | |
in_steps = gr.Number(label="Enter number of steps") | |
in_alpha = gr.Slider(0.1,1.0, step=0.01, label="Set Alpha level - higher value has more chances to overfit") | |
with gr.Row(): | |
b1 = gr.Button(value="Train LORA model") | |
b2 = gr.Button(value="Inference using LORA model") | |
with gr.Row(): | |
in_prompt = gr.Textbox(label="Enter a prompt for fine-tuned LORA model", visible=True) | |
out_image = gr.Image(label="Image generated by LORA model") | |
out_file = gr.File(label="Lora trained model weights", ) | |
b1.click(fn = accelerate_train_lora, inputs=in_steps, outputs=out_file) | |
b2.click(fn = monkeypatching, inputs=[in_alpha, in_prompt], outputs=out_image) | |
demo.queue(concurrency_count=3) | |
demo.launch(debug=True, show_error=True) |