Spaces:

ds1david
/

sculpt

Runtime error

App Files Community

ds1david committed on Mar 18

Commit

3920f5c

1 Parent(s): 1eb87a5

New logic

Browse files

Files changed (2) hide show

app.py +77 -55
requirements.txt +2 -0

app.py CHANGED Viewed

@@ -3,83 +3,105 @@ import torch
 import jax
 import numpy as np
 from PIL import Image
 from diffusers import StableDiffusionXLImg2ImgPipeline
 from transformers import DPTFeatureExtractor, DPTForDepthEstimation
-from super_resolve import process as thera_process  # Assume imports do Thera
-# Configurações
-DEVICE = "cpu"  # ou "cuda" se disponível
-JAX_DEVICE = jax.devices("cpu")[0]  # Usar CPU para JAX
-# 1. Carregar modelos do Thera (EDSR/RDN)
-# (Implementar conforme código original do Thera)
-model_edsr, params_edsr = None, None  # Carregar usando pickle/HF Hub
-# 2. Carregar SDXL Img2Img + LoRA
-print("Carregando SDXL Img2Img com LoRA...")
 pipe = StableDiffusionXLImg2ImgPipeline.from_pretrained(
     "stabilityai/stable-diffusion-xl-base-1.0",
     torch_dtype=torch.float32
-).to(DEVICE)
 pipe.load_lora_weights("KappaNeuro/bas-relief", weight_name="BAS-RELIEF.safetensors")
-# 3. Carregar modelo de profundidade
-print("Carregando DPT...")
 feature_extractor = DPTFeatureExtractor.from_pretrained("Intel/dpt-large")
-depth_model = DPTForDepthEstimation.from_pretrained("Intel/dpt-large").to(DEVICE)
-def enhance_depth_map(depth_arr):
-    depth_normalized = (depth_arr - depth_arr.min()) / (depth_arr.max() - depth_arr.min() + 1e-8)
-    return Image.fromarray((depth_normalized * 255).astype(np.uint8))
 def full_pipeline(image, prompt, scale_factor=2.0):
-    # 1. Super Resolução com Thera
-    source = np.array(image) / 255.0
-    target_shape = (int(image.height * scale_factor), int(image.width * scale_factor))
-    upscaled = thera_process(source, model_edsr, params_edsr, target_shape, do_ensemble=True)
-    upscaled_pil = Image.fromarray((upscaled * 255).astype(np.uint8))
-    # 2. Gerar Bas-Relief com SDXL Img2Img
-    full_prompt = f"BAS-RELIEF {prompt}, intricate carving, marble relief"
-    bas_relief = pipe(
-        prompt=full_prompt,
-        image=upscaled_pil,
-        strength=0.7,
-        num_inference_steps=25,
-        guidance_scale=7.5
-    ).images[0]
-    # 3. Calcular Depth Map
-    inputs = feature_extractor(bas_relief, return_tensors="pt").to(DEVICE)
-    with torch.no_grad():
-        outputs = depth_model(**inputs)
-        depth = outputs.predicted_depth
-    depth_map = torch.nn.functional.interpolate(
-        depth.unsqueeze(1),
-        size=bas_relief.size[::-1],
-        mode="bicubic"
-    ).squeeze().cpu().numpy()
-    return upscaled_pil, bas_relief, enhance_depth_map(depth_map)
-# Interface Gradio
-with gr.Blocks(title="Super Resolução + Bas-Relief") as app:
-    gr.Markdown("## 📈 Super Resolução + 🗿 Bas-Relief + 🗺️ Mapa de Profundidade")
     with gr.Row():
         with gr.Column():
             img_input = gr.Image(type="pil", label="Imagem de Entrada")
-            prompt = gr.Textbox("ancient sculpture, marble", label="Descrição do Relevo")
             scale = gr.Slider(1.0, 4.0, value=2.0, label="Fator de Escala")
             btn = gr.Button("Processar")
         with gr.Column():
-            img_upscaled = gr.Image(label="Imagem Super Resolvida")
-            img_basrelief = gr.Image(label="Relevo Escultural")
             img_depth = gr.Image(label="Mapa de Profundidade")
     btn.click(

 import jax
 import numpy as np
 from PIL import Image
+import pickle
+from huggingface_hub import hf_hub_download
 from diffusers import StableDiffusionXLImg2ImgPipeline
 from transformers import DPTFeatureExtractor, DPTForDepthEstimation
+from model import build_thera  # Importar do código original do Thera
+# Configurar dispositivos
+JAX_DEVICE = jax.devices("cpu")[0]
+TORCH_DEVICE = "cpu"
+# 1. Carregar modelos do Thera ------------------------------------------------------------------
+def load_thera_model(repo_id, filename):
+    model_path = hf_hub_download(repo_id=repo_id, filename=filename)
+    with open(model_path, 'rb') as fh:
+        check = pickle.load(fh)
+        params, backbone, size = check['model'], check['backbone'], check['size']
+    model = build_thera(3, backbone, size)
+    return model, params
+print("Carregando Thera EDSR...")
+model_edsr, params_edsr = load_thera_model("prs-eth/thera-edsr-pro", "model.pkl")
+# 2. Carregar SDXL + LoRA ----------------------------------------------------------------------
+print("Carregando SDXL + LoRA...")
 pipe = StableDiffusionXLImg2ImgPipeline.from_pretrained(
     "stabilityai/stable-diffusion-xl-base-1.0",
     torch_dtype=torch.float32
+).to(TORCH_DEVICE)
 pipe.load_lora_weights("KappaNeuro/bas-relief", weight_name="BAS-RELIEF.safetensors")
+# 3. Carregar modelo de profundidade -----------------------------------------------------------
+print("Carregando DPT Depth...")
 feature_extractor = DPTFeatureExtractor.from_pretrained("Intel/dpt-large")
+depth_model = DPTForDepthEstimation.from_pretrained("Intel/dpt-large").to(TORCH_DEVICE)
+# Pipeline principal ---------------------------------------------------------------------------
 def full_pipeline(image, prompt, scale_factor=2.0):
+    try:
+        # 1. Super Resolução com Thera
+        source = np.array(image.convert("RGB")) / 255.0
+        target_shape = (int(image.height * scale_factor), int(image.width * scale_factor))
+        # Converter para JAX array
+        source_jax = jax.device_put(source, JAX_DEVICE)
+        # Processar com Thera
+        upscaled = model_edsr.apply(
+            params_edsr,
+            source_jax,
+            target_shape,
+            do_ensemble=True
+        )
+        upscaled_pil = Image.fromarray((np.array(upscaled) * 255).astype(np.uint8))
+        # 2. Gerar Bas-Relief
+        full_prompt = f"BAS-RELIEF {prompt}, intricate carving, marble relief"
+        bas_relief = pipe(
+            prompt=full_prompt,
+            image=upscaled_pil,
+            strength=0.7,
+            num_inference_steps=25,
+            guidance_scale=7.5
+        ).images[0]
+        # 3. Calcular Depth Map
+        inputs = feature_extractor(bas_relief, return_tensors="pt").to(TORCH_DEVICE)
+        with torch.no_grad():
+            outputs = depth_model(**inputs)
+            depth = outputs.predicted_depth
+        depth_map = torch.nn.functional.interpolate(
+            depth.unsqueeze(1),
+            size=bas_relief.size[::-1],
+            mode="bicubic"
+        ).squeeze().cpu().numpy()
+        return upscaled_pil, bas_relief, (depth_map - depth_map.min()) / (depth_map.max() - depth_map.min())
+    except Exception as e:
+        raise gr.Error(f"Erro no processamento: {str(e)}")
+# Interface Gradio -----------------------------------------------------------------------------
+with gr.Blocks(title="Super Res + Bas-Relief") as app:
+    gr.Markdown("## 🔍 Super Resolução + 🗿 Bas-Relief + 🗺️ Profundidade")
     with gr.Row():
         with gr.Column():
             img_input = gr.Image(type="pil", label="Imagem de Entrada")
+            prompt = gr.Textbox("insanely detailed and complex engraving relief, ultra-high definition, rich in detail, and 16K resolution.", label="Descrição")
             scale = gr.Slider(1.0, 4.0, value=2.0, label="Fator de Escala")
             btn = gr.Button("Processar")
         with gr.Column():
+            img_upscaled = gr.Image(label="Super Resolvida")
+            img_basrelief = gr.Image(label="Bas-Relief")
             img_depth = gr.Image(label="Mapa de Profundidade")
     btn.click(

requirements.txt CHANGED Viewed

@@ -7,6 +7,7 @@ diffusers
 einops==0.6.1
 flax==0.6.10
 flaxmodels==0.1.3
 jax==0.4.11
 jaxlib==0.4.11+cuda11.cudnn86
 jaxtyping==0.2.20
@@ -24,6 +25,7 @@ opt-einsum==3.3.0
 optax==0.2.0
 orbax-checkpoint==0.2.4
 peft
 scipy==1.10.1
 timm==0.9.6
 torch

 einops==0.6.1
 flax==0.6.10
 flaxmodels==0.1.3
+huggingface_hub
 jax==0.4.11
 jaxlib==0.4.11+cuda11.cudnn86
 jaxtyping==0.2.20
 optax==0.2.0
 orbax-checkpoint==0.2.4
 peft
+pillow
 scipy==1.10.1
 timm==0.9.6
 torch