Spaces:

ds1david
/

sculpt

Runtime error

App Files Files Community

ds1david commited on Mar 18

Commit

a7111d1

1 Parent(s): 3920f5c

New logic

Browse files

Files changed (1) hide show

app.py +30 -15

app.py CHANGED Viewed

@@ -1,20 +1,26 @@
 import gradio as gr
 import torch
 import jax
 import numpy as np
 from PIL import Image
 import pickle
 from huggingface_hub import hf_hub_download
 from diffusers import StableDiffusionXLImg2ImgPipeline
-from transformers import DPTFeatureExtractor, DPTForDepthEstimation
-from model import build_thera  # Importar do código original do Thera
 # Configurar dispositivos
 JAX_DEVICE = jax.devices("cpu")[0]
 TORCH_DEVICE = "cpu"
-# 1. Carregar modelos do Thera ------------------------------------------------------------------
 def load_thera_model(repo_id, filename):
     model_path = hf_hub_download(repo_id=repo_id, filename=filename)
     with open(model_path, 'rb') as fh:
@@ -27,7 +33,7 @@ def load_thera_model(repo_id, filename):
 print("Carregando Thera EDSR...")
 model_edsr, params_edsr = load_thera_model("prs-eth/thera-edsr-pro", "model.pkl")
-# 2. Carregar SDXL + LoRA ----------------------------------------------------------------------
 print("Carregando SDXL + LoRA...")
 pipe = StableDiffusionXLImg2ImgPipeline.from_pretrained(
     "stabilityai/stable-diffusion-xl-base-1.0",
@@ -35,33 +41,36 @@ pipe = StableDiffusionXLImg2ImgPipeline.from_pretrained(
 ).to(TORCH_DEVICE)
 pipe.load_lora_weights("KappaNeuro/bas-relief", weight_name="BAS-RELIEF.safetensors")
-# 3. Carregar modelo de profundidade -----------------------------------------------------------
 print("Carregando DPT Depth...")
-feature_extractor = DPTFeatureExtractor.from_pretrained("Intel/dpt-large")
 depth_model = DPTForDepthEstimation.from_pretrained("Intel/dpt-large").to(TORCH_DEVICE)
-# Pipeline principal ---------------------------------------------------------------------------
 def full_pipeline(image, prompt, scale_factor=2.0):
     try:
         # 1. Super Resolução com Thera
-        source = np.array(image.convert("RGB")) / 255.0
         target_shape = (int(image.height * scale_factor), int(image.width * scale_factor))
-        # Converter para JAX array
         source_jax = jax.device_put(source, JAX_DEVICE)
         # Processar com Thera
         upscaled = model_edsr.apply(
             params_edsr,
             source_jax,
             target_shape,
             do_ensemble=True
         )
         upscaled_pil = Image.fromarray((np.array(upscaled) * 255).astype(np.uint8))
         # 2. Gerar Bas-Relief
-        full_prompt = f"BAS-RELIEF {prompt}, intricate carving, marble relief"
         bas_relief = pipe(
             prompt=full_prompt,
             image=upscaled_pil,
@@ -82,26 +91,32 @@ def full_pipeline(image, prompt, scale_factor=2.0):
             mode="bicubic"
         ).squeeze().cpu().numpy()
-        return upscaled_pil, bas_relief, (depth_map - depth_map.min()) / (depth_map.max() - depth_map.min())
     except Exception as e:
         raise gr.Error(f"Erro no processamento: {str(e)}")
-# Interface Gradio -----------------------------------------------------------------------------
 with gr.Blocks(title="Super Res + Bas-Relief") as app:
     gr.Markdown("## 🔍 Super Resolução + 🗿 Bas-Relief + 🗺️ Profundidade")
     with gr.Row():
         with gr.Column():
             img_input = gr.Image(type="pil", label="Imagem de Entrada")
-            prompt = gr.Textbox("insanely detailed and complex engraving relief, ultra-high definition, rich in detail, and 16K resolution.", label="Descrição")
             scale = gr.Slider(1.0, 4.0, value=2.0, label="Fator de Escala")
             btn = gr.Button("Processar")
         with gr.Column():
-            img_upscaled = gr.Image(label="Super Resolvida")
-            img_basrelief = gr.Image(label="Bas-Relief")
             img_depth = gr.Image(label="Mapa de Profundidade")
     btn.click(

 import gradio as gr
 import torch
 import jax
+import jax.numpy as jnp
 import numpy as np
 from PIL import Image
 import pickle
+import warnings
 from huggingface_hub import hf_hub_download
 from diffusers import StableDiffusionXLImg2ImgPipeline
+from transformers import DPTImageProcessor, DPTForDepthEstimation
+from model import build_thera
+# Configurações e supressão de avisos
+warnings.filterwarnings("ignore", category=FutureWarning)
+warnings.filterwarnings("ignore", category=UserWarning)
 # Configurar dispositivos
 JAX_DEVICE = jax.devices("cpu")[0]
 TORCH_DEVICE = "cpu"
+# 1. Carregar modelos do Thera ----------------------------------------------------------------
 def load_thera_model(repo_id, filename):
     model_path = hf_hub_download(repo_id=repo_id, filename=filename)
     with open(model_path, 'rb') as fh:
 print("Carregando Thera EDSR...")
 model_edsr, params_edsr = load_thera_model("prs-eth/thera-edsr-pro", "model.pkl")
+# 2. Carregar SDXL + LoRA ---------------------------------------------------------------------
 print("Carregando SDXL + LoRA...")
 pipe = StableDiffusionXLImg2ImgPipeline.from_pretrained(
     "stabilityai/stable-diffusion-xl-base-1.0",
 ).to(TORCH_DEVICE)
 pipe.load_lora_weights("KappaNeuro/bas-relief", weight_name="BAS-RELIEF.safetensors")
+# 3. Carregar modelo de profundidade ----------------------------------------------------------
 print("Carregando DPT Depth...")
+feature_extractor = DPTImageProcessor.from_pretrained("Intel/dpt-large")
 depth_model = DPTForDepthEstimation.from_pretrained("Intel/dpt-large").to(TORCH_DEVICE)
+# Pipeline principal --------------------------------------------------------------------------
 def full_pipeline(image, prompt, scale_factor=2.0):
     try:
         # 1. Super Resolução com Thera
+        image = image.convert("RGB")
+        source = np.array(image) / 255.0
         target_shape = (int(image.height * scale_factor), int(image.width * scale_factor))
+        # Preparar parâmetros para JAX
         source_jax = jax.device_put(source, JAX_DEVICE)
+        t = jnp.array([1.0 / (scale_factor ** 2)], dtype=jnp.float32)
         # Processar com Thera
         upscaled = model_edsr.apply(
             params_edsr,
             source_jax,
+            t,
             target_shape,
             do_ensemble=True
         )
         upscaled_pil = Image.fromarray((np.array(upscaled) * 255).astype(np.uint8))
         # 2. Gerar Bas-Relief
+        full_prompt = f"BAS-RELIEF {prompt}, insanely detailed and complex engraving relief, ultra-high definition, rich in detail, 16K resolution"
         bas_relief = pipe(
             prompt=full_prompt,
             image=upscaled_pil,
             mode="bicubic"
         ).squeeze().cpu().numpy()
+        depth_normalized = (depth_map - depth_map.min()) / (depth_map.max() - depth_map.min())
+        depth_pil = Image.fromarray((depth_normalized * 255).astype(np.uint8))
+        return upscaled_pil, bas_relief, depth_pil
     except Exception as e:
         raise gr.Error(f"Erro no processamento: {str(e)}")
+# Interface Gradio ----------------------------------------------------------------------------
 with gr.Blocks(title="Super Res + Bas-Relief") as app:
     gr.Markdown("## 🔍 Super Resolução + 🗿 Bas-Relief + 🗺️ Profundidade")
     with gr.Row():
         with gr.Column():
             img_input = gr.Image(type="pil", label="Imagem de Entrada")
+            prompt = gr.Textbox(
+                label="Descrição do Relevo",
+                value="insanely detailed and complex engraving relief, ultra-high definition, rich in detail, and 16K resolution."
+            )
             scale = gr.Slider(1.0, 4.0, value=2.0, label="Fator de Escala")
             btn = gr.Button("Processar")
         with gr.Column():
+            img_upscaled = gr.Image(label="Imagem Super Resolvida")
+            img_basrelief = gr.Image(label="Resultado Bas-Relief")
             img_depth = gr.Image(label="Mapa de Profundidade")
     btn.click(