Spaces:

radames
/

Enhance-This-HiDiffusion-SDXL

Running on Zero

App Files Files Community

radames commited on May 8, 2024

Commit

b212cf7

1 Parent(s): a080665

sobel

Browse files

Files changed (2) hide show

app.py +3 -7
canny_gpu.py +117 -0

app.py CHANGED Viewed

@@ -8,12 +8,11 @@ from diffusers import (
     StableDiffusionXLControlNetImg2ImgPipeline,
     DDIMScheduler,
 )
 from compel import Compel, ReturnedEmbeddingsType
 from PIL import Image
 import os
 import time
-import cv2
 import numpy as np
 IS_SPACES_ZERO = os.environ.get("SPACES_ZERO_GPU", "0") == "1"
@@ -64,6 +63,7 @@ if not IS_SPACES_ZERO:
     # pipe.enable_xformers_memory_efficient_attention()
     pipe.enable_model_cpu_offload()
 pipe.enable_vae_tiling()
 def pad_image(image):
@@ -106,11 +106,7 @@ def predict(
     conditioning, pooled = compel([prompt, negative_prompt])
     generator = torch.manual_seed(seed)
     last_time = time.time()
-    canny_image = np.array(padded_image)
-    canny_image = cv2.Canny(canny_image, 100, 200)
-    canny_image = canny_image[:, :, None]
-    canny_image = np.concatenate([canny_image, canny_image, canny_image], axis=2)
-    canny_image = Image.fromarray(canny_image)
     images = pipe(
         image=padded_image,
         control_image=canny_image,

     StableDiffusionXLControlNetImg2ImgPipeline,
     DDIMScheduler,
 )
+from canny_gpu import SobelOperator
 from compel import Compel, ReturnedEmbeddingsType
 from PIL import Image
 import os
 import time
 import numpy as np
 IS_SPACES_ZERO = os.environ.get("SPACES_ZERO_GPU", "0") == "1"
     # pipe.enable_xformers_memory_efficient_attention()
     pipe.enable_model_cpu_offload()
 pipe.enable_vae_tiling()
+canny_torch = SobelOperator(device=device)
 def pad_image(image):
     conditioning, pooled = compel([prompt, negative_prompt])
     generator = torch.manual_seed(seed)
     last_time = time.time()
+    canny_image = canny_torch(padded_image, 0.01, 0.2)
     images = pipe(
         image=padded_image,
         control_image=canny_image,

canny_gpu.py ADDED Viewed

	@@ -0,0 +1,117 @@

+import torch
+import torch.nn as nn
+from torchvision.transforms import ToTensor, ToPILImage
+from PIL import Image
+class SobelOperator(nn.Module):
+    SOBEL_KERNEL_X = torch.tensor(
+        [[-1.0, 0.0, 1.0], [-2.0, 0.0, 2.0], [-1.0, 0.0, 1.0]]
+    )
+    SOBEL_KERNEL_Y = torch.tensor(
+        [[-1.0, -2.0, -1.0], [0.0, 0.0, 0.0], [1.0, 2.0, 1.0]]
+    )
+    def __init__(self, device="cuda"):
+        super(SobelOperator, self).__init__()
+        self.device = device
+        self.edge_conv_x = nn.Conv2d(1, 1, kernel_size=3, padding=1, bias=False).to(
+            self.device
+        )
+        self.edge_conv_y = nn.Conv2d(1, 1, kernel_size=3, padding=1, bias=False).to(
+            self.device
+        )
+        self.edge_conv_x.weight = nn.Parameter(
+            self.SOBEL_KERNEL_X.view((1, 1, 3, 3)).to(self.device)
+        )
+        self.edge_conv_y.weight = nn.Parameter(
+            self.SOBEL_KERNEL_Y.view((1, 1, 3, 3)).to(self.device)
+        )
+    @torch.no_grad()
+    def forward(
+        self,
+        image: Image.Image,
+        low_threshold: float,
+        high_threshold: float,
+        output_type="pil",
+    ) -> Image.Image | torch.Tensor | tuple[Image.Image, torch.Tensor]:
+        # Convert PIL image to PyTorch tensor
+        image_gray = image.convert("L")
+        image_tensor = ToTensor()(image_gray).unsqueeze(0).to(self.device)
+        # Compute gradients
+        edge_x = self.edge_conv_x(image_tensor)
+        edge_y = self.edge_conv_y(image_tensor)
+        edge = torch.sqrt(torch.square(edge_x) + torch.square(edge_y))
+        # Apply thresholding
+        edge.div_(edge.max())  # Normalize to 0-1 (in-place operation)
+        edge[edge >= high_threshold] = 1.0
+        edge[edge <= low_threshold] = 0.0
+        # Convert the result back to a PIL image
+        if output_type == "pil":
+            return ToPILImage()(edge.squeeze(0).cpu())
+        elif output_type == "tensor":
+            return edge
+        elif output_type == "pil,tensor":
+            return ToPILImage()(edge.squeeze(0).cpu()), edge
+class ScharrOperator(nn.Module):
+    SCHARR_KERNEL_X = torch.tensor(
+        [[-3.0, 0.0, 3.0], [-10.0, 0.0, 10.0], [-3.0, 0.0, 3.0]]
+    )
+    SCHARR_KERNEL_Y = torch.tensor(
+        [[-3.0, -10.0, -3.0], [0.0, 0.0, 0.0], [3.0, 10.0, 3.0]]
+    )
+    def __init__(self, device="cuda"):
+        super(ScharrOperator, self).__init__()
+        self.device = device
+        self.edge_conv_x = nn.Conv2d(1, 1, kernel_size=3, padding=1, bias=False).to(
+            self.device
+        )
+        self.edge_conv_y = nn.Conv2d(1, 1, kernel_size=3, padding=1, bias=False).to(
+            self.device
+        )
+        self.edge_conv_x.weight = nn.Parameter(
+            self.SCHARR_KERNEL_X.view((1, 1, 3, 3)).to(self.device)
+        )
+        self.edge_conv_y.weight = nn.Parameter(
+            self.SCHARR_KERNEL_Y.view((1, 1, 3, 3)).to(self.device)
+        )
+    @torch.no_grad()
+    def forward(
+        self,
+        image: Image.Image,
+        low_threshold: float,
+        high_threshold: float,
+        output_type="pil",
+        invert: bool = False,
+    ) -> Image.Image | torch.Tensor | tuple[Image.Image, torch.Tensor]:
+        # Convert PIL image to PyTorch tensor
+        image_gray = image.convert("L")
+        image_tensor = ToTensor()(image_gray).unsqueeze(0).to(self.device)
+        # Compute gradients
+        edge_x = self.edge_conv_x(image_tensor)
+        edge_y = self.edge_conv_y(image_tensor)
+        edge = torch.abs(edge_x) + torch.abs(edge_y)
+        # Apply thresholding
+        edge.div_(edge.max())  # Normalize to 0-1 (in-place operation)
+        edge[edge >= high_threshold] = 1.0
+        edge[edge <= low_threshold] = 0.0
+        if invert:
+            edge = 1 - edge
+        # Convert the result back to a PIL image
+        if output_type == "pil":
+            return ToPILImage()(edge.squeeze(0).cpu())
+        elif output_type == "tensor":
+            return edge
+        elif output_type == "pil,tensor":
+            return ToPILImage()(edge.squeeze(0).cpu()), edge