Spaces:

NightRaven109
/

PBRGeneration

Running on Zero

App Files Files Community

NightRaven109 committed on Nov 23, 2024

Commit

5319ec3

verified ·

1 Parent(s): 1e0e767

Update app.py

Browse files

Files changed (1) hide show

app.py +145 -9

app.py CHANGED Viewed

@@ -12,6 +12,110 @@ model_configs = {
     'vitl': {'encoder': 'vitl', 'features': 256, 'out_channels': [256, 512, 1024, 1024]}
 }
 def get_image_intensity(img, gamma_correction=1.0):
     """
     Extract intensity map from an image using HSV color space
@@ -43,6 +147,34 @@ def blend_numpy_images(image1, image2, blend_factor=0.4, mode="normal"):
     blended = (blended * 255.0).clip(0, 255).astype(np.uint8)
     return blended
 # Initialize model globally
 def initialize_model():
     encoder = 'vitl'
@@ -73,10 +205,10 @@ MODEL = initialize_model()
 @spaces.GPU
 def process_image(input_image):
     """
-    Process the input image and return depth maps, intensity map, and blended result
     """
     if input_image is None:
-        return None, None, None, None
     # Move model to GPU for processing
     MODEL.to('cuda')
@@ -110,16 +242,19 @@ def process_image(input_image):
         mode="normal"
     )
-    return depth_normalized, depth_colormap, intensity_map, blended_result
 @spaces.GPU
 def gradio_interface(input_img):
     try:
-        depth_raw, depth_colored, intensity, blended = process_image(input_img)
-        return [input_img, depth_raw, depth_colored, intensity, blended]
     except Exception as e:
         print(f"Error processing image: {str(e)}")
-        return [input_img, None, None, None, None]
 # Define interface
 iface = gr.Interface(
@@ -130,10 +265,11 @@ iface = gr.Interface(
         gr.Image(label="Raw Depth Map"),
         gr.Image(label="Colored Depth Map"),
         gr.Image(label="Intensity Map"),
-        gr.Image(label="Blended (Depth + Intensity)")
     ],
-    title="Depth and Intensity Estimation",
-    description="Upload an image to generate its depth map, intensity map, and blended result.",
     examples=["image.jpg"]
 )

     'vitl': {'encoder': 'vitl', 'features': 256, 'out_channels': [256, 512, 1024, 1024]}
 }
+class NormalMapSimple:
+    """
+    Derive a normal-map image from the brightness gradients of an image batch.
+    Brightness is the mean of the first three channels; its horizontal and
+    vertical Scharr derivatives fill the first two output channels and the
+    third channel is set to 1 before the vectors are normalized.
+    """
+    @classmethod
+    def INPUT_TYPES(s):
+        """Return the input specification: an image batch and an XY scale factor."""
+        return {
+            "required": {
+                "images": ("IMAGE",),
+                "scale_XY": ("FLOAT",{"default": 1, "min": 0, "max": 100, "step": 0.001}),
+            },
+        }
+    RETURN_TYPES = ("IMAGE",)
+    FUNCTION = "normal_map"
+    CATEGORY = "image/filters"
+    def normal_map(self, images, scale_XY):
+        """
+        Compute a normal map for every image in ``images``.
+        Args:
+            images: torch tensor indexed as [batch, row, column, channel] with
+                at least three channels; it is copied, never modified.
+            scale_XY: multiplier applied to the two gradient channels before
+                normalization.
+        Returns:
+            A 1-tuple holding a float32 tensor of the same shape whose first
+            three channels are the unit-length vectors remapped with ``/ 2 + 0.5``.
+            Channels beyond the third are carried over from the input copy.
+        """
+        t = images.detach().clone().cpu().numpy().astype(np.float32)
+        # Per-pixel brightness: mean over the first three channels.
+        L = np.mean(t[:,:,:,:3], axis=3)
+        for i, lum in enumerate(L):
+            # The border mode must be passed by keyword: the fifth positional
+            # parameter of cv2.Scharr is ``dst``, so a positional
+            # cv2.BORDER_REFLECT would not set the border mode at all.
+            t[i,:,:,0] = cv2.Scharr(lum, -1, 1, 0, borderType=cv2.BORDER_REFLECT) * -1
+            t[i,:,:,1] = cv2.Scharr(lum, -1, 0, 1, borderType=cv2.BORDER_REFLECT)
+        t[:,:,:,2] = 1
+        t = torch.from_numpy(t)
+        t[:,:,:,:2] *= scale_XY
+        # Normalize to unit length, then remap from [-1, 1] to [0, 1].
+        t[:,:,:,:3] = torch.nn.functional.normalize(t[:,:,:,:3], dim=3) / 2 + 0.5
+        return (t,)
+class ConvertNormals:
+    """
+    Convert a batch of normal-map images between channel conventions.
+    The input is first rewritten into the "Standard" layout, optionally
+    repaired and rescaled, optionally re-normalized, and finally rewritten
+    into the requested output layout. Relative to "Standard", "BAE" has an
+    inverted red channel, "MiDaS" has red and blue swapped plus an inverted
+    red channel, and "DirectX" has an inverted green channel.
+    """
+    @classmethod
+    def INPUT_TYPES(s):
+        """Return the input specification for the conversion node."""
+        modes = ["BAE", "MiDaS", "Standard", "DirectX"]
+        scale_options = {"default": 1, "min": 0, "max": 100, "step": 0.001}
+        required = {
+            "normals": ("IMAGE",),
+            "input_mode": (list(modes),),
+            "output_mode": (list(modes),),
+            "scale_XY": ("FLOAT", scale_options),
+            "normalize": ("BOOLEAN", {"default": True}),
+            "fix_black": ("BOOLEAN", {"default": True}),
+        }
+        optional = {
+            "optional_fill": ("IMAGE",),
+        }
+        return {"required": required, "optional": optional}
+    RETURN_TYPES = ("IMAGE",)
+    FUNCTION = "convert_normals"
+    CATEGORY = "image/filters"
+    def convert_normals(self, normals, input_mode, output_mode, scale_XY, normalize, fix_black, optional_fill=None):
+        """
+        Convert ``normals`` from ``input_mode`` to ``output_mode``.
+        Args:
+            normals: tensor indexed as [batch, row, column, channel]; a
+                detached copy is edited, the argument itself is not.
+            input_mode / output_mode: one of "BAE", "MiDaS", "Standard",
+                "DirectX"; any other value leaves the channels as they are.
+            scale_XY: factor applied to the first two channels around 0.5.
+            normalize: when true, rescale each pixel vector to unit length.
+            fix_black: when true, add a fill to pixels whose third channel
+                is below 0.5, weighted by how far below it is.
+            optional_fill: image supplying the fill; when omitted a constant
+                (0.5, 0.5, 1) is used.
+        Returns:
+            A 1-tuple with the converted tensor. If any step raises, the
+            error is printed and the original ``normals`` is returned instead.
+        """
+        try:
+            out = normals.detach().clone()
+            # Step 1: rewrite the input into the Standard layout.
+            if input_mode == "DirectX":
+                out[:, :, :, 1] = 1 - out[:, :, :, 1]  # invert G
+            elif input_mode == "MiDaS":
+                # BGR -> RGB and invert R
+                swapped = [1 - out[:, :, :, 2], out[:, :, :, 1], out[:, :, :, 0]]
+                out[:, :, :, :3] = torch.stack(swapped, dim=3)
+            elif input_mode == "BAE":
+                out[:, :, :, 0] = 1 - out[:, :, :, 0]  # invert R
+            # Step 2: patch pixels whose third channel is below 0.5.
+            if fix_black:
+                mask = torch.clamp(1 - out[:, :, :, 2] * 2, min=0, max=1)
+                if optional_fill is not None:
+                    fill = optional_fill.detach().clone()
+                    # Resize the fill to the normals' spatial size if needed.
+                    if fill.shape[1:3] != out.shape[1:3]:
+                        channels_first = fill.movedim(-1, 1)
+                        resized = torch.nn.functional.interpolate(channels_first, size=(out.shape[1], out.shape[2]), mode='bilinear')
+                        fill = resized.movedim(1, -1)
+                    # Reuse the first fill image for every batch entry.
+                    if fill.shape[0] != out.shape[0]:
+                        fill = fill[0].unsqueeze(0).expand(out.shape[0], -1, -1, -1)
+                    weight = mask.unsqueeze(3).expand(-1, -1, -1, 3)
+                    out[:, :, :, :3] += fill[:, :, :, :3] * weight
+                else:
+                    out[:, :, :, 0] += mask * 0.5
+                    out[:, :, :, 1] += mask * 0.5
+                    out[:, :, :, 2] += mask
+            # Step 3: scale the first two channels around the 0.5 midpoint.
+            out[:, :, :, :2] = (out[:, :, :, :2] - 0.5) * scale_XY + 0.5
+            # Step 4: optional re-normalization in the [-1, 1] domain.
+            if normalize:
+                vec = out[:, :, :, :3] * 2 - 1
+                norm = torch.sqrt(torch.sum(vec**2, dim=3, keepdim=True))
+                # Floor the length so zero vectors do not divide by zero.
+                norm = torch.clamp(norm, min=1e-6)
+                vec = vec / norm
+                out[:, :, :, :3] = (vec + 1) / 2
+            # Step 5: rewrite from Standard into the requested output layout.
+            if output_mode == "DirectX":
+                out[:, :, :, 1] = 1 - out[:, :, :, 1]  # invert G
+            elif output_mode == "MiDaS":
+                # invert R and BGR -> RGB
+                swapped = [out[:, :, :, 2], out[:, :, :, 1], 1 - out[:, :, :, 0]]
+                out[:, :, :, :3] = torch.stack(swapped, dim=3)
+            elif output_mode == "BAE":
+                out[:, :, :, 0] = 1 - out[:, :, :, 0]  # invert R
+            return (out,)
+        except Exception as e:
+            print(f"Error in convert_normals: {str(e)}")
+            return (normals,)
 def get_image_intensity(img, gamma_correction=1.0):
     """
     Extract intensity map from an image using HSV color space
     blended = (blended * 255.0).clip(0, 255).astype(np.uint8)
     return blended
+def process_normal_map(image):
+    """
+    Process image through NormalMapSimple and ConvertNormals
+    Args:
+        image: array-like image scaled 0-255 (it is divided by 255.0 below),
+            either (rows, columns, channels) with at least three channels or
+            a 2-D grayscale array, which is replicated into three channels.
+    Returns:
+        uint8 numpy array holding the normal map converted from the
+        "Standard" to the "DirectX" convention.
+    """
+    pixels = np.asarray(image)
+    if pixels.ndim == 2:
+        # The normal-map classes index a trailing channel axis, so a plain
+        # grayscale image is expanded to three identical channels first.
+        pixels = np.stack([pixels] * 3, axis=-1)
+    # torch.from_numpy rejects negative-stride views (e.g. flipped images);
+    # ascontiguousarray is a no-op for arrays that are already contiguous.
+    pixels = np.ascontiguousarray(pixels)
+    # Convert numpy image to torch tensor with batch dimension
+    image_tensor = torch.from_numpy(pixels).unsqueeze(0).float() / 255.0
+    # Create instances of the classes
+    normal_map_generator = NormalMapSimple()
+    normal_converter = ConvertNormals()
+    # Generate initial normal map
+    normal_map = normal_map_generator.normal_map(image_tensor, scale_XY=1.0)[0]
+    # Convert normal map from Standard to DirectX
+    converted_normal = normal_converter.convert_normals(
+        normal_map,
+        input_mode="Standard",
+        output_mode="DirectX",
+        scale_XY=1.0,
+        normalize=True,
+        fix_black=True
+    )[0]
+    # Convert back to numpy array; clip so values that drift outside [0, 1]
+    # cannot wrap around in the uint8 cast.
+    scaled = converted_normal.squeeze(0).numpy() * 255
+    result = np.clip(scaled, 0, 255).astype(np.uint8)
+    return result
 # Initialize model globally
 def initialize_model():
     encoder = 'vitl'
 @spaces.GPU
 def process_image(input_image):
     """
+    Process the input image and return depth maps, intensity map, blended result, and normal map
     """
     if input_image is None:
+        return None, None, None, None, None
     # Move model to GPU for processing
     MODEL.to('cuda')
         mode="normal"
     )
+    # Generate normal map from blended result
+    normal_map = process_normal_map(blended_result)
+    return depth_normalized, depth_colormap, intensity_map, blended_result, normal_map
 @spaces.GPU
 def gradio_interface(input_img):
+    """
+    Run process_image on the input and return the values as a six-item list.
+    The list starts with the input image itself, followed by the five values
+    returned by process_image. If process_image raises, the error is printed
+    and the five result slots are filled with None.
+    """
     try:
+        depth_raw, depth_colored, intensity, blended, normal = process_image(input_img)
+        return [input_img, depth_raw, depth_colored, intensity, blended, normal]
     except Exception as e:
+        # Report the failure on stdout and still return a list of the same length.
         print(f"Error processing image: {str(e)}")
+        return [input_img, None, None, None, None, None]
 # Define interface
 iface = gr.Interface(
         gr.Image(label="Raw Depth Map"),
         gr.Image(label="Colored Depth Map"),
         gr.Image(label="Intensity Map"),
+        gr.Image(label="Blended (Depth + Intensity)"),
+        gr.Image(label="Normal Map")
     ],
+    title="Depth, Intensity, and Normal Map Estimation",
+    description="Upload an image to generate its depth map, intensity map, blended result, and normal map.",
     examples=["image.jpg"]
 )