mirror of
https://github.com/justUmen/Bjornulf_custom_nodes.git
synced 2026-03-21 12:42:11 -03:00
497 lines
20 KiB
Python
497 lines
20 KiB
Python
import numpy as np
|
|
import scipy.ndimage as ndi
|
|
import torch
|
|
|
|
class BodyPartSelectorMask:
|
|
@classmethod
|
|
def INPUT_TYPES(cls):
|
|
return {
|
|
"required": {
|
|
"mask": ("MASK",),
|
|
"selection": (["head", "hands", "feet"],),
|
|
}
|
|
}
|
|
|
|
RETURN_TYPES = ("MASK",)
|
|
FUNCTION = "process"
|
|
CATEGORY = "Bjornulf"
|
|
|
|
def process_single(self, mask_np, selection):
|
|
"""
|
|
Process a single 2D mask to select head, hands, or feet based on position.
|
|
|
|
Args:
|
|
mask_np: 2D numpy array (H, W)
|
|
selection: str, one of "head", "hands", "feet"
|
|
|
|
Returns:
|
|
2D numpy array with selected shapes
|
|
"""
|
|
# Convert to binary mask
|
|
binary_mask = (mask_np > 0.5).astype(np.uint8)
|
|
|
|
# Label connected components
|
|
labeled_array, num_features = ndi.label(binary_mask)
|
|
if num_features < 5:
|
|
raise ValueError(f"Expected at least 5 components, found {num_features}")
|
|
|
|
# Compute sizes of all components (excluding background)
|
|
sizes = np.bincount(labeled_array.ravel())[1:]
|
|
# Select the five largest components
|
|
largest_indices = np.argsort(sizes)[-5:][::-1] # Top 5 in descending order
|
|
largest_labels = largest_indices + 1 # Map to label numbers (1-based)
|
|
|
|
# Compute centroids for the five largest components
|
|
centroids = []
|
|
for label in largest_labels:
|
|
positions = np.argwhere(labeled_array == label)
|
|
if len(positions) > 0:
|
|
centroid_row = positions[:, 0].mean() # Average row
|
|
centroid_col = positions[:, 1].mean() # Average column
|
|
centroids.append((label, centroid_row, centroid_col))
|
|
|
|
# Sort by centroid row (ascending, since row 0 is top)
|
|
centroids.sort(key=lambda x: x[1])
|
|
|
|
# Assign components based on vertical position
|
|
head_label = centroids[0][0] # Smallest row (top)
|
|
hand_labels = [centroids[1][0], centroids[2][0]] # Middle two
|
|
feet_labels = [centroids[3][0], centroids[4][0]] # Largest rows (bottom)
|
|
|
|
# Select labels based on user input
|
|
if selection == "head":
|
|
selected_labels = [head_label]
|
|
elif selection == "hands":
|
|
selected_labels = hand_labels
|
|
elif selection == "feet":
|
|
selected_labels = feet_labels
|
|
else:
|
|
raise ValueError("Selection must be 'head', 'hands', or 'feet'")
|
|
|
|
# Create new mask with selected components
|
|
new_mask = np.isin(labeled_array, selected_labels).astype(np.float32)
|
|
return new_mask
|
|
|
|
def process(self, mask, selection):
|
|
"""
|
|
Process the input mask(s) and return a new mask with selected parts.
|
|
|
|
Args:
|
|
mask: torch tensor, either 2D (H, W) or 3D (N, H, W)
|
|
selection: str, one of "head", "hands", "feet"
|
|
|
|
Returns:
|
|
Tuple containing the output mask tensor
|
|
"""
|
|
mask_np = mask.cpu().numpy()
|
|
|
|
if mask_np.ndim == 2:
|
|
# Single mask
|
|
result = self.process_single(mask_np, selection)
|
|
result = result[None, ...] # Add batch dimension: (1, H, W)
|
|
elif mask_np.ndim == 3:
|
|
# Batched masks
|
|
results = [self.process_single(mask_np[i], selection)
|
|
for i in range(mask_np.shape[0])]
|
|
result = np.stack(results, axis=0) # Stack to (N, H, W)
|
|
else:
|
|
raise ValueError("Mask must be 2D (H, W) or 3D (N, H, W)")
|
|
|
|
return (torch.from_numpy(result),)
|
|
class LargestMaskOnly:
|
|
@classmethod
|
|
def INPUT_TYPES(cls):
|
|
return {
|
|
"required": {
|
|
"mask": ("MASK",),
|
|
"num_masks": ("INT", {"default": 1, "min": 1, "max": 10}),
|
|
}
|
|
}
|
|
|
|
RETURN_TYPES = ("MASK",)
|
|
FUNCTION = "process"
|
|
CATEGORY = "Bjornulf"
|
|
|
|
def process_single(self, mask_np, num_masks):
|
|
"""Process a single mask to keep the top num_masks largest components."""
|
|
# Convert to binary mask
|
|
binary_mask = (mask_np > 0.5).astype(np.uint8)
|
|
# Label connected components
|
|
labeled_array, num_features = ndi.label(binary_mask)
|
|
|
|
if num_features > 0:
|
|
# Get sizes of all components, excluding background (label 0)
|
|
sizes = np.bincount(labeled_array.ravel())[1:]
|
|
# Determine how many components to keep
|
|
k = min(num_masks, num_features)
|
|
if k > 0:
|
|
# Get indices of the top k largest components (descending order)
|
|
top_indices = np.argsort(sizes)[::-1][:k]
|
|
# Map indices to labels (add 1 since sizes[1:] starts at label 1)
|
|
top_labels = top_indices + 1
|
|
# Create mask with only the top k components
|
|
largest_mask = np.isin(labeled_array, top_labels).astype(np.float32)
|
|
else:
|
|
largest_mask = np.zeros_like(binary_mask, dtype=np.float32)
|
|
else:
|
|
# No components found, return an empty mask
|
|
largest_mask = np.zeros_like(binary_mask, dtype=np.float32)
|
|
|
|
return largest_mask
|
|
|
|
def process(self, mask, num_masks):
|
|
"""Process the input mask(s) and return the top num_masks largest components."""
|
|
# Convert mask to numpy array
|
|
mask_np = mask.cpu().numpy()
|
|
|
|
if mask_np.ndim == 2:
|
|
# Single mask: process and add batch dimension
|
|
result = self.process_single(mask_np, num_masks)
|
|
result = result[None, ...] # Shape becomes (1, H, W)
|
|
elif mask_np.ndim == 3:
|
|
# Batched masks: process each mask independently
|
|
results = [self.process_single(mask_np[i], num_masks) for i in range(mask_np.shape[0])]
|
|
result = np.stack(results, axis=0) # Shape remains (N, H, W)
|
|
else:
|
|
raise ValueError("Invalid mask shape: expected 2D (H, W) or 3D (N, H, W)")
|
|
|
|
# Convert back to torch tensor and return as a tuple
|
|
return (torch.from_numpy(result),)
|
|
|
|
class BoundingRectangleMask:
|
|
@classmethod
|
|
def INPUT_TYPES(cls):
|
|
return {
|
|
"required": {
|
|
"mask": ("MASK",),
|
|
"up": ("INT", {"default": 0, "min": -10000, "max": 10000}),
|
|
"down": ("INT", {"default": 0, "min": -10000, "max": 10000}),
|
|
"right": ("INT", {"default": 0, "min": -10000, "max": 10000}),
|
|
"left": ("INT", {"default": 0, "min": -10000, "max": 10000}),
|
|
}
|
|
}
|
|
|
|
RETURN_TYPES = ("MASK",)
|
|
FUNCTION = "process"
|
|
CATEGORY = "Bjornulf"
|
|
|
|
def process_single(self, mask_np, up, down, right, left):
|
|
active = mask_np > 0.5
|
|
if not np.any(active):
|
|
return np.zeros_like(mask_np, dtype=np.float32)
|
|
|
|
rows_with_active = np.any(active, axis=1)
|
|
cols_with_active = np.any(active, axis=0)
|
|
min_row = np.where(rows_with_active)[0][0]
|
|
max_row = np.where(rows_with_active)[0][-1]
|
|
min_col = np.where(cols_with_active)[0][0]
|
|
max_col = np.where(cols_with_active)[0][-1]
|
|
|
|
min_row_adj = min_row - up
|
|
max_row_adj = max_row + down
|
|
min_col_adj = min_col - left
|
|
max_col_adj = max_col + right
|
|
|
|
H, W = mask_np.shape
|
|
min_row_adj = max(0, min_row_adj)
|
|
max_row_adj = min(H - 1, max_row_adj)
|
|
min_col_adj = max(0, min_col_adj)
|
|
max_col_adj = min(W - 1, max_col_adj)
|
|
|
|
if min_row_adj > max_row_adj or min_col_adj > max_col_adj:
|
|
return np.zeros_like(mask_np, dtype=np.float32)
|
|
|
|
new_mask = np.zeros_like(mask_np, dtype=np.float32)
|
|
new_mask[min_row_adj:max_row_adj + 1, min_col_adj:max_col_adj + 1] = 1.0
|
|
return new_mask
|
|
|
|
def process(self, mask, up, down, right, left):
|
|
mask_np = mask.cpu().numpy()
|
|
|
|
if mask_np.ndim == 2:
|
|
result = self.process_single(mask_np, up, down, right, left)
|
|
result = result[None, ...]
|
|
elif mask_np.ndim == 3:
|
|
results = [self.process_single(mask_np[i], up, down, right, left)
|
|
for i in range(mask_np.shape[0])]
|
|
result = np.stack(results, axis=0)
|
|
else:
|
|
raise ValueError("Mask must be 2D (H, W) or 3D (N, H, W)")
|
|
|
|
return (torch.from_numpy(result),)
|
|
|
|
class BoundingRectangleMaskBlur:
|
|
@classmethod
|
|
def INPUT_TYPES(cls):
|
|
return {
|
|
"required": {
|
|
"mask": ("MASK",),
|
|
"up": ("INT", {"default": 0, "min": -10000, "max": 10000}),
|
|
"down": ("INT", {"default": 0, "min": -10000, "max": 10000}),
|
|
"right": ("INT", {"default": 0, "min": -10000, "max": 10000}),
|
|
"left": ("INT", {"default": 0, "min": -10000, "max": 10000}),
|
|
"blur_up": ("FLOAT", {"default": 0.0, "min": 0.0, "max": 100.0, "step": 0.1}),
|
|
"blur_down": ("FLOAT", {"default": 0.0, "min": 0.0, "max": 100.0, "step": 0.1}),
|
|
"blur_left": ("FLOAT", {"default": 0.0, "min": 0.0, "max": 100.0, "step": 0.1}),
|
|
"blur_right": ("FLOAT", {"default": 0.0, "min": 0.0, "max": 100.0, "step": 0.1}),
|
|
"tapered_corners": ("BOOLEAN", {"default": True}),
|
|
}
|
|
}
|
|
|
|
RETURN_TYPES = ("MASK",)
|
|
FUNCTION = "process"
|
|
CATEGORY = "Bjornulf"
|
|
|
|
def _get_bounding_box(self, mask_np):
|
|
"""Extract bounding box coordinates from active mask pixels."""
|
|
active = mask_np > 0.5
|
|
if not np.any(active):
|
|
return None
|
|
|
|
rows_with_active = np.any(active, axis=1)
|
|
cols_with_active = np.any(active, axis=0)
|
|
|
|
min_row = np.where(rows_with_active)[0][0]
|
|
max_row = np.where(rows_with_active)[0][-1]
|
|
min_col = np.where(cols_with_active)[0][0]
|
|
max_col = np.where(cols_with_active)[0][-1]
|
|
|
|
return min_row, max_row, min_col, max_col
|
|
|
|
def _expand_bounding_box(self, bbox, up, down, left, right, shape):
|
|
"""Expand bounding box by specified amounts, clamped to image bounds."""
|
|
min_row, max_row, min_col, max_col = bbox
|
|
H, W = shape
|
|
|
|
min_row_adj = max(0, min_row - up)
|
|
max_row_adj = min(H - 1, max_row + down)
|
|
min_col_adj = max(0, min_col - left)
|
|
max_col_adj = min(W - 1, max_col + right)
|
|
|
|
# Check for invalid bounds
|
|
if min_row_adj > max_row_adj or min_col_adj > max_col_adj:
|
|
return None
|
|
|
|
return min_row_adj, max_row_adj, min_col_adj, max_col_adj
|
|
|
|
def _create_directional_blur_mask(self, mask, direction, blur_amount):
|
|
"""Create a mask blurred in one specific direction."""
|
|
if blur_amount <= 0:
|
|
return np.zeros_like(mask)
|
|
|
|
H, W = mask.shape
|
|
|
|
# Find the edge of the mask in the specified direction
|
|
mask_binary = mask > 0.5
|
|
if not np.any(mask_binary):
|
|
return np.zeros_like(mask)
|
|
|
|
# Create blur based on direction
|
|
if direction == 'up':
|
|
# Find top edge
|
|
top_rows = np.any(mask_binary, axis=1)
|
|
if not np.any(top_rows):
|
|
return np.zeros_like(mask)
|
|
top_edge = np.where(top_rows)[0][0]
|
|
|
|
# Create gradient going upward from top edge
|
|
result = np.zeros_like(mask)
|
|
for row in range(top_edge + 1):
|
|
distance = top_edge - row
|
|
strength = np.exp(-(distance ** 2) / (2 * blur_amount ** 2))
|
|
result[row, :] = strength * np.any(mask_binary[top_edge:, :], axis=0)
|
|
|
|
elif direction == 'down':
|
|
# Find bottom edge
|
|
top_rows = np.any(mask_binary, axis=1)
|
|
if not np.any(top_rows):
|
|
return np.zeros_like(mask)
|
|
bottom_edge = np.where(top_rows)[0][-1]
|
|
|
|
# Create gradient going downward from bottom edge
|
|
result = np.zeros_like(mask)
|
|
for row in range(bottom_edge, H):
|
|
distance = row - bottom_edge
|
|
strength = np.exp(-(distance ** 2) / (2 * blur_amount ** 2))
|
|
result[row, :] = strength * np.any(mask_binary[:bottom_edge+1, :], axis=0)
|
|
|
|
elif direction == 'left':
|
|
# Find left edge
|
|
left_cols = np.any(mask_binary, axis=0)
|
|
if not np.any(left_cols):
|
|
return np.zeros_like(mask)
|
|
left_edge = np.where(left_cols)[0][0]
|
|
|
|
# Create gradient going leftward from left edge
|
|
result = np.zeros_like(mask)
|
|
for col in range(left_edge + 1):
|
|
distance = left_edge - col
|
|
strength = np.exp(-(distance ** 2) / (2 * blur_amount ** 2))
|
|
result[:, col] = strength * np.any(mask_binary[:, left_edge:], axis=1)
|
|
|
|
elif direction == 'right':
|
|
# Find right edge
|
|
left_cols = np.any(mask_binary, axis=0)
|
|
if not np.any(left_cols):
|
|
return np.zeros_like(mask)
|
|
right_edge = np.where(left_cols)[0][-1]
|
|
|
|
# Create gradient going rightward from right edge
|
|
result = np.zeros_like(mask)
|
|
for col in range(right_edge, W):
|
|
distance = col - right_edge
|
|
strength = np.exp(-(distance ** 2) / (2 * blur_amount ** 2))
|
|
result[:, col] = strength * np.any(mask_binary[:, :right_edge+1], axis=1)
|
|
|
|
return result
|
|
|
|
def _create_corner_blend(self, mask, blur_up, blur_down, blur_left, blur_right):
|
|
"""Create smooth corner blending for diagonal blur combinations using individual blur values."""
|
|
H, W = mask.shape
|
|
result = np.zeros_like(mask)
|
|
|
|
# Find mask boundaries
|
|
mask_binary = mask > 0.5
|
|
if not np.any(mask_binary):
|
|
return result
|
|
|
|
rows_with_mask = np.any(mask_binary, axis=1)
|
|
cols_with_mask = np.any(mask_binary, axis=0)
|
|
|
|
if not np.any(rows_with_mask) or not np.any(cols_with_mask):
|
|
return result
|
|
|
|
top_edge = np.where(rows_with_mask)[0][0]
|
|
bottom_edge = np.where(rows_with_mask)[0][-1]
|
|
left_edge = np.where(cols_with_mask)[0][0]
|
|
right_edge = np.where(cols_with_mask)[0][-1]
|
|
|
|
# Create coordinate grids
|
|
y_coords, x_coords = np.mgrid[0:H, 0:W]
|
|
|
|
# Top-left corner
|
|
if blur_up > 0 and blur_left > 0:
|
|
# Calculate separate distances and strengths for each direction
|
|
dist_from_top = np.maximum(0, top_edge - y_coords)
|
|
dist_from_left = np.maximum(0, left_edge - x_coords)
|
|
|
|
# Calculate strength based on individual blur values
|
|
strength_top = np.exp(-(dist_from_top**2) / (2 * blur_up**2))
|
|
strength_left = np.exp(-(dist_from_left**2) / (2 * blur_left**2))
|
|
|
|
# Combine strengths multiplicatively for smooth corner transition
|
|
strength = strength_top * strength_left
|
|
|
|
# Only apply in the top-left quadrant
|
|
corner_mask = (y_coords <= top_edge) & (x_coords <= left_edge)
|
|
result = np.maximum(result, strength * corner_mask)
|
|
|
|
# Top-right corner
|
|
if blur_up > 0 and blur_right > 0:
|
|
dist_from_top = np.maximum(0, top_edge - y_coords)
|
|
dist_from_right = np.maximum(0, x_coords - right_edge)
|
|
|
|
strength_top = np.exp(-(dist_from_top**2) / (2 * blur_up**2))
|
|
strength_right = np.exp(-(dist_from_right**2) / (2 * blur_right**2))
|
|
strength = strength_top * strength_right
|
|
|
|
corner_mask = (y_coords <= top_edge) & (x_coords >= right_edge)
|
|
result = np.maximum(result, strength * corner_mask)
|
|
|
|
# Bottom-left corner
|
|
if blur_down > 0 and blur_left > 0:
|
|
dist_from_bottom = np.maximum(0, y_coords - bottom_edge)
|
|
dist_from_left = np.maximum(0, left_edge - x_coords)
|
|
|
|
strength_bottom = np.exp(-(dist_from_bottom**2) / (2 * blur_down**2))
|
|
strength_left = np.exp(-(dist_from_left**2) / (2 * blur_left**2))
|
|
strength = strength_bottom * strength_left
|
|
|
|
corner_mask = (y_coords >= bottom_edge) & (x_coords <= left_edge)
|
|
result = np.maximum(result, strength * corner_mask)
|
|
|
|
# Bottom-right corner
|
|
if blur_down > 0 and blur_right > 0:
|
|
dist_from_bottom = np.maximum(0, y_coords - bottom_edge)
|
|
dist_from_right = np.maximum(0, x_coords - right_edge)
|
|
|
|
strength_bottom = np.exp(-(dist_from_bottom**2) / (2 * blur_down**2))
|
|
strength_right = np.exp(-(dist_from_right**2) / (2 * blur_right**2))
|
|
strength = strength_bottom * strength_right
|
|
|
|
corner_mask = (y_coords >= bottom_edge) & (x_coords >= right_edge)
|
|
result = np.maximum(result, strength * corner_mask)
|
|
|
|
return result
|
|
|
|
def _apply_directional_blur(self, mask, blur_up, blur_down, blur_left, blur_right, tapered_corners):
|
|
"""Apply independent directional blur with optional smooth corner blending."""
|
|
result = mask.copy()
|
|
|
|
# Create blur masks for each direction
|
|
blur_masks = []
|
|
|
|
if blur_up > 0:
|
|
blur_masks.append(self._create_directional_blur_mask(mask, 'up', blur_up))
|
|
|
|
if blur_down > 0:
|
|
blur_masks.append(self._create_directional_blur_mask(mask, 'down', blur_down))
|
|
|
|
if blur_left > 0:
|
|
blur_masks.append(self._create_directional_blur_mask(mask, 'left', blur_left))
|
|
|
|
if blur_right > 0:
|
|
blur_masks.append(self._create_directional_blur_mask(mask, 'right', blur_right))
|
|
|
|
# Combine all blur masks with the original
|
|
for blur_mask in blur_masks:
|
|
result = np.maximum(result, blur_mask)
|
|
|
|
# Add smooth corner blending only if tapered_corners is enabled
|
|
if tapered_corners:
|
|
corner_blend = self._create_corner_blend(mask, blur_up, blur_down, blur_left, blur_right)
|
|
result = np.maximum(result, corner_blend)
|
|
|
|
return result
|
|
|
|
def process_single(self, mask_np, up, down, right, left, blur_up, blur_down, blur_left, blur_right, tapered_corners):
|
|
"""Process a single mask with bounding box expansion and directional blur."""
|
|
# Get bounding box of active pixels
|
|
bbox = self._get_bounding_box(mask_np)
|
|
if bbox is None:
|
|
return np.zeros_like(mask_np, dtype=np.float32)
|
|
|
|
# Expand bounding box
|
|
expanded_bbox = self._expand_bounding_box(bbox, up, down, left, right, mask_np.shape)
|
|
if expanded_bbox is None:
|
|
return np.zeros_like(mask_np, dtype=np.float32)
|
|
|
|
# Create base rectangular mask
|
|
min_row_adj, max_row_adj, min_col_adj, max_col_adj = expanded_bbox
|
|
new_mask = np.zeros_like(mask_np, dtype=np.float32)
|
|
new_mask[min_row_adj:max_row_adj + 1, min_col_adj:max_col_adj + 1] = 1.0
|
|
|
|
# Apply directional blur
|
|
new_mask = self._apply_directional_blur(new_mask, blur_up, blur_down, blur_left, blur_right, tapered_corners)
|
|
|
|
return new_mask
|
|
|
|
def process(self, mask, up, down, right, left, blur_up, blur_down, blur_left, blur_right, tapered_corners):
|
|
"""Main processing function supporting both 2D and 3D masks."""
|
|
mask_np = mask.cpu().numpy()
|
|
|
|
if mask_np.ndim == 2:
|
|
result = self.process_single(mask_np, up, down, right, left, blur_up, blur_down, blur_left, blur_right, tapered_corners)
|
|
result = result[None, ...]
|
|
elif mask_np.ndim == 3:
|
|
results = []
|
|
for i in range(mask_np.shape[0]):
|
|
single_result = self.process_single(
|
|
mask_np[i], up, down, right, left, blur_up, blur_down, blur_left, blur_right, tapered_corners
|
|
)
|
|
results.append(single_result)
|
|
result = np.stack(results, axis=0)
|
|
else:
|
|
raise ValueError("Mask must be 2D (H, W) or 3D (N, H, W)")
|
|
|
|
return (torch.from_numpy(result),) |