Spaces:
Running on Zero
from typing import List

import numpy as np
import PIL
import PIL.Image
import PIL.ImageDraw
import PIL.ImageOps
import torch
import torchvision.transforms.functional as F
def multiply_grayscale_images(image1, image2):
    """Multiply two same-size grayscale PIL images element-wise.

    The product is normalized by 255 (the standard "multiply" blend), so
    white (255) is the identity and black (0) masks pixels out.  For the
    binary 0/255 masks used elsewhere in this file the result is identical
    to the raw clipped product, but intermediate gray values now combine
    correctly instead of saturating to white.

    Args:
        image1: grayscale (mode "L") PIL image.
        image2: grayscale PIL image of the same size.

    Returns:
        A new 8-bit grayscale PIL image containing the normalized product.
    """
    # float32 avoids uint8 overflow during the multiplication.
    a = np.asarray(image1, dtype=np.float32)
    b = np.asarray(image2, dtype=np.float32)
    product = a * b / 255.0
    product = np.clip(product, 0, 255).astype(np.uint8)
    return PIL.Image.fromarray(product)
def create_color_masks(image: PIL.Image.Image):
    """Split an RGB image into per-color element masks plus a background mask.

    Every distinct non-black color produces one binary mask; the mask
    covering the largest fraction of the image is treated as the background
    and excluded from the element list.  The returned background mask is
    white exactly where no element mask is set.

    Args:
        image: input PIL image; converted to RGB internally.

    Returns:
        (background_mask, elements) where background_mask is a mode-"L"
        PIL image and elements is a list of (color_str, mask_image) tuples,
        color_str being the "R_G_B" string of the element's color.
    """
    image = image.convert("RGB")
    image_np = np.array(image)  # H x W x 3

    # One (color_str, boolean mask) pair per distinct non-black color.
    unique_colors = np.unique(image_np.reshape(-1, 3), axis=0)
    masks = []
    for color in unique_colors:
        if not color.any():  # pure black is treated as "no color" and skipped
            continue
        mask = np.all(image_np == color, axis=-1)
        masks.append(('_'.join(map(str, color)), mask))

    # The mask with the largest covered area is assumed to be the background.
    background_index = -1
    if masks:
        areas = [mask.mean() for _, mask in masks]  # fraction of pixels set
        background_index = int(np.argmax(areas))

    elements = [
        (color_str, PIL.Image.fromarray(mask.astype(np.uint8) * 255))
        for idx, (color_str, mask) in enumerate(masks)
        if idx != background_index
    ]

    # Background = white minus every element mask.
    final_background_mask_image = PIL.Image.new("L", image.size, 255)
    for _, mask_image in elements:
        final_background_mask_image = multiply_grayscale_images(
            final_background_mask_image, PIL.ImageOps.invert(mask_image))
    return final_background_mask_image, elements
def create_text_masks(polygons, width, height):
    """Rasterize text polygons into binary masks.

    Args:
        polygons: iterable of flat coordinate lists [x0, y0, x1, y1, ...].
        width: width of each output mask in pixels.
        height: height of each output mask in pixels.

    Returns:
        List of mode-"L" PIL images, one per polygon, with the polygon
        filled white (255) on a black (0) background.
    """
    text_masks = []
    for polygon_coords in polygons:
        mask = PIL.Image.new('L', (width, height), 0)
        draw = PIL.ImageDraw.Draw(mask)
        # Pair the flat [x, y, x, y, ...] list into (x, y) tuples.
        polygon_points = list(zip(polygon_coords[0::2], polygon_coords[1::2]))
        draw.polygon(polygon_points, fill=255)
        text_masks.append(mask)
    return text_masks
class GetLayerMask:
    """ComfyUI node: split an image into background/element color-layer
    masks plus one mask per text polygon.

    NOTE(review): ``json_data`` was annotated ``str`` in the original but
    is iterated as a sequence of dicts with "polygon" and "label" keys --
    presumably already-parsed JSON; annotation adjusted to match usage.
    """

    @classmethod
    def INPUT_TYPES(cls):
        # ComfyUI invokes this on the class with no argument, so it must
        # be a classmethod (the original bare ``def INPUT_TYPES(s)`` would
        # raise a missing-argument TypeError).
        return {
            "required": {
                "image": ("IMAGE",),
                "json_data": ("JSON",),
            },
        }

    RETURN_TYPES = ("MASK", "MASK", "JSON")
    FUNCTION = "main"
    CATEGORY = "tensorops"

    def main(self, image: torch.Tensor, json_data):
        """Build layer masks from *image* and text masks from *json_data*.

        Args:
            image: image batch, assumed (B, H, W, C) as ComfyUI provides
                -- TODO confirm; only the first image in the batch is used.
            json_data: sequence of dicts with "polygon" (flat coordinate
                list) and "label" keys.

        Returns:
            (layer_masks, text_masks, labels): stacked background+element
            masks, stacked per-polygon masks, and the list of labels.
        """
        # (B, H, W, C) -> (B, C, H, W) so torchvision can build a PIL image.
        image_pil = F.to_pil_image(image.permute(0, 3, 1, 2)[0])
        bg, elements = create_color_masks(image_pil)

        # Collect polygons/labels from the (already parsed) JSON payload.
        polygons = [item["polygon"] for item in json_data]
        labels = [item["label"] for item in json_data]

        def to_tensor(mask_image):
            # Normalize an 8-bit mask image to a float tensor in [0, 1]
            # with a leading batch dimension.
            arr = np.array(mask_image).astype(np.float32) / 255.0
            return torch.from_numpy(arr)[None,]

        width, height = bg.size
        text_masks = [to_tensor(m)
                      for m in create_text_masks(polygons, width, height)]
        if text_masks:
            text_tensor = torch.cat(text_masks, dim=0)
        else:
            # Guard the no-polygon case: torch.cat([]) would raise.
            text_tensor = torch.zeros((0, height, width), dtype=torch.float32)

        layers = [to_tensor(bg)] + [to_tensor(m) for _, m in elements]
        return (torch.cat(layers, dim=0), text_tensor, labels)