InvokeAI/invokeai/app/invocations/mask.py

import numpy as np
import torch
from PIL import Image

from invokeai.app.invocations.baseinvocation import BaseInvocation, Classification, InvocationContext, invocation
from invokeai.app.invocations.fields import ImageField, InputField, TensorField, WithBoard, WithMetadata
from invokeai.app.invocations.primitives import ImageOutput, MaskOutput


@invocation(
    "rectangle_mask",
    title="Create Rectangle Mask",
    tags=["conditioning"],
    category="conditioning",
    version="1.0.1",
)
class RectangleMaskInvocation(BaseInvocation, WithMetadata):
    """Create a rectangular mask."""

    # The output is a boolean tensor of shape (1, height, width): True inside the rectangle, False elsewhere.
    # Any part of the rectangle that lies outside the mask bounds is clipped.

    width: int = InputField(description="The width of the entire mask.")
    height: int = InputField(description="The height of the entire mask.")
    x_left: int = InputField(description="The left x-coordinate of the rectangular masked region (inclusive).")
    y_top: int = InputField(description="The top y-coordinate of the rectangular masked region (inclusive).")
    rectangle_width: int = InputField(description="The width of the rectangular masked region.")
    rectangle_height: int = InputField(description="The height of the rectangular masked region.")

    def invoke(self, context: InvocationContext) -> MaskOutput:
        """Build the mask tensor, save it through the context, and return a reference to it.

        Returns:
            A MaskOutput holding the saved tensor's name together with the full mask width and height.
        """
        mask = torch.zeros((1, self.height, self.width), dtype=torch.bool)

        # Clamp every bound at 0. A negative slice bound is interpreted relative to the END of the axis, so
        # without clamping a rectangle that starts (or ends) off the top/left edge would wrap around and
        # select the wrong region, or nothing at all. Bounds past the bottom/right edge need no handling:
        # slicing already truncates them.
        top = max(self.y_top, 0)
        bottom = max(self.y_top + self.rectangle_height, 0)
        left = max(self.x_left, 0)
        right = max(self.x_left + self.rectangle_width, 0)
        mask[:, top:bottom, left:right] = True

        mask_tensor_name = context.tensors.save(mask)
        return MaskOutput(
            mask=TensorField(tensor_name=mask_tensor_name),
            width=self.width,
            height=self.height,
        )


@invocation(
    "alpha_mask_to_tensor",
    title="Alpha Mask to Tensor",
    tags=["conditioning"],
    category="conditioning",
    version="1.0.0",
    classification=Classification.Beta,
)
class AlphaMaskToTensorInvocation(BaseInvocation):
    """Convert a mask image to a tensor. Opaque regions are 1 and transparent regions are 0."""

    image: ImageField = InputField(description="The mask image to convert.")
    invert: bool = InputField(default=False, description="Whether to invert the mask.")

    def invoke(self, context: InvocationContext) -> MaskOutput:
        """Threshold the image's alpha channel into a boolean mask of shape (1, height, width).

        A pixel is True when its alpha is greater than 0, or, when `invert` is set, when its alpha is
        exactly 0.

        Returns:
            A MaskOutput referencing the saved mask tensor, with the mask's height and width.
        """
        # Request RGBA explicitly so that channel index 3 is always the alpha channel. Without this, an image
        # stored without an alpha channel (e.g. RGB or grayscale) has no index 3 and the lookup below fails.
        image = context.images.get_pil(self.image.image_name, mode="RGBA")

        # Convert to an array once and reuse it for whichever comparison is needed.
        alpha = np.array(image)[:, :, 3]
        selected = alpha == 0 if self.invert else alpha > 0

        mask = torch.zeros((1, image.height, image.width), dtype=torch.bool)
        mask[0] = torch.tensor(selected, dtype=torch.bool)

        return MaskOutput(
            mask=TensorField(tensor_name=context.tensors.save(mask)),
            height=mask.shape[1],
            width=mask.shape[2],
        )


@invocation(
    "invert_tensor_mask",
    title="Invert Tensor Mask",
    tags=["conditioning"],
    category="conditioning",
    version="1.0.0",
    classification=Classification.Beta,
)
class InvertTensorMaskInvocation(BaseInvocation):
    """Inverts a tensor mask."""

    mask: TensorField = InputField(description="The tensor mask to convert.")

    def invoke(self, context: InvocationContext) -> MaskOutput:
        """Load the referenced tensor, apply `~` to it, and save the result as a new mask.

        Returns:
            A MaskOutput referencing the saved tensor; height and width are taken from dimensions 1 and 2
            of the result.
        """
        source = context.tensors.load(self.mask.tensor_name)

        # NOTE(review): `~` is an element-wise NOT; this presumably expects a boolean mask, which is
        # what makes it a True/False swap. Confirm that callers never pass other dtypes.
        flipped = ~source

        saved_name = context.tensors.save(flipped)
        rows = flipped.shape[1]
        cols = flipped.shape[2]
        return MaskOutput(mask=TensorField(tensor_name=saved_name), height=rows, width=cols)


@invocation(
    "image_mask_to_tensor",
    title="Image Mask to Tensor",
    tags=["conditioning"],
    category="conditioning",
    version="1.0.0",
)
class ImageMaskToTensorInvocation(BaseInvocation, WithMetadata):
    """Convert a mask image to a tensor. Converts the image to grayscale and uses thresholding at the specified value."""

    image: ImageField = InputField(description="The mask image to convert.")
    cutoff: int = InputField(ge=0, le=255, description="Cutoff (<)", default=128)
    invert: bool = InputField(default=False, description="Whether to invert the mask.")

    def invoke(self, context: InvocationContext) -> MaskOutput:
        """Threshold the grayscale image into a boolean mask of shape (1, height, width).

        Pixels strictly below `cutoff` are True; with `invert` set, pixels at or above `cutoff` are True
        instead.

        Returns:
            A MaskOutput referencing the saved mask tensor, with the mask's height and width.
        """
        grayscale = np.array(context.images.get_pil(self.image.image_name, mode="L"))

        if self.invert:
            selected = grayscale >= self.cutoff
        else:
            selected = grayscale < self.cutoff

        # Add the leading channel dimension so the stored mask is (1, H, W).
        mask = torch.tensor(selected, dtype=torch.bool).unsqueeze(0)
        saved_name = context.tensors.save(mask)

        return MaskOutput(
            mask=TensorField(tensor_name=saved_name),
            height=mask.shape[1],
            width=mask.shape[2],
        )


@invocation(
    "tensor_mask_to_image",
    title="Tensor Mask to Image",
    tags=["mask"],
    category="mask",
    version="1.0.0",
)
class MaskTensorToImageInvocation(BaseInvocation, WithMetadata, WithBoard):
    """Convert a mask tensor to an image."""

    mask: TensorField = InputField(description="The mask tensor to convert.")

    def invoke(self, context: InvocationContext) -> ImageOutput:
        """Render the mask as an 8-bit grayscale image (0 for False, 255 for True) and save it.

        Accepts either a 2-D (height, width) mask or a 3-D mask with a leading singleton channel
        dimension. Non-boolean masks are binarized at 0.5 first.

        Returns:
            An ImageOutput built from the saved image.
        """
        mask = context.tensors.load(self.mask.tensor_name)

        # Drop a leading channel dimension if present: a mode "L" image must be built from a 2-D array,
        # so a (1, H, W) mask would otherwise be rejected by Image.fromarray.
        if mask.dim() == 3:
            mask = mask.squeeze(0)

        # Ensure that the mask is binary.
        if mask.dtype != torch.bool:
            mask = mask > 0.5
        mask_np = (mask.float() * 255).byte().cpu().numpy()

        mask_pil = Image.fromarray(mask_np, mode="L")
        image_dto = context.images.save(image=mask_pil)
        return ImageOutput.build(image_dto)
feat(nodes): add alpha mask to tensor invocation 2024-04-09 10:27:03 +00:00			`import numpy as np`
Add RectangleMaskInvocation. 2024-03-08 15:30:55 +00:00			`import torch`
Return a MaskOutput from SegmentAnythingModelInvocation. And add a MaskTensorToImageInvocation. 2024-07-31 21:15:48 +00:00			`from PIL import Image`
Add RectangleMaskInvocation. 2024-03-08 15:30:55 +00:00
feat(nodes): add beta classification to mask tensor nodes 2024-04-19 13:00:44 +00:00			`from invokeai.app.invocations.baseinvocation import BaseInvocation, Classification, InvocationContext, invocation`
Return a MaskOutput from SegmentAnythingModelInvocation. And add a MaskTensorToImageInvocation. 2024-07-31 21:15:48 +00:00			`from invokeai.app.invocations.fields import ImageField, InputField, TensorField, WithBoard, WithMetadata`
			`from invokeai.app.invocations.primitives import ImageOutput, MaskOutput`
Add RectangleMaskInvocation. 2024-03-08 15:30:55 +00:00

			`@invocation(`
			`"rectangle_mask",`
			`title="Create Rectangle Mask",`
			`tags=["conditioning"],`
			`category="conditioning",`
Fix field ordering Changed fields to go in w/h x/y order. 2024-04-09 19:17:55 +00:00			`version="1.0.1",`
Add RectangleMaskInvocation. 2024-03-08 15:30:55 +00:00			`)`
			`class RectangleMaskInvocation(BaseInvocation, WithMetadata):`
			`"""Create a rectangular mask."""`

			`width: int = InputField(description="The width of the entire mask.")`
Fix field ordering Changed fields to go in w/h x/y order. 2024-04-09 19:17:55 +00:00			`height: int = InputField(description="The height of the entire mask.")`
Add RectangleMaskInvocation. 2024-03-08 15:30:55 +00:00			`x_left: int = InputField(description="The left x-coordinate of the rectangular masked region (inclusive).")`
Fix field ordering Changed fields to go in w/h x/y order. 2024-04-09 19:17:55 +00:00			`y_top: int = InputField(description="The top y-coordinate of the rectangular masked region (inclusive).")`
Add RectangleMaskInvocation. 2024-03-08 15:30:55 +00:00			`rectangle_width: int = InputField(description="The width of the rectangular masked region.")`
Fix field ordering Changed fields to go in w/h x/y order. 2024-04-09 19:17:55 +00:00			`rectangle_height: int = InputField(description="The height of the rectangular masked region.")`
Add RectangleMaskInvocation. 2024-03-08 15:30:55 +00:00
			`def invoke(self, context: InvocationContext) -> MaskOutput:`
			`mask = torch.zeros((1, self.height, self.width), dtype=torch.bool)`
fix ruff 2024-05-29 23:46:46 +00:00			`mask[:, self.y_top : self.y_top + self.rectangle_height, self.x_left : self.x_left + self.rectangle_width] = (`
			`True`
			`)`
Add RectangleMaskInvocation. 2024-03-08 15:30:55 +00:00
Rename MaskField to be a generice TensorField. 2024-04-08 18:16:22 +00:00			`mask_tensor_name = context.tensors.save(mask)`
Add RectangleMaskInvocation. 2024-03-08 15:30:55 +00:00			`return MaskOutput(`
Rename MaskField to be a generice TensorField. 2024-04-08 18:16:22 +00:00			`mask=TensorField(tensor_name=mask_tensor_name),`
Add RectangleMaskInvocation. 2024-03-08 15:30:55 +00:00			`width=self.width,`
			`height=self.height,`
			`)`
feat(nodes): add alpha mask to tensor invocation 2024-04-09 10:27:03 +00:00

			`@invocation(`
			`"alpha_mask_to_tensor",`
			`title="Alpha Mask to Tensor",`
			`tags=["conditioning"],`
			`category="conditioning",`
			`version="1.0.0",`
feat(nodes): add beta classification to mask tensor nodes 2024-04-19 13:00:44 +00:00			`classification=Classification.Beta,`
feat(nodes): add alpha mask to tensor invocation 2024-04-09 10:27:03 +00:00			`)`
			`class AlphaMaskToTensorInvocation(BaseInvocation):`
			`"""Convert a mask image to a tensor. Opaque regions are 1 and transparent regions are 0."""`

			`image: ImageField = InputField(description="The mask image to convert.")`
fix(nodes): handle invert in alpha_mask_to_tensor 2024-04-15 02:37:30 +00:00			`invert: bool = InputField(default=False, description="Whether to invert the mask.")`
feat(nodes): add alpha mask to tensor invocation 2024-04-09 10:27:03 +00:00
			`def invoke(self, context: InvocationContext) -> MaskOutput:`
			`image = context.images.get_pil(self.image.image_name)`
			`mask = torch.zeros((1, image.height, image.width), dtype=torch.bool)`
fix(nodes): handle invert in alpha_mask_to_tensor 2024-04-15 02:37:30 +00:00			`if self.invert:`
			`mask[0] = torch.tensor(np.array(image)[:, :, 3] == 0, dtype=torch.bool)`
			`else:`
			`mask[0] = torch.tensor(np.array(image)[:, :, 3] > 0, dtype=torch.bool)`
feat(nodes): add alpha mask to tensor invocation 2024-04-09 10:27:03 +00:00
			`return MaskOutput(`
feat(nodes): add InvertTensorMaskInvocation 2024-04-19 03:54:38 +00:00			`mask=TensorField(tensor_name=context.tensors.save(mask)),`
			`height=mask.shape[1],`
			`width=mask.shape[2],`
			`)`


			`@invocation(`
			`"invert_tensor_mask",`
			`title="Invert Tensor Mask",`
			`tags=["conditioning"],`
			`category="conditioning",`
			`version="1.0.0",`
feat(nodes): add beta classification to mask tensor nodes 2024-04-19 13:00:44 +00:00			`classification=Classification.Beta,`
feat(nodes): add InvertTensorMaskInvocation 2024-04-19 03:54:38 +00:00			`)`
			`class InvertTensorMaskInvocation(BaseInvocation):`
			`"""Inverts a tensor mask."""`

			`mask: TensorField = InputField(description="The tensor mask to convert.")`

			`def invoke(self, context: InvocationContext) -> MaskOutput:`
			`mask = context.tensors.load(self.mask.tensor_name)`
			`inverted = ~mask`

			`return MaskOutput(`
			`mask=TensorField(tensor_name=context.tensors.save(inverted)),`
			`height=inverted.shape[1],`
			`width=inverted.shape[2],`
feat(nodes): add alpha mask to tensor invocation 2024-04-09 10:27:03 +00:00			`)`
feat(nodes): image mask to tensor invocation Thanks @JPPhoto! 2024-04-20 11:58:16 +00:00

			`@invocation(`
			`"image_mask_to_tensor",`
			`title="Image Mask to Tensor",`
			`tags=["conditioning"],`
			`category="conditioning",`
			`version="1.0.0",`
			`)`
			`class ImageMaskToTensorInvocation(BaseInvocation, WithMetadata):`
			`"""Convert a mask image to a tensor. Converts the image to grayscale and uses thresholding at the specified value."""`

			`image: ImageField = InputField(description="The mask image to convert.")`
			`cutoff: int = InputField(ge=0, le=255, description="Cutoff (<)", default=128)`
			`invert: bool = InputField(default=False, description="Whether to invert the mask.")`

			`def invoke(self, context: InvocationContext) -> MaskOutput:`
			`image = context.images.get_pil(self.image.image_name, mode="L")`

			`mask = torch.zeros((1, image.height, image.width), dtype=torch.bool)`
			`if self.invert:`
			`mask[0] = torch.tensor(np.array(image)[:, :] >= self.cutoff, dtype=torch.bool)`
			`else:`
			`mask[0] = torch.tensor(np.array(image)[:, :] < self.cutoff, dtype=torch.bool)`

			`return MaskOutput(`
			`mask=TensorField(tensor_name=context.tensors.save(mask)),`
			`height=mask.shape[1],`
			`width=mask.shape[2],`
			`)`
Return a MaskOutput from SegmentAnythingModelInvocation. And add a MaskTensorToImageInvocation. 2024-07-31 21:15:48 +00:00

			`@invocation(`
			`"tensor_mask_to_image",`
			`title="Tensor Mask to Image",`
			`tags=["mask"],`
			`category="mask",`
			`version="1.0.0",`
			`)`
			`class MaskTensorToImageInvocation(BaseInvocation, WithMetadata, WithBoard):`
			`"""Convert a mask tensor to an image."""`

			`mask: TensorField = InputField(description="The mask tensor to convert.")`

			`def invoke(self, context: InvocationContext) -> ImageOutput:`
			`mask = context.tensors.load(self.mask.tensor_name)`
			`# Ensure that the mask is binary.`
			`if mask.dtype != torch.bool:`
			`mask = mask > 0.5`
(minor) Tweak order of mask operations. 2024-08-01 14:12:24 +00:00			`mask_np = (mask.float() * 255).byte().cpu().numpy()`
Return a MaskOutput from SegmentAnythingModelInvocation. And add a MaskTensorToImageInvocation. 2024-07-31 21:15:48 +00:00
			`mask_pil = Image.fromarray(mask_np, mode="L")`
			`image_dto = context.images.save(image=mask_pil)`
			`return ImageOutput.build(image_dto)`