feat: metadata refactor

- Refactor how metadata is handled to support user-defined metadata in graphs (pattern sketched below)
- Update workflow embed handling
- Update UI to work with these changes
- Update tests to support metadata/workflow changes
psychedelicious
2023-10-17 17:23:10 +11:00
parent c2da74c587
commit f0db4d36e4
66 changed files with 1807 additions and 1798 deletions
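The mechanical pattern applied throughout the diff below: invocations stop declaring their own metadata: Optional[CoreMetadata] InputField (and stop calling model_dump() on it) and instead mix in WithMetadata and WithWorkflow from baseinvocation, forwarding self.metadata and self.workflow untouched to context.services.images.create(...). The mixins themselves are defined outside this file, so the snippet below is only a minimal standalone sketch of the idea — the plain pydantic Field stand-ins, the assumed field shapes (free-form dict, serialized string), and ToyImageInvocation are illustrative assumptions, not InvokeAI's actual definitions.

from typing import Any, Optional

from pydantic import BaseModel, Field


class WithMetadata(BaseModel):
    # Assumed shape: free-form, user-defined metadata to attach to the produced image.
    metadata: Optional[dict[str, Any]] = Field(default=None)


class WithWorkflow(BaseModel):
    # Assumed shape: serialized workflow graph to embed alongside the image.
    workflow: Optional[str] = Field(default=None)


class ToyImageInvocation(WithMetadata, WithWorkflow):
    """Toy invocation: mixing in the two classes is all that exposes the fields."""

    width: int = 512
    height: int = 512

    def invoke(self) -> None:
        # The real invocations forward these values as-is, e.g.
        #   context.services.images.create(..., metadata=self.metadata, workflow=self.workflow)
        print(self.metadata, self.workflow)


if __name__ == "__main__":
    ToyImageInvocation(width=64, metadata={"seed": 123}).invoke()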

invokeai/app/invocations/image.py

@@ -7,13 +7,21 @@ import cv2
import numpy
from PIL import Image, ImageChops, ImageFilter, ImageOps
from invokeai.app.invocations.metadata import CoreMetadata
from invokeai.app.invocations.primitives import BoardField, ColorField, ImageField, ImageOutput
from invokeai.app.services.image_records.image_records_common import ImageCategory, ResourceOrigin
from invokeai.backend.image_util.invisible_watermark import InvisibleWatermark
from invokeai.backend.image_util.safety_checker import SafetyChecker
from .baseinvocation import BaseInvocation, FieldDescriptions, Input, InputField, InvocationContext, invocation
from .baseinvocation import (
BaseInvocation,
FieldDescriptions,
Input,
InputField,
InvocationContext,
WithMetadata,
WithWorkflow,
invocation,
)
@invocation("show_image", title="Show Image", tags=["image"], category="image", version="1.0.0")
@@ -36,14 +44,8 @@ class ShowImageInvocation(BaseInvocation):
)
@invocation(
"blank_image",
title="Blank Image",
tags=["image"],
category="image",
version="1.0.0",
)
class BlankImageInvocation(BaseInvocation):
@invocation("blank_image", title="Blank Image", tags=["image"], category="image", version="1.0.0")
class BlankImageInvocation(BaseInvocation, WithMetadata, WithWorkflow):
"""Creates a blank image and forwards it to the pipeline"""
width: int = InputField(default=512, description="The width of the image")
@@ -61,6 +63,7 @@ class BlankImageInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -71,14 +74,8 @@ class BlankImageInvocation(BaseInvocation):
)
@invocation(
"img_crop",
title="Crop Image",
tags=["image", "crop"],
category="image",
version="1.0.0",
)
class ImageCropInvocation(BaseInvocation):
@invocation("img_crop", title="Crop Image", tags=["image", "crop"], category="image", version="1.0.0")
class ImageCropInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Crops an image to a specified box. The box can be outside of the image."""
image: ImageField = InputField(description="The image to crop")
@@ -100,6 +97,7 @@ class ImageCropInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -110,14 +108,8 @@ class ImageCropInvocation(BaseInvocation):
)
@invocation(
"img_paste",
title="Paste Image",
tags=["image", "paste"],
category="image",
version="1.0.1",
)
class ImagePasteInvocation(BaseInvocation):
@invocation("img_paste", title="Paste Image", tags=["image", "paste"], category="image", version="1.0.1")
class ImagePasteInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Pastes an image into another image."""
base_image: ImageField = InputField(description="The base image")
@@ -159,6 +151,7 @@ class ImagePasteInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -169,14 +162,8 @@ class ImagePasteInvocation(BaseInvocation):
)
@invocation(
"tomask",
title="Mask from Alpha",
tags=["image", "mask"],
category="image",
version="1.0.0",
)
class MaskFromAlphaInvocation(BaseInvocation):
@invocation("tomask", title="Mask from Alpha", tags=["image", "mask"], category="image", version="1.0.0")
class MaskFromAlphaInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Extracts the alpha channel of an image as a mask."""
image: ImageField = InputField(description="The image to create the mask from")
@@ -196,6 +183,7 @@ class MaskFromAlphaInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -206,14 +194,8 @@ class MaskFromAlphaInvocation(BaseInvocation):
)
@invocation(
"img_mul",
title="Multiply Images",
tags=["image", "multiply"],
category="image",
version="1.0.0",
)
class ImageMultiplyInvocation(BaseInvocation):
@invocation("img_mul", title="Multiply Images", tags=["image", "multiply"], category="image", version="1.0.0")
class ImageMultiplyInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Multiplies two images together using `PIL.ImageChops.multiply()`."""
image1: ImageField = InputField(description="The first image to multiply")
@@ -232,6 +214,7 @@ class ImageMultiplyInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -245,14 +228,8 @@ class ImageMultiplyInvocation(BaseInvocation):
IMAGE_CHANNELS = Literal["A", "R", "G", "B"]
@invocation(
"img_chan",
title="Extract Image Channel",
tags=["image", "channel"],
category="image",
version="1.0.0",
)
class ImageChannelInvocation(BaseInvocation):
@invocation("img_chan", title="Extract Image Channel", tags=["image", "channel"], category="image", version="1.0.0")
class ImageChannelInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Gets a channel from an image."""
image: ImageField = InputField(description="The image to get the channel from")
@@ -270,6 +247,7 @@ class ImageChannelInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -283,14 +261,8 @@ class ImageChannelInvocation(BaseInvocation):
IMAGE_MODES = Literal["L", "RGB", "RGBA", "CMYK", "YCbCr", "LAB", "HSV", "I", "F"]
@invocation(
"img_conv",
title="Convert Image Mode",
tags=["image", "convert"],
category="image",
version="1.0.0",
)
class ImageConvertInvocation(BaseInvocation):
@invocation("img_conv", title="Convert Image Mode", tags=["image", "convert"], category="image", version="1.0.0")
class ImageConvertInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Converts an image to a different mode."""
image: ImageField = InputField(description="The image to convert")
@@ -308,6 +280,7 @@ class ImageConvertInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -318,14 +291,8 @@ class ImageConvertInvocation(BaseInvocation):
)
@invocation(
"img_blur",
title="Blur Image",
tags=["image", "blur"],
category="image",
version="1.0.0",
)
class ImageBlurInvocation(BaseInvocation):
@invocation("img_blur", title="Blur Image", tags=["image", "blur"], category="image", version="1.0.0")
class ImageBlurInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Blurs an image"""
image: ImageField = InputField(description="The image to blur")
@@ -348,6 +315,7 @@ class ImageBlurInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -378,23 +346,14 @@ PIL_RESAMPLING_MAP = {
}
@invocation(
"img_resize",
title="Resize Image",
tags=["image", "resize"],
category="image",
version="1.0.0",
)
class ImageResizeInvocation(BaseInvocation):
@invocation("img_resize", title="Resize Image", tags=["image", "resize"], category="image", version="1.0.0")
class ImageResizeInvocation(BaseInvocation, WithMetadata, WithWorkflow):
"""Resizes an image to specific dimensions"""
image: ImageField = InputField(description="The image to resize")
width: int = InputField(default=512, gt=0, description="The width to resize to (px)")
height: int = InputField(default=512, gt=0, description="The height to resize to (px)")
resample_mode: PIL_RESAMPLING_MODES = InputField(default="bicubic", description="The resampling mode")
metadata: Optional[CoreMetadata] = InputField(
default=None, description=FieldDescriptions.core_metadata, ui_hidden=True
)
def invoke(self, context: InvocationContext) -> ImageOutput:
image = context.services.images.get_pil_image(self.image.image_name)
@@ -413,7 +372,7 @@ class ImageResizeInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata.model_dump() if self.metadata else None,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -424,14 +383,8 @@ class ImageResizeInvocation(BaseInvocation):
)
@invocation(
"img_scale",
title="Scale Image",
tags=["image", "scale"],
category="image",
version="1.0.0",
)
class ImageScaleInvocation(BaseInvocation):
@invocation("img_scale", title="Scale Image", tags=["image", "scale"], category="image", version="1.0.0")
class ImageScaleInvocation(BaseInvocation, WithMetadata, WithWorkflow):
"""Scales an image by a factor"""
image: ImageField = InputField(description="The image to scale")
@@ -461,6 +414,7 @@ class ImageScaleInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -471,14 +425,8 @@ class ImageScaleInvocation(BaseInvocation):
)
@invocation(
"img_lerp",
title="Lerp Image",
tags=["image", "lerp"],
category="image",
version="1.0.0",
)
class ImageLerpInvocation(BaseInvocation):
@invocation("img_lerp", title="Lerp Image", tags=["image", "lerp"], category="image", version="1.0.0")
class ImageLerpInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Linear interpolation of all pixels of an image"""
image: ImageField = InputField(description="The image to lerp")
@@ -500,6 +448,7 @@ class ImageLerpInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -510,14 +459,8 @@ class ImageLerpInvocation(BaseInvocation):
)
@invocation(
"img_ilerp",
title="Inverse Lerp Image",
tags=["image", "ilerp"],
category="image",
version="1.0.0",
)
class ImageInverseLerpInvocation(BaseInvocation):
@invocation("img_ilerp", title="Inverse Lerp Image", tags=["image", "ilerp"], category="image", version="1.0.0")
class ImageInverseLerpInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Inverse linear interpolation of all pixels of an image"""
image: ImageField = InputField(description="The image to lerp")
@@ -539,6 +482,7 @@ class ImageInverseLerpInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -549,20 +493,11 @@ class ImageInverseLerpInvocation(BaseInvocation):
)
@invocation(
"img_nsfw",
title="Blur NSFW Image",
tags=["image", "nsfw"],
category="image",
version="1.0.0",
)
class ImageNSFWBlurInvocation(BaseInvocation):
@invocation("img_nsfw", title="Blur NSFW Image", tags=["image", "nsfw"], category="image", version="1.0.0")
class ImageNSFWBlurInvocation(BaseInvocation, WithMetadata, WithWorkflow):
"""Add blur to NSFW-flagged images"""
image: ImageField = InputField(description="The image to check")
metadata: Optional[CoreMetadata] = InputField(
default=None, description=FieldDescriptions.core_metadata, ui_hidden=True
)
def invoke(self, context: InvocationContext) -> ImageOutput:
image = context.services.images.get_pil_image(self.image.image_name)
@@ -583,7 +518,7 @@ class ImageNSFWBlurInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata.model_dump() if self.metadata else None,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -607,14 +542,11 @@ class ImageNSFWBlurInvocation(BaseInvocation):
category="image",
version="1.0.0",
)
class ImageWatermarkInvocation(BaseInvocation):
class ImageWatermarkInvocation(BaseInvocation, WithMetadata, WithWorkflow):
"""Add an invisible watermark to an image"""
image: ImageField = InputField(description="The image to check")
text: str = InputField(default="InvokeAI", description="Watermark text")
metadata: Optional[CoreMetadata] = InputField(
default=None, description=FieldDescriptions.core_metadata, ui_hidden=True
)
def invoke(self, context: InvocationContext) -> ImageOutput:
image = context.services.images.get_pil_image(self.image.image_name)
@@ -626,7 +558,7 @@ class ImageWatermarkInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata.model_dump() if self.metadata else None,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -637,14 +569,8 @@ class ImageWatermarkInvocation(BaseInvocation):
)
@invocation(
"mask_edge",
title="Mask Edge",
tags=["image", "mask", "inpaint"],
category="image",
version="1.0.0",
)
class MaskEdgeInvocation(BaseInvocation):
@invocation("mask_edge", title="Mask Edge", tags=["image", "mask", "inpaint"], category="image", version="1.0.0")
class MaskEdgeInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Applies an edge mask to an image"""
image: ImageField = InputField(description="The image to apply the mask to")
@@ -678,6 +604,7 @@ class MaskEdgeInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -695,7 +622,7 @@ class MaskEdgeInvocation(BaseInvocation):
category="image",
version="1.0.0",
)
class MaskCombineInvocation(BaseInvocation):
class MaskCombineInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Combine two masks together by multiplying them using `PIL.ImageChops.multiply()`."""
mask1: ImageField = InputField(description="The first mask to combine")
@@ -714,6 +641,7 @@ class MaskCombineInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -724,14 +652,8 @@ class MaskCombineInvocation(BaseInvocation):
)
@invocation(
"color_correct",
title="Color Correct",
tags=["image", "color"],
category="image",
version="1.0.0",
)
class ColorCorrectInvocation(BaseInvocation):
@invocation("color_correct", title="Color Correct", tags=["image", "color"], category="image", version="1.0.0")
class ColorCorrectInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""
Shifts the colors of a target image to match the reference image, optionally
using a mask to only color-correct certain regions of the target image.
@@ -830,6 +752,7 @@ class ColorCorrectInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -840,14 +763,8 @@ class ColorCorrectInvocation(BaseInvocation):
)
@invocation(
"img_hue_adjust",
title="Adjust Image Hue",
tags=["image", "hue"],
category="image",
version="1.0.0",
)
class ImageHueAdjustmentInvocation(BaseInvocation):
@invocation("img_hue_adjust", title="Adjust Image Hue", tags=["image", "hue"], category="image", version="1.0.0")
class ImageHueAdjustmentInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Adjusts the Hue of an image."""
image: ImageField = InputField(description="The image to adjust")
@@ -875,6 +792,7 @@ class ImageHueAdjustmentInvocation(BaseInvocation):
node_id=self.id,
is_intermediate=self.is_intermediate,
session_id=context.graph_execution_state_id,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -950,7 +868,7 @@ CHANNEL_FORMATS = {
category="image",
version="1.0.0",
)
class ImageChannelOffsetInvocation(BaseInvocation):
class ImageChannelOffsetInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Add or subtract a value from a specific color channel of an image."""
image: ImageField = InputField(description="The image to adjust")
@@ -984,6 +902,7 @@ class ImageChannelOffsetInvocation(BaseInvocation):
node_id=self.id,
is_intermediate=self.is_intermediate,
session_id=context.graph_execution_state_id,
metadata=self.metadata,
workflow=self.workflow,
)
@@ -1020,7 +939,7 @@ class ImageChannelOffsetInvocation(BaseInvocation):
category="image",
version="1.0.0",
)
class ImageChannelMultiplyInvocation(BaseInvocation):
class ImageChannelMultiplyInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Scale a specific color channel of an image."""
image: ImageField = InputField(description="The image to adjust")
@@ -1060,6 +979,7 @@ class ImageChannelMultiplyInvocation(BaseInvocation):
is_intermediate=self.is_intermediate,
session_id=context.graph_execution_state_id,
workflow=self.workflow,
metadata=self.metadata,
)
return ImageOutput(
@@ -1079,16 +999,11 @@ class ImageChannelMultiplyInvocation(BaseInvocation):
version="1.0.1",
use_cache=False,
)
class SaveImageInvocation(BaseInvocation):
class SaveImageInvocation(BaseInvocation, WithWorkflow, WithMetadata):
"""Saves an image. Unlike an image primitive, this invocation stores a copy of the image."""
image: ImageField = InputField(description=FieldDescriptions.image)
board: Optional[BoardField] = InputField(default=None, description=FieldDescriptions.board, input=Input.Direct)
metadata: Optional[CoreMetadata] = InputField(
default=None,
description=FieldDescriptions.core_metadata,
ui_hidden=True,
)
board: BoardField = InputField(default=None, description=FieldDescriptions.board, input=Input.Direct)
def invoke(self, context: InvocationContext) -> ImageOutput:
image = context.services.images.get_pil_image(self.image.image_name)
@@ -1101,7 +1016,7 @@ class SaveImageInvocation(BaseInvocation):
node_id=self.id,
session_id=context.graph_execution_state_id,
is_intermediate=self.is_intermediate,
metadata=self.metadata.model_dump() if self.metadata else None,
metadata=self.metadata,
workflow=self.workflow,
)
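
A knock-on effect visible in the hunks above: call sites that previously pre-serialized metadata (metadata=self.metadata.model_dump() if self.metadata else None) now pass the field straight through (metadata=self.metadata). The implication — inferred from this file alone, not confirmed here — is that the image-records service now accepts the metadata object (or None) and handles serialization itself, so every invocation loses the repeated ternary guard. A self-contained illustration with hypothetical stand-ins (ImageMeta, save_image_old, and save_image_new are not InvokeAI code):

import json
from typing import Any, Optional

from pydantic import BaseModel


class ImageMeta(BaseModel):
    # Hypothetical stand-in for a metadata model such as the removed CoreMetadata.
    seed: Optional[int] = None
    positive_prompt: str = ""


def save_image_old(metadata: Optional[dict[str, Any]]) -> str:
    # Old contract: every caller dumped the model (or passed None) before calling.
    return json.dumps(metadata)


def save_image_new(metadata: Optional[ImageMeta]) -> str:
    # New contract (as inferred from this diff): the service takes the object and
    # decides how and whether to serialize it, centralizing the None handling.
    return json.dumps(metadata.model_dump() if metadata else None)


meta = ImageMeta(seed=42, positive_prompt="a lighthouse at dusk")

# Before: each invocation repeated the same guard at the call site.
print(save_image_old(meta.model_dump() if meta else None))

# After: invocations simply forward the field.
print(save_image_new(meta))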