Make GroundedSAMInvocation work with any input image mode (RGB, RGBA, grayscale).

2024-08-30 20:32:17 +00:00 · 2024-07-30 15:55:57 -04:00 · 2024-07-30 15:55:57 -04:00 · 6b10b59abe
commit 6b10b59abe
parent 918f77bce0
1 changed file with 2 additions and 1 deletion
--- a/invokeai/app/invocations/grounded_sam.py
+++ b/invokeai/app/invocations/grounded_sam.py
@@ -60,7 +60,8 @@ class GroundedSAMInvocation(BaseInvocation):

    @torch.no_grad()
    def invoke(self, context: InvocationContext) -> ImageOutput:
-        image_pil = context.images.get_pil(self.image.image_name)
+        # The models expect a 3-channel RGB image.
+        image_pil = context.images.get_pil(self.image.image_name, mode="RGB")

        detections = self._detect(
            context=context, image=image_pil, labels=[self.prompt], threshold=self.detection_threshold