Fix bug in InvokeInt8Params that was causing it to use double the necessary VRAM.

2025-07-26 05:17:55 +00:00 · 2024-08-21 19:01:11 +00:00
parent fd68a2475b
commit 19a68afb3a
1 changed file with 1 addition and 1 deletion
--- a/invokeai/backend/quantization/bnb_llm_int8.py
+++ b/invokeai/backend/quantization/bnb_llm_int8.py
@@ -22,7 +22,7 @@ class InvokeInt8Params(bnb.nn.Int8Params):
            return super().cuda(device)
        elif self.CB is not None and self.SCB is not None:
            self.data = self.data.cuda()
-            self.CB = self.CB.cuda()
+            self.CB = self.data
            self.SCB = self.SCB.cuda()
        else:
            # we store the 8-bit rows-major weight