Merge pull request #110 from sajattack/half-precision-embeddings

Support full-precision embeddings in half precision inference mode
This commit is contained in:
Lincoln Stein 2022-08-28 15:36:26 -04:00 committed by GitHub
commit a7ac93a899
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
2 changed files with 7 additions and 5 deletions

View File

@@ -215,11 +215,13 @@ class EmbeddingManager(nn.Module):
ckpt_path,
)
def load(self, ckpt_path, full=True):
    """Load textual-inversion embeddings from a checkpoint file.

    Args:
        ckpt_path: Path to a torch checkpoint containing
            'string_to_token' and 'string_to_param' entries.
        full: When True (default), keep the embeddings at the precision
            they were saved with (backward-compatible behavior). When
            False, convert each embedding to float16 so full-precision
            embeddings can be used with a model running half-precision
            inference.
    """
    # map_location='cpu' lets checkpoints saved on GPU load anywhere.
    ckpt = torch.load(ckpt_path, map_location='cpu')
    self.string_to_token_dict = ckpt["string_to_token"]
    self.string_to_param_dict = ckpt["string_to_param"]
    if not full:
        # Re-wrap as Parameter: .half() returns a plain tensor.
        # Assigning to existing keys while iterating .items() is safe
        # (no keys are added or removed).
        for key, value in self.string_to_param_dict.items():
            self.string_to_param_dict[key] = torch.nn.Parameter(value.half())
def get_embedding_norms_squared(self):
all_params = torch.cat(

View File

@@ -498,7 +498,7 @@ class T2I:
self.device = self._get_device()
model = self._load_model_from_config(config, self.weights)
if self.embedding_path is not None:
model.embedding_manager.load(self.embedding_path)
model.embedding_manager.load(self.embedding_path, self.full_precision)
self.model = model.to(self.device)
# model.to doesn't change the cond_stage_model.device used to move the tokenizer output, so set it here
self.model.cond_stage_model.device = self.device