further improvements to model loading

- code for committing config changes to models.yaml now lives in the
  module rather than in the invoke script
- the model marked "default" is now loaded if no model is specified on
  the command line
- uncache models when their config is edited, so that they reload
  properly (sketched just after this list)
- removed laion from models.yaml and added stable-diffusion-1.5
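
The uncache-on-edit behavior is not part of the diff shown below; a minimal
sketch of the idea, with ModelCache internals (a `models` dict keyed by model
name) assumed purely for illustration:

    class ModelCache:
        # ...
        def uncache_model(self, model_name):
            # Drop the stale in-memory copy so the next request for this
            # model reloads it from disk with the edited config.
            # `self.models` is an assumed attribute name, not the actual one.
            self.models.pop(model_name, None)
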
Lincoln Stein
2022-10-21 00:28:54 -04:00
parent a705a5a0aa
commit 83e6ab08aa
5 changed files with 91 additions and 27 deletions


@@ -35,6 +35,9 @@ from ldm.invoke.devices import choose_torch_device, choose_precision
 from ldm.invoke.conditioning import get_uc_and_c
 from ldm.invoke.model_cache import ModelCache
 
+# this is fallback model in case no default is defined
+FALLBACK_MODEL_NAME='stable-diffusion-1.4'
+
 def fix_func(orig):
     if hasattr(torch.backends, 'mps') and torch.backends.mps.is_available():
         def new_func(*args, **kw):
@@ -127,7 +130,7 @@ class Generate:
     def __init__(
             self,
-            model = 'stable-diffusion-1.4',
+            model = None,
             conf = 'configs/models.yaml',
             embedding_path = None,
             sampler_name = 'k_lms',
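
With the signature change above, callers may omit `model` entirely; a
hypothetical usage sketch (the import path is an assumption based on this
file's apparent location):

    from ldm.generate import Generate

    gr = Generate()                              # falls through to the models.yaml default
    gr = Generate(model='stable-diffusion-1.5')  # an explicit name still wins
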
@@ -143,7 +146,6 @@
             free_gpu_mem=False,
     ):
         mconfig = OmegaConf.load(conf)
-        self.model_name = model
         self.height = None
         self.width = None
         self.model_cache = None
@@ -188,6 +190,8 @@
         # model caching system for fast switching
         self.model_cache = ModelCache(mconfig,self.device,self.precision)
+        print(f'DEBUG: model={model}, default_model={self.model_cache.default_model()}')
+        self.model_name = model or self.model_cache.default_model() or FALLBACK_MODEL_NAME
 
         # for VRAM usage statistics
         self.session_peakmem = torch.cuda.max_memory_allocated() if self._has_cuda else None
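
Only the call site of default_model() appears above; one plausible shape for
that lookup, assuming each models.yaml stanza may carry a `default: true` flag
(this body is an illustration, not the actual ModelCache code):

    def default_model(self):
        # Return the name of the first stanza flagged as default, or None so
        # the caller falls through to FALLBACK_MODEL_NAME.
        # `self.config` is assumed to hold the parsed models.yaml mapping.
        for name, stanza in self.config.items():
            if stanza.get('default', False):
                return name
        return None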