Compare commits


7 Commits

36 changed files with 418 additions and 588 deletions

.github/CODEOWNERS (vendored, 34 changed lines)

@ -1,13 +1,13 @@
# continuous integration
/.github/workflows/ @lstein @blessedcoolant
/.github/workflows/ @mauwii @lstein @blessedcoolant
# documentation
/docs/ @lstein @blessedcoolant
mkdocs.yml @lstein @ebr
/docs/ @lstein @mauwii @blessedcoolant
mkdocs.yml @mauwii @lstein
# installation and configuration
/pyproject.toml @lstein @ebr
/docker/ @lstein
/pyproject.toml @mauwii @lstein @ebr
/docker/ @mauwii
/scripts/ @ebr @lstein @blessedcoolant
/installer/ @ebr @lstein
ldm/invoke/config @lstein @ebr
@ -21,13 +21,13 @@ invokeai/configs @lstein @ebr @blessedcoolant
# generation and model management
/ldm/*.py @lstein @blessedcoolant
/ldm/generate.py @lstein @gregghelt2
/ldm/generate.py @lstein @keturn
/ldm/invoke/args.py @lstein @blessedcoolant
/ldm/invoke/ckpt* @lstein @blessedcoolant
/ldm/invoke/ckpt_generator @lstein @blessedcoolant
/ldm/invoke/CLI.py @lstein @blessedcoolant
/ldm/invoke/config @lstein @ebr @blessedcoolant
/ldm/invoke/generator @gregghelt2 @damian0815
/ldm/invoke/config @lstein @ebr @mauwii @blessedcoolant
/ldm/invoke/generator @keturn @damian0815
/ldm/invoke/globals.py @lstein @blessedcoolant
/ldm/invoke/merge_diffusers.py @lstein @blessedcoolant
/ldm/invoke/model_manager.py @lstein @blessedcoolant
@ -36,17 +36,17 @@ invokeai/configs @lstein @ebr @blessedcoolant
/ldm/invoke/restoration @lstein @blessedcoolant
# attention, textual inversion, model configuration
/ldm/models @damian0815 @gregghelt2 @blessedcoolant
/ldm/models @damian0815 @keturn @blessedcoolant
/ldm/modules/textual_inversion_manager.py @lstein @blessedcoolant
/ldm/modules/attention.py @damian0815 @gregghelt2
/ldm/modules/diffusionmodules @damian0815 @gregghelt2
/ldm/modules/distributions @damian0815 @gregghelt2
/ldm/modules/ema.py @damian0815 @gregghelt2
/ldm/modules/attention.py @damian0815 @keturn
/ldm/modules/diffusionmodules @damian0815 @keturn
/ldm/modules/distributions @damian0815 @keturn
/ldm/modules/ema.py @damian0815 @keturn
/ldm/modules/embedding_manager.py @lstein
/ldm/modules/encoders @damian0815 @gregghelt2
/ldm/modules/image_degradation @damian0815 @gregghelt2
/ldm/modules/losses @damian0815 @gregghelt2
/ldm/modules/x_transformer.py @damian0815 @gregghelt2
/ldm/modules/encoders @damian0815 @keturn
/ldm/modules/image_degradation @damian0815 @keturn
/ldm/modules/losses @damian0815 @keturn
/ldm/modules/x_transformer.py @damian0815 @keturn
# Nodes
apps/ @Kyle0654 @jpphoto

.gitignore (vendored, 2 changed lines)

@ -233,3 +233,5 @@ installer/install.sh
installer/update.bat
installer/update.sh
# no longer stored in source directory
models


@ -41,16 +41,6 @@ Windows systems). If the `loras` folder does not already exist, just
create it. The vast majority of LoRA models use the Kohya file format,
which is a type of `.safetensors` file.
!!! warning "LoRA Naming Restrictions"
InvokeAI will only recognize LoRA files that contain the
characters a-z, A-Z, 0-9 and the underscore character
_. Other characters, including the hyphen, will cause the
LoRA file not to load. These naming restrictions may be
relaxed in the future, but for now you will need to rename
files that contain hyphens, commas, brackets, and other
non-word characters.
You may change where InvokeAI looks for the `loras` folder by passing the
`--lora_directory` option to the `invoke.sh`/`invoke.bat` launcher, or
by placing the option in `invokeai.init`. For example:
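One plausible form, with a stand-in path, would be:

invoke.sh --lora_directory=/path/to/loras

or the same option placed on its own line in `invokeai.init`:

--lora_directory=/path/to/loras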


@ -33,11 +33,6 @@ title: Overview
Restore mangled faces and make images larger with upscaling. Also see
the [Embiggen Upscaling Guide](EMBIGGEN.md).
- The [Using LoRA Models](LORAS.md)
Add custom subjects and styles using HuggingFace's repository of
embeddings.
- The [Concepts Library](CONCEPTS.md)
Add custom subjects and styles using HuggingFace's repository of


@ -79,7 +79,7 @@ title: Manual Installation, Linux
and obtaining an access token for downloading. It will then download and
install the weights files for you.
Please look [here](../020_INSTALL_MANUAL.md) for a manual process for doing
Please look [here](../INSTALL_MANUAL.md) for a manual process for doing
the same thing.
7. Start generating images!


@ -75,7 +75,7 @@ Note that you will need NVIDIA drivers, Python 3.10, and Git installed beforehan
obtaining an access token for downloading. It will then download and install the
weights files for you.
Please look [here](../020_INSTALL_MANUAL.md) for a manual process for doing the
Please look [here](../INSTALL_MANUAL.md) for a manual process for doing the
same thing.
8. Start generating images!


@ -1,5 +0,0 @@
mkdocs
mkdocs-material>=8, <9
mkdocs-git-revision-date-localized-plugin
mkdocs-redirects==1.2.0


@ -243,15 +243,16 @@ class InvokeAiInstance:
# Note that we're installing pinned versions of torch and
# torchvision here, which *should* correspond to what is
# in pyproject.toml.
# in pyproject.toml. This is to prevent torch 2.0 from
# being installed and immediately uninstalled and replaced with 1.13
pip = local[self.pip]
(
pip[
"install",
"--require-virtualenv",
"torch~=2.0.0",
"torchvision>=0.14.1",
"torch~=1.13.1",
"torchvision~=0.14.1",
"--force-reinstall",
"--find-links" if find_links is not None else None,
find_links,
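For orientation, the pinned install on the torch 1.13 side of this change corresponds roughly to running the following inside the installer's virtual environment (a sketch; the optional --find-links pair is omitted):

pip install --require-virtualenv "torch~=1.13.1" "torchvision~=0.14.1" --force-reinstall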


@ -25,11 +25,12 @@ from invokeai.backend.modules.parameters import parameters_to_command
import invokeai.frontend.dist as frontend
from ldm.generate import Generate
from ldm.invoke.args import Args, APP_ID, APP_VERSION, calculate_init_img_hash
from ldm.invoke.concepts_lib import get_hf_concepts_lib
from ldm.invoke.concepts_lib import HuggingFaceConceptsLibrary
from ldm.invoke.conditioning import (
get_tokens_for_prompt_object,
get_prompt_structure,
split_weighted_subprompts,
get_tokenizer,
)
from ldm.invoke.generator.diffusers_pipeline import PipelineIntermediateState
from ldm.invoke.generator.inpaint import infill_methods
@ -37,11 +38,11 @@ from ldm.invoke.globals import (
Globals,
global_converted_ckpts_dir,
global_models_dir,
global_lora_models_dir,
)
from ldm.invoke.pngwriter import PngWriter, retrieve_metadata
from compel.prompt_parser import Blend
from ldm.invoke.merge_diffusers import merge_diffusion_models
from ldm.modules.lora_manager import LoraManager
# Loading Arguments
opt = Args()
@ -523,12 +524,20 @@ class InvokeAIWebServer:
@socketio.on("getLoraModels")
def get_lora_models():
try:
model = self.generate.model
lora_mgr = LoraManager(model)
loras = lora_mgr.list_compatible_loras()
lora_path = global_lora_models_dir()
loras = []
for root, _, files in os.walk(lora_path):
models = [
Path(root, x)
for x in files
if Path(x).suffix in [".ckpt", ".pt", ".safetensors"]
]
loras = loras + models
found_loras = []
for lora in sorted(loras, key=str.casefold):
found_loras.append({"name":lora,"location":str(loras[lora])})
for lora in sorted(loras, key=lambda s: s.stem.lower()):
location = str(lora.resolve()).replace("\\", "/")
found_loras.append({"name": lora.stem, "location": location})
socketio.emit("foundLoras", found_loras)
except Exception as e:
self.handle_exceptions(e)
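Taken on its own, the directory-scanning branch above reduces to a small standalone helper. The sketch below is illustrative only: the function name is made up, the argument stands in for `global_lora_models_dir()`, and the suffix filter and sort mirror the lines in the diff.

import os
from pathlib import Path

def find_lora_files(lora_dir: str) -> list[dict]:
    # Collect every checkpoint-style weight file under lora_dir, recursively.
    loras = []
    for root, _, files in os.walk(lora_dir):
        loras += [
            Path(root, name)
            for name in files
            if Path(name).suffix in {".ckpt", ".pt", ".safetensors"}
        ]
    # Sort case-insensitively by file stem and normalise Windows path separators.
    return [
        {"name": p.stem, "location": str(p.resolve()).replace("\\", "/")}
        for p in sorted(loras, key=lambda p: p.stem.lower())
    ]

The resulting list is what the handler emits to the frontend as the "foundLoras" event.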
@ -538,7 +547,7 @@ class InvokeAIWebServer:
try:
local_triggers = self.generate.model.textual_inversion_manager.get_all_trigger_strings()
locals = [{'name': x} for x in sorted(local_triggers, key=str.casefold)]
concepts = get_hf_concepts_lib().list_concepts(minimum_likes=5)
concepts = HuggingFaceConceptsLibrary().list_concepts(minimum_likes=5)
concepts = [{'name': f'<{x}>'} for x in sorted(concepts, key=str.casefold) if f'<{x}>' not in local_triggers]
socketio.emit("foundTextualInversionTriggers", {'local_triggers': locals, 'huggingface_concepts': concepts})
except Exception as e:
@ -1305,7 +1314,7 @@ class InvokeAIWebServer:
None
if type(parsed_prompt) is Blend
else get_tokens_for_prompt_object(
self.generate.model.tokenizer, parsed_prompt
get_tokenizer(self.generate.model), parsed_prompt
)
)
attention_maps_image_base64_url = (


@ -80,8 +80,7 @@ trinart-2.0:
repo_id: stabilityai/sd-vae-ft-mse
recommended: False
waifu-diffusion-1.4:
description: An SD-2.1 model trained on 5.4M anime/manga-style images (4.27 GB)
revision: main
description: An SD-1.5 model trained on 680k anime/manga-style images (2.13 GB)
repo_id: hakurei/waifu-diffusion
format: diffusers
vae:

File diff suppressed because one or more lines are too long


@ -5,7 +5,7 @@
<meta name="viewport" content="width=device-width, initial-scale=1.0" />
<title>InvokeAI - A Stable Diffusion Toolkit</title>
<link rel="shortcut icon" type="icon" href="./assets/favicon-0d253ced.ico" />
<script type="module" crossorigin src="./assets/index-b12e648e.js"></script>
<script type="module" crossorigin src="./assets/index-f56b39bc.js"></script>
<link rel="stylesheet" href="./assets/index-2ab0eb58.css">
</head>


@ -33,10 +33,6 @@ import {
setIntermediateImage,
} from 'features/gallery/store/gallerySlice';
import {
getLoraModels,
getTextualInversionTriggers,
} from 'app/socketio/actions';
import type { RootState } from 'app/store';
import { addImageToStagingArea } from 'features/canvas/store/canvasSlice';
import {
@ -467,8 +463,6 @@ const makeSocketIOListeners = (
const { model_name, model_list } = data;
dispatch(setModelList(model_list));
dispatch(setCurrentStatus(i18n.t('common.statusModelChanged')));
dispatch(getLoraModels());
dispatch(getTextualInversionTriggers());
dispatch(setIsProcessing(false));
dispatch(setIsCancelable(true));
dispatch(

File diff suppressed because one or more lines are too long


@ -13,16 +13,11 @@ import time
import traceback
from typing import List
import warnings
with warnings.catch_warnings():
warnings.filterwarnings("ignore", category=UserWarning)
import torch
import cv2
import diffusers
import numpy as np
import skimage
import torch
import transformers
from diffusers.pipeline_utils import DiffusionPipeline
from diffusers.utils.import_utils import is_xformers_available
@ -638,8 +633,9 @@ class Generate:
except RuntimeError:
# Clear the CUDA cache on an exception
self.clear_cuda_cache()
print("** Could not generate image.")
raise
print(traceback.format_exc(), file=sys.stderr)
print(">> Could not generate image.")
toc = time.time()
print("\n>> Usage stats:")
@ -984,15 +980,13 @@ class Generate:
seed_everything(random.randrange(0, np.iinfo(np.uint32).max))
if self.embedding_path and not model_data.get("ti_embeddings_loaded"):
print(f'>> Loading embeddings from {self.embedding_path}')
with warnings.catch_warnings():
warnings.filterwarnings("ignore", category=UserWarning)
for root, _, files in os.walk(self.embedding_path):
for name in files:
ti_path = os.path.join(root, name)
self.model.textual_inversion_manager.load_textual_inversion(
ti_path, defer_injecting_tokens=True
)
model_data["ti_embeddings_loaded"] = True
for root, _, files in os.walk(self.embedding_path):
for name in files:
ti_path = os.path.join(root, name)
self.model.textual_inversion_manager.load_textual_inversion(
ti_path, defer_injecting_tokens=True
)
model_data["ti_embeddings_loaded"] = True
print(
f'>> Textual inversion triggers: {", ".join(sorted(self.model.textual_inversion_manager.get_all_trigger_strings()))}'
)


@ -9,6 +9,7 @@ from pathlib import Path
from typing import Union
import click
from compel import PromptParser
if sys.platform == "darwin":
@ -16,6 +17,8 @@ if sys.platform == "darwin":
import pyparsing # type: ignore
print(f'DEBUG: [1] All system modules imported', file=sys.stderr)
import ldm.invoke
from ..generate import Generate
@ -30,13 +33,21 @@ from .pngwriter import PngWriter, retrieve_metadata, write_metadata
from .readline import Completer, get_completer
from ..util import url_attachment_name
print(f'DEBUG: [2] All invokeai modules imported', file=sys.stderr)
# global used in multiple functions (fix)
infile = None
def main():
"""Initialize command-line parsers and the diffusion model"""
global infile
print('DEBUG: [3] Entered main()', file=sys.stderr)
print('DEBUG: INVOKEAI ENVIRONMENT:')
print('>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>')
print("\n".join([f'{x}:{os.environ[x]}' for x in os.environ.keys()]))
print('>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>>')
opt = Args()
args = opt.parse_args()
if not args:
@ -65,9 +76,13 @@ def main():
Globals.sequential_guidance = args.sequential_guidance
Globals.ckpt_convert = True # always true as of 2.3.4 for LoRA support
print(f'DEBUG: [4] Globals initialized', file=sys.stderr)
# run any post-install patches needed
run_patches()
print(f'DEBUG: [5] Patches run', file=sys.stderr)
print(f">> Internet connectivity is {Globals.internet_available}")
if not args.conf:
@ -83,8 +98,9 @@ def main():
# loading here to avoid long delays on startup
# these two lines prevent a horrible warning message from appearing
# when the frozen CLIP tokenizer is imported
print(f'DEBUG: [6] Importing torch modules', file=sys.stderr)
import transformers # type: ignore
from ldm.generate import Generate
transformers.logging.set_verbosity_error()
@ -92,6 +108,7 @@ def main():
diffusers.logging.set_verbosity_error()
print(f'DEBUG: [7] loading restoration models', file=sys.stderr)
# Loading Face Restoration and ESRGAN Modules
gfpgan, codeformer, esrgan = load_face_restoration(opt)
@ -113,6 +130,7 @@ def main():
Globals.lora_models_dir = opt.lora_path
# migrate legacy models
print(f'DEBUG: [8] migrating models', file=sys.stderr)
ModelManager.migrate_models()
# load the infile as a list of lines
@ -130,6 +148,7 @@ def main():
model = opt.model or retrieve_last_used_model()
print(f'DEBUG: [9] Creating generate object', file=sys.stderr)
# creating a Generate object:
try:
gen = Generate(
@ -156,6 +175,7 @@ def main():
print(">> changed to seamless tiling mode")
# preload the model
print(f'DEBUG: [10] Loading default model', file=sys.stderr)
try:
gen.load_model()
except KeyError:
@ -203,6 +223,7 @@ def main():
# TODO: main_loop() has gotten busy. Needs to be refactored.
def main_loop(gen, opt, completer):
"""prompt/read/execute loop"""
print(f'DEBUG: [11] In main loop', file=sys.stderr)
global infile
done = False
doneAfterInFile = infile is not None
@ -1321,15 +1342,16 @@ def install_missing_config_files():
install ckpt configuration files that may have been added to the
distro after original root directory configuration
"""
import invokeai.configs as conf
from shutil import copyfile
pass
# import invokeai.configs as conf
# from shutil import copyfile
root_configs = Path(global_config_dir(), 'stable-diffusion')
repo_configs = Path(conf.__path__[0], 'stable-diffusion')
for src in repo_configs.iterdir():
dest = root_configs / src.name
if not dest.exists():
copyfile(src,dest)
# root_configs = Path(global_config_dir(), 'stable-diffusion')
# repo_configs = Path(conf.__path__[0], 'stable-diffusion')
# for src in repo_configs.iterdir():
# dest = root_configs / src.name
# if not dest.exists():
# copyfile(src,dest)
def do_version_update(root_version: version.Version, app_version: Union[str, version.Version]):
"""


@ -1,2 +1 @@
__version__='2.3.5.post1'
__version__='2.3.4'


@ -12,14 +12,6 @@ from urllib import request, error as ul_error
from huggingface_hub import HfFolder, hf_hub_url, ModelSearchArguments, ModelFilter, HfApi
from ldm.invoke.globals import Globals
singleton = None
def get_hf_concepts_lib():
global singleton
if singleton is None:
singleton = HuggingFaceConceptsLibrary()
return singleton
class HuggingFaceConceptsLibrary(object):
def __init__(self, root=None):
'''


@ -15,10 +15,19 @@ from compel import Compel
from compel.prompt_parser import FlattenedPrompt, Blend, Fragment, CrossAttentionControlSubstitute, PromptParser, \
Conjunction
from .devices import torch_dtype
from .generator.diffusers_pipeline import StableDiffusionGeneratorPipeline
from ..models.diffusion.shared_invokeai_diffusion import InvokeAIDiffuserComponent
from ldm.invoke.globals import Globals
def get_tokenizer(model) -> CLIPTokenizer:
# TODO remove legacy ckpt fallback handling
return (getattr(model, 'tokenizer', None) # diffusers
or model.cond_stage_model.tokenizer) # ldm
def get_text_encoder(model) -> Any:
# TODO remove legacy ckpt fallback handling
return (getattr(model, 'text_encoder', None) # diffusers
or UnsqueezingLDMTransformer(model.cond_stage_model.transformer)) # ldm
class UnsqueezingLDMTransformer:
def __init__(self, ldm_transformer):
self.ldm_transformer = ldm_transformer
@ -32,15 +41,15 @@ class UnsqueezingLDMTransformer:
return insufficiently_unsqueezed_tensor.unsqueeze(0)
def get_uc_and_c_and_ec(prompt_string,
model: StableDiffusionGeneratorPipeline,
log_tokens=False, skip_normalize_legacy_blend=False):
def get_uc_and_c_and_ec(prompt_string, model, log_tokens=False, skip_normalize_legacy_blend=False):
# lazy-load any deferred textual inversions.
# this might take a couple of seconds the first time a textual inversion is used.
model.textual_inversion_manager.create_deferred_token_ids_for_any_trigger_terms(prompt_string)
compel = Compel(tokenizer=model.tokenizer,
text_encoder=model.text_encoder,
tokenizer = get_tokenizer(model)
text_encoder = get_text_encoder(model)
compel = Compel(tokenizer=tokenizer,
text_encoder=text_encoder,
textual_inversion_manager=model.textual_inversion_manager,
dtype_for_device_getter=torch_dtype)
@ -69,20 +78,14 @@ def get_uc_and_c_and_ec(prompt_string,
negative_conjunction = Compel.parse_prompt_string(negative_prompt_string)
negative_prompt: FlattenedPrompt | Blend = negative_conjunction.prompts[0]
tokens_count = get_max_token_count(model.tokenizer, positive_prompt)
if log_tokens or getattr(Globals, "log_tokenization", False):
log_tokenization(positive_prompt, negative_prompt, tokenizer=model.tokenizer)
log_tokenization(positive_prompt, negative_prompt, tokenizer=tokenizer)
# some LoRA models also mess with the text encoder, so they must be active while compel builds conditioning tensors
lora_conditioning_ec = InvokeAIDiffuserComponent.ExtraConditioningInfo(tokens_count_including_eos_bos=tokens_count,
lora_conditions=lora_conditions)
with InvokeAIDiffuserComponent.custom_attention_context(model.unet,
extra_conditioning_info=lora_conditioning_ec,
step_count=-1):
c, options = compel.build_conditioning_tensor_for_prompt_object(positive_prompt)
uc, _ = compel.build_conditioning_tensor_for_prompt_object(negative_prompt)
c, options = compel.build_conditioning_tensor_for_prompt_object(positive_prompt)
uc, _ = compel.build_conditioning_tensor_for_prompt_object(negative_prompt)
tokens_count = get_max_token_count(tokenizer, positive_prompt)
# now build the "real" ec
ec = InvokeAIDiffuserComponent.ExtraConditioningInfo(tokens_count_including_eos_bos=tokens_count,
cross_attention_control_args=options.get(
'cross_attention_control', None),


@ -39,7 +39,7 @@ def invokeai_is_running()->bool:
if matches:
print(f':exclamation: [bold red]An InvokeAI instance appears to be running as process {p.pid}[/red bold]')
return True
except (psutil.AccessDenied,psutil.NoSuchProcess):
except psutil.AccessDenied:
continue
return False


@ -196,6 +196,16 @@ class addModelsForm(npyscreen.FormMultiPage):
scroll_exit=True,
)
self.nextrely += 1
self.convert_models = self.add_widget_intelligent(
npyscreen.TitleSelectOne,
name="== CONVERT IMPORTED MODELS INTO DIFFUSERS==",
values=["Keep original format", "Convert to diffusers"],
value=0,
begin_entry_at=4,
max_height=4,
hidden=True, # will appear when imported models box is edited
scroll_exit=True,
)
self.cancel = self.add_widget_intelligent(
npyscreen.ButtonPress,
name="CANCEL",
@ -230,6 +240,8 @@ class addModelsForm(npyscreen.FormMultiPage):
self.show_directory_fields.addVisibleWhenSelected(i)
self.show_directory_fields.when_value_edited = self._clear_scan_directory
self.import_model_paths.when_value_edited = self._show_hide_convert
self.autoload_directory.when_value_edited = self._show_hide_convert
def resize(self):
super().resize()
@ -240,6 +252,13 @@ class addModelsForm(npyscreen.FormMultiPage):
if not self.show_directory_fields.value:
self.autoload_directory.value = ""
def _show_hide_convert(self):
model_paths = self.import_model_paths.value or ""
autoload_directory = self.autoload_directory.value or ""
self.convert_models.hidden = (
len(model_paths) == 0 and len(autoload_directory) == 0
)
def _get_starter_model_labels(self) -> List[str]:
window_width, window_height = get_terminal_size()
label_width = 25
@ -299,6 +318,7 @@ class addModelsForm(npyscreen.FormMultiPage):
.scan_directory: Path to a directory of models to scan and import
.autoscan_on_startup: True if invokeai should scan and import at startup time
.import_model_paths: list of URLs, repo_ids and file paths to import
.convert_to_diffusers: if True, convert legacy checkpoints into diffusers
"""
# we're using a global here rather than storing the result in the parentapp
# due to some bug in npyscreen that is causing attributes to be lost
@ -334,6 +354,7 @@ class addModelsForm(npyscreen.FormMultiPage):
# URLs and the like
selections.import_model_paths = self.import_model_paths.value.split()
selections.convert_to_diffusers = self.convert_models.value[0] == 1
class AddModelApplication(npyscreen.NPSAppManaged):
@ -346,6 +367,7 @@ class AddModelApplication(npyscreen.NPSAppManaged):
scan_directory=None,
autoscan_on_startup=None,
import_model_paths=None,
convert_to_diffusers=None,
)
def onStart(self):
@ -365,6 +387,7 @@ def process_and_execute(opt: Namespace, selections: Namespace):
directory_to_scan = selections.scan_directory
scan_at_startup = selections.autoscan_on_startup
potential_models_to_install = selections.import_model_paths
convert_to_diffusers = selections.convert_to_diffusers
install_requested_models(
install_initial_models=models_to_install,
@ -372,6 +395,7 @@ def process_and_execute(opt: Namespace, selections: Namespace):
scan_directory=Path(directory_to_scan) if directory_to_scan else None,
external_models=potential_models_to_install,
scan_at_startup=scan_at_startup,
convert_to_diffusers=convert_to_diffusers,
precision="float32"
if opt.full_precision
else choose_precision(torch.device(choose_torch_device())),


@ -11,7 +11,6 @@ from tempfile import TemporaryFile
import requests
from diffusers import AutoencoderKL
from diffusers import logging as dlogging
from huggingface_hub import hf_hub_url
from omegaconf import OmegaConf
from omegaconf.dictconfig import DictConfig
@ -69,6 +68,7 @@ def install_requested_models(
scan_directory: Path = None,
external_models: List[str] = None,
scan_at_startup: bool = False,
convert_to_diffusers: bool = False,
precision: str = "float16",
purge_deleted: bool = False,
config_file_path: Path = None,
@ -114,16 +114,17 @@ def install_requested_models(
try:
model_manager.heuristic_import(
path_url_or_repo,
convert=convert_to_diffusers,
config_file_callback=_pick_configuration_file,
commit_to_conf=config_file_path
)
except KeyboardInterrupt:
sys.exit(-1)
except Exception as e:
print(f'An exception has occurred: {str(e)}')
except Exception:
pass
if scan_at_startup and scan_directory.is_dir():
argument = '--autoconvert'
argument = '--autoconvert' if convert_to_diffusers else '--autoimport'
initfile = Path(Globals.root, Globals.initfile)
replacement = Path(Globals.root, f'{Globals.initfile}.new')
directory = str(scan_directory).replace('\\','/')
@ -295,21 +296,13 @@ def _download_diffusion_weights(
mconfig: DictConfig, access_token: str, precision: str = "float32"
):
repo_id = mconfig["repo_id"]
revision = mconfig.get('revision',None)
model_class = (
StableDiffusionGeneratorPipeline
if mconfig.get("format", None) == "diffusers"
else AutoencoderKL
)
extra_arg_list = [{"revision": revision}] if revision \
else [{"revision": "fp16"}, {}] if precision == "float16" \
else [{}]
extra_arg_list = [{"revision": "fp16"}, {}] if precision == "float16" else [{}]
path = None
# quench safety checker warnings
verbosity = dlogging.get_verbosity()
dlogging.set_verbosity_error()
for extra_args in extra_arg_list:
try:
path = download_from_hf(
@ -325,7 +318,6 @@ def _download_diffusion_weights(
print(f"An unexpected error occurred while downloading the model: {e})")
if path:
break
dlogging.set_verbosity(verbosity)
return path
@ -456,8 +448,6 @@ def new_config_file_contents(
stanza["description"] = mod["description"]
stanza["repo_id"] = mod["repo_id"]
stanza["format"] = mod["format"]
if "revision" in mod:
stanza["revision"] = mod["revision"]
# diffusers don't need width and height (probably .ckpt doesn't either)
# so we no longer require these in INITIAL_MODELS.yaml
if "width" in mod:
@ -482,9 +472,10 @@ def new_config_file_contents(
conf[model] = stanza
# if no default model was chosen, then we select the first one in the list
# if no default model was chosen, then we select the first
# one in the list
if not default_selected:
conf[list(conf.keys())[0]]["default"] = True
conf[list(successfully_downloaded.keys())[0]]["default"] = True
return OmegaConf.to_yaml(conf)


@ -32,7 +32,8 @@ def expand_prompts(
template_file: Path,
run_invoke: bool = False,
invoke_model: str = None,
invoke_outdir: Path = None,
invoke_outdir: str = None,
invoke_root: str = None,
processes_per_gpu: int = 1,
):
"""
@ -61,6 +62,8 @@ def expand_prompts(
invokeai_args = [shutil.which("invokeai"), "--from_file", "-"]
if invoke_model:
invokeai_args.extend(("--model", invoke_model))
if invoke_root:
invokeai_args.extend(("--root", invoke_root))
if invoke_outdir:
outdir = os.path.expanduser(invoke_outdir)
invokeai_args.extend(("--outdir", outdir))
@ -79,6 +82,11 @@ def expand_prompts(
)
import ldm.invoke.CLI
print(f'DEBUG: BATCH PARENT ENVIRONMENT:')
print('<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<')
print("\n".join([f'{x}:{os.environ[x]}' for x in os.environ.keys()]))
print('<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<')
parent_conn, child_conn = Pipe()
children = set()
for i in range(processes_to_launch):
@ -111,6 +119,13 @@ def expand_prompts(
for p in children:
p.terminate()
def _dummy_cli_main():
counter = 0
while line := sys.stdin.readline():
print(f'[{counter}] {os.getpid()} got command {line.rstrip()}\n')
counter += 1
time.sleep(1)
def _get_fn_format(directory:str, sequence:int)->str:
"""
Get a filename that doesn't exceed filename length restrictions
@ -179,9 +194,9 @@ def _run_invoke(
os.environ["CUDA_VISIBLE_DEVICES"] = f"{gpu}"
sys.argv = args
sys.stdin = MessageToStdin(conn_in)
sys.stdout = FilterStream(sys.stdout, include=re.compile("^\[\d+\]"))
with open(logfile, "w") as stderr, redirect_stderr(stderr):
entry_point()
# sys.stdout = FilterStream(sys.stdout, include=re.compile("^\[\d+\]"))
# with open(logfile, "w") as stderr, redirect_stderr(stderr):
entry_point()
def _filter_output(stream: TextIOBase):
@ -238,6 +253,10 @@ def main():
default=1,
help="When executing invokeai, how many parallel processes to execute per CUDA GPU.",
)
parser.add_argument(
'--root_dir',
default=None,
help='Path to directory containing "models", "outputs" and "configs". If not present will read from environment variable INVOKEAI_ROOT. Defaults to ~/invokeai' )
opt = parser.parse_args()
if opt.example:
@ -261,6 +280,7 @@ def main():
run_invoke=opt.invoke,
invoke_model=opt.model,
invoke_outdir=opt.outdir,
invoke_root=opt.root,
processes_per_gpu=opt.processes_per_gpu,
)


@ -400,15 +400,8 @@ class StableDiffusionGeneratorPipeline(StableDiffusionPipeline):
@property
def _submodels(self) -> Sequence[torch.nn.Module]:
module_names, _, _ = self.extract_init_dict(dict(self.config))
submodels = []
for name in module_names.keys():
if hasattr(self, name):
value = getattr(self, name)
else:
value = getattr(self.config, name)
if isinstance(value, torch.nn.Module):
submodels.append(value)
return submodels
values = [getattr(self, name) for name in module_names.keys()]
return [m for m in values if isinstance(m, torch.nn.Module)]
def image_from_embeddings(self, latents: torch.Tensor, num_inference_steps: int,
conditioning_data: ConditioningData,
@ -474,12 +467,11 @@ class StableDiffusionGeneratorPipeline(StableDiffusionPipeline):
if additional_guidance is None:
additional_guidance = []
extra_conditioning_info = conditioning_data.extra
with InvokeAIDiffuserComponent.custom_attention_context(self.invokeai_diffuser.model,
extra_conditioning_info=extra_conditioning_info,
step_count=len(self.scheduler.timesteps)
with self.invokeai_diffuser.custom_attention_context(extra_conditioning_info=extra_conditioning_info,
step_count=len(self.scheduler.timesteps)
):
yield PipelineIntermediateState(run_id=run_id, step=-1, timestep=self.scheduler.config.num_train_timesteps,
yield PipelineIntermediateState(run_id=run_id, step=-1, timestep=self.scheduler.num_train_timesteps,
latents=latents)
batch_size = latents.shape[0]
@ -763,7 +755,7 @@ class StableDiffusionGeneratorPipeline(StableDiffusionPipeline):
@property
def channels(self) -> int:
"""Compatible with DiffusionWrapper"""
return self.unet.config.in_channels
return self.unet.in_channels
def decode_latents(self, latents):
# Explicit call to get the vae loaded, since `decode` isn't the forward method.


@ -372,6 +372,12 @@ class ModelManager(object):
)
from ldm.invoke.ckpt_to_diffuser import load_pipeline_from_original_stable_diffusion_ckpt
# try:
# if self.list_models()[self.current_model]['status'] == 'active':
# self.offload_model(self.current_model)
# except Exception:
# pass
if self._has_cuda():
torch.cuda.empty_cache()
pipeline = load_pipeline_from_original_stable_diffusion_ckpt(
@ -417,9 +423,9 @@ class ModelManager(object):
pipeline_args.update(cache_dir=global_cache_dir("hub"))
if using_fp16:
pipeline_args.update(torch_dtype=torch.float16)
revision = mconfig.get('revision') or ('fp16' if using_fp16 else None)
fp_args_list = [{"revision": revision}] if revision else []
fp_args_list.append({})
fp_args_list = [{"revision": "fp16"}, {}]
else:
fp_args_list = [{}]
verbosity = dlogging.get_verbosity()
dlogging.set_verbosity_error()
@ -433,7 +439,7 @@ class ModelManager(object):
**fp_args,
)
except OSError as e:
if 'Revision Not Found' in str(e):
if str(e).startswith("fp16 is not a valid"):
pass
else:
print(
@ -1156,7 +1162,7 @@ class ModelManager(object):
return self.device.type == "cuda"
def _diffuser_sha256(
self, name_or_path: Union[str, Path], chunksize=16777216
self, name_or_path: Union[str, Path], chunksize=4096
) -> Union[str, bytes]:
path = None
if isinstance(name_or_path, Path):


@ -13,7 +13,7 @@ import re
import atexit
from typing import List
from ldm.invoke.args import Args
from ldm.invoke.concepts_lib import get_hf_concepts_lib
from ldm.invoke.concepts_lib import HuggingFaceConceptsLibrary
from ldm.invoke.globals import Globals
from ldm.modules.lora_manager import LoraManager
@ -287,7 +287,7 @@ class Completer(object):
def _concept_completions(self, text, state):
if self.concepts is None:
# cache Concepts() instance so we can check for updates in concepts_list during runtime.
self.concepts = get_hf_concepts_lib()
self.concepts = HuggingFaceConceptsLibrary()
self.embedding_terms.update(set(self.concepts.list_concepts()))
else:
self.embedding_terms.update(set(self.concepts.list_concepts()))


@ -14,6 +14,7 @@ from torch import nn
from compel.cross_attention_control import Arguments
from diffusers.models.unet_2d_condition import UNet2DConditionModel
from diffusers.models.cross_attention import AttnProcessor
from ldm.invoke.devices import torch_dtype
@ -162,7 +163,7 @@ class Context:
class InvokeAICrossAttentionMixin:
"""
Enable InvokeAI-flavoured Attention calculation, which does aggressive low-memory slicing and calls
Enable InvokeAI-flavoured CrossAttention calculation, which does aggressive low-memory slicing and calls
through both to an attention_slice_wrangler and a slicing_strategy_getter for custom attention map wrangling
and dymamic slicing strategy selection.
"""
@ -177,7 +178,7 @@ class InvokeAICrossAttentionMixin:
Set custom attention calculator to be called when attention is calculated
:param wrangler: Callback, with args (module, suggested_attention_slice, dim, offset, slice_size),
which returns either the suggested_attention_slice or an adjusted equivalent.
`module` is the current Attention module for which the callback is being invoked.
`module` is the current CrossAttention module for which the callback is being invoked.
`suggested_attention_slice` is the default-calculated attention slice
`dim` is -1 if the attenion map has not been sliced, or 0 or 1 for dimension-0 or dimension-1 slicing.
If `dim` is >= 0, `offset` and `slice_size` specify the slice start and length.
@ -287,7 +288,16 @@ class InvokeAICrossAttentionMixin:
return self.einsum_op_tensor_mem(q, k, v, 32)
def setup_cross_attention_control_attention_processors(unet: UNet2DConditionModel, context: Context):
def restore_default_cross_attention(model, is_running_diffusers: bool, processors_to_restore: Optional[AttnProcessor]=None):
if is_running_diffusers:
unet = model
unet.set_attn_processor(processors_to_restore or CrossAttnProcessor())
else:
remove_attention_function(model)
def override_cross_attention(model, context: Context, is_running_diffusers = False):
"""
Inject attention parameters and functions into the passed in model to enable cross attention editing.
@ -313,19 +323,26 @@ def setup_cross_attention_control_attention_processors(unet: UNet2DConditionMode
context.cross_attention_mask = mask.to(device)
context.cross_attention_index_map = indices.to(device)
old_attn_processors = unet.attn_processors
if torch.backends.mps.is_available():
# see note in StableDiffusionGeneratorPipeline.__init__ about borked slicing on MPS
unet.set_attn_processor(SwapCrossAttnProcessor())
if is_running_diffusers:
unet = model
old_attn_processors = unet.attn_processors
if torch.backends.mps.is_available():
# see note in StableDiffusionGeneratorPipeline.__init__ about borked slicing on MPS
unet.set_attn_processor(SwapCrossAttnProcessor())
else:
# try to re-use an existing slice size
default_slice_size = 4
slice_size = next((p.slice_size for p in old_attn_processors.values() if type(p) is SlicedAttnProcessor), default_slice_size)
unet.set_attn_processor(SlicedSwapCrossAttnProcesser(slice_size=slice_size))
else:
# try to re-use an existing slice size
default_slice_size = 4
slice_size = next((p.slice_size for p in old_attn_processors.values() if type(p) is SlicedAttnProcessor), default_slice_size)
unet.set_attn_processor(SlicedSwapCrossAttnProcesser(slice_size=slice_size))
context.register_cross_attention_modules(model)
inject_attention_function(model, context)
def get_cross_attention_modules(model, which: CrossAttentionType) -> list[tuple[str, InvokeAICrossAttentionMixin]]:
from ldm.modules.attention import CrossAttention # avoid circular import # TODO: rename as in diffusers?
from ldm.modules.attention import CrossAttention # avoid circular import
cross_attention_class: type = InvokeAIDiffusersCrossAttention if isinstance(model,UNet2DConditionModel) else CrossAttention
which_attn = "attn1" if which is CrossAttentionType.SELF else "attn2"
attention_module_tuples = [(name,module) for name, module in model.named_modules() if
@ -431,7 +448,7 @@ def get_mem_free_total(device):
class InvokeAIDiffusersCrossAttention(diffusers.models.attention.Attention, InvokeAICrossAttentionMixin):
class InvokeAIDiffusersCrossAttention(diffusers.models.attention.CrossAttention, InvokeAICrossAttentionMixin):
def __init__(self, **kwargs):
super().__init__(**kwargs)
@ -456,8 +473,8 @@ class InvokeAIDiffusersCrossAttention(diffusers.models.attention.Attention, Invo
"""
# base implementation
class AttnProcessor:
def __call__(self, attn: Attention, hidden_states, encoder_hidden_states=None, attention_mask=None):
class CrossAttnProcessor:
def __call__(self, attn: CrossAttention, hidden_states, encoder_hidden_states=None, attention_mask=None):
batch_size, sequence_length, _ = hidden_states.shape
attention_mask = attn.prepare_attention_mask(attention_mask, sequence_length)
@ -486,7 +503,7 @@ from dataclasses import field, dataclass
import torch
from diffusers.models.attention_processor import Attention, AttnProcessor, SlicedAttnProcessor
from diffusers.models.cross_attention import CrossAttention, CrossAttnProcessor, SlicedAttnProcessor
@dataclass
@ -531,7 +548,7 @@ class SlicedSwapCrossAttnProcesser(SlicedAttnProcessor):
# TODO: dynamically pick slice size based on memory conditions
def __call__(self, attn: Attention, hidden_states, encoder_hidden_states=None, attention_mask=None,
def __call__(self, attn: CrossAttention, hidden_states, encoder_hidden_states=None, attention_mask=None,
# kwargs
swap_cross_attn_context: SwapCrossAttnContext=None):


@ -12,6 +12,17 @@ class DDIMSampler(Sampler):
self.invokeai_diffuser = InvokeAIDiffuserComponent(self.model,
model_forward_callback = lambda x, sigma, cond: self.model.apply_model(x, sigma, cond))
def prepare_to_sample(self, t_enc, **kwargs):
super().prepare_to_sample(t_enc, **kwargs)
extra_conditioning_info = kwargs.get('extra_conditioning_info', None)
all_timesteps_count = kwargs.get('all_timesteps_count', t_enc)
if extra_conditioning_info is not None and extra_conditioning_info.wants_cross_attention_control:
self.invokeai_diffuser.override_attention_processors(extra_conditioning_info, step_count = all_timesteps_count)
else:
self.invokeai_diffuser.restore_default_cross_attention()
# This is the central routine
@torch.no_grad()


@ -38,6 +38,15 @@ class CFGDenoiser(nn.Module):
model_forward_callback=lambda x, sigma, cond: self.inner_model(x, sigma, cond=cond))
def prepare_to_sample(self, t_enc, **kwargs):
extra_conditioning_info = kwargs.get('extra_conditioning_info', None)
if extra_conditioning_info is not None and extra_conditioning_info.wants_cross_attention_control:
self.invokeai_diffuser.override_attention_processors(extra_conditioning_info, step_count = t_enc)
else:
self.invokeai_diffuser.restore_default_cross_attention()
def forward(self, x, sigma, uncond, cond, cond_scale):
next_x = self.invokeai_diffuser.do_diffusion_step(x, sigma, uncond, cond, cond_scale)


@ -14,6 +14,17 @@ class PLMSSampler(Sampler):
def __init__(self, model, schedule='linear', device=None, **kwargs):
super().__init__(model,schedule,model.num_timesteps, device)
def prepare_to_sample(self, t_enc, **kwargs):
super().prepare_to_sample(t_enc, **kwargs)
extra_conditioning_info = kwargs.get('extra_conditioning_info', None)
all_timesteps_count = kwargs.get('all_timesteps_count', t_enc)
if extra_conditioning_info is not None and extra_conditioning_info.wants_cross_attention_control:
self.invokeai_diffuser.override_attention_processors(extra_conditioning_info, step_count = all_timesteps_count)
else:
self.invokeai_diffuser.restore_default_cross_attention()
# this is the essential routine
@torch.no_grad()


@ -1,17 +1,18 @@
from contextlib import contextmanager
from dataclasses import dataclass
from math import ceil
from typing import Callable, Optional, Union, Any
from typing import Callable, Optional, Union, Any, Dict
import numpy as np
import torch
from diffusers import UNet2DConditionModel
from diffusers.models.cross_attention import AttnProcessor
from typing_extensions import TypeAlias
from ldm.invoke.globals import Globals
from ldm.models.diffusion.cross_attention_control import (
Arguments,
setup_cross_attention_control_attention_processors,
restore_default_cross_attention,
override_cross_attention,
Context,
get_cross_attention_modules,
CrossAttentionType,
@ -83,45 +84,66 @@ class InvokeAIDiffuserComponent:
self.cross_attention_control_context = None
self.sequential_guidance = Globals.sequential_guidance
@classmethod
@contextmanager
def custom_attention_context(
clss,
unet: UNet2DConditionModel, # note: also may futz with the text encoder depending on requested LoRAs
extra_conditioning_info: Optional[ExtraConditioningInfo],
step_count: int
self, extra_conditioning_info: Optional[ExtraConditioningInfo], step_count: int
):
old_attn_processors = None
old_attn_processor = None
if extra_conditioning_info and (
extra_conditioning_info.wants_cross_attention_control
| extra_conditioning_info.has_lora_conditions
):
old_attn_processors = unet.attn_processors
# Load lora conditions into the model
if extra_conditioning_info.has_lora_conditions:
for condition in extra_conditioning_info.lora_conditions:
condition() # target model is stored in condition state for some reason
if extra_conditioning_info.wants_cross_attention_control:
cross_attention_control_context = Context(
arguments=extra_conditioning_info.cross_attention_control_args,
step_count=step_count,
)
setup_cross_attention_control_attention_processors(
unet,
cross_attention_control_context,
)
old_attn_processor = self.override_attention_processors(
extra_conditioning_info, step_count=step_count
)
try:
yield None
finally:
if old_attn_processors is not None:
unet.set_attn_processor(old_attn_processors)
if old_attn_processor is not None:
self.restore_default_cross_attention(old_attn_processor)
if extra_conditioning_info and extra_conditioning_info.has_lora_conditions:
for lora_condition in extra_conditioning_info.lora_conditions:
lora_condition.unload()
# TODO resuscitate attention map saving
# self.remove_attention_map_saving()
def override_attention_processors(
self, conditioning: ExtraConditioningInfo, step_count: int
) -> Dict[str, AttnProcessor]:
"""
setup cross attention .swap control. for diffusers this replaces the attention processor, so
the previous attention processor is returned so that the caller can restore it later.
"""
old_attn_processors = self.model.attn_processors
# Load lora conditions into the model
if conditioning.has_lora_conditions:
for condition in conditioning.lora_conditions:
condition(self.model)
if conditioning.wants_cross_attention_control:
self.cross_attention_control_context = Context(
arguments=conditioning.cross_attention_control_args,
step_count=step_count,
)
override_cross_attention(
self.model,
self.cross_attention_control_context,
is_running_diffusers=self.is_running_diffusers,
)
return old_attn_processors
def restore_default_cross_attention(
self, processors_to_restore: Optional[dict[str, "AttnProcessor"]] = None
):
self.cross_attention_control_context = None
restore_default_cross_attention(
self.model,
is_running_diffusers=self.is_running_diffusers,
processors_to_restore=processors_to_restore,
)
def setup_attention_map_saving(self, saver: AttentionMapSaver):
def callback(slice, dim, offset, slice_size, key):
if dim is not None:


@ -6,7 +6,7 @@ from torch import nn
import sys
from ldm.invoke.concepts_lib import get_hf_concepts_lib
from ldm.invoke.concepts_lib import HuggingFaceConceptsLibrary
from ldm.data.personalized import per_img_token_list
from transformers import CLIPTokenizer
from functools import partial
@ -39,7 +39,7 @@ class EmbeddingManager(nn.Module):
super().__init__()
self.embedder = embedder
self.concepts_library=get_hf_concepts_lib()
self.concepts_library=HuggingFaceConceptsLibrary()
self.string_to_token_dict = {}
self.string_to_param_dict = nn.ParameterDict()


@ -1,16 +1,15 @@
import json
import re
from pathlib import Path
from typing import Optional
import torch
from compel import Compel
from diffusers.models import UNet2DConditionModel
from filelock import FileLock, Timeout
from safetensors.torch import load_file
from torch.utils.hooks import RemovableHandle
from transformers import CLIPTextModel
from ..invoke.globals import global_lora_models_dir, Globals
from ..invoke.devices import choose_torch_device
from ldm.invoke.devices import choose_torch_device
"""
This module supports loading LoRA weights trained with https://github.com/kohya-ss/sd-scripts
@ -18,11 +17,6 @@ To be removed once support for diffusers LoRA weights is well supported
"""
class IncompatibleModelException(Exception):
"Raised when there is an attempt to load a LoRA into a model that is incompatible with it"
pass
class LoRALayer:
lora_name: str
name: str
@ -37,14 +31,18 @@ class LoRALayer:
self.name = name
self.scale = alpha / rank if (alpha and rank) else 1.0
def forward(self, lora, input_h):
def forward(self, lora, input_h, output):
if self.mid is None:
weight = self.up(self.down(*input_h))
output = (
output
+ self.up(self.down(*input_h)) * lora.multiplier * self.scale
)
else:
weight = self.up(self.mid(self.down(*input_h)))
return weight * lora.multiplier * self.scale
output = (
output
+ self.up(self.mid(self.down(*input_h))) * lora.multiplier * self.scale
)
return output
class LoHALayer:
lora_name: str
@ -66,7 +64,8 @@ class LoHALayer:
self.name = name
self.scale = alpha / rank if (alpha and rank) else 1.0
def forward(self, lora, input_h):
def forward(self, lora, input_h, output):
if type(self.org_module) == torch.nn.Conv2d:
op = torch.nn.functional.conv2d
extra_args = dict(
@ -81,87 +80,21 @@ class LoHALayer:
extra_args = {}
if self.t1 is None:
weight = (self.w1_a @ self.w1_b) * (self.w2_a @ self.w2_b)
weight = ((self.w1_a @ self.w1_b) * (self.w2_a @ self.w2_b))
else:
rebuild1 = torch.einsum(
"i j k l, j r, i p -> p r k l", self.t1, self.w1_b, self.w1_a
)
rebuild2 = torch.einsum(
"i j k l, j r, i p -> p r k l", self.t2, self.w2_b, self.w2_a
)
rebuild1 = torch.einsum('i j k l, j r, i p -> p r k l', self.t1, self.w1_b, self.w1_a)
rebuild2 = torch.einsum('i j k l, j r, i p -> p r k l', self.t2, self.w2_b, self.w2_a)
weight = rebuild1 * rebuild2
bias = self.bias if self.bias is not None else 0
return op(
return output + op(
*input_h,
(weight + bias).view(self.org_module.weight.shape),
None,
**extra_args,
) * lora.multiplier * self.scale
class LoKRLayer:
lora_name: str
name: str
scale: float
w1: Optional[torch.Tensor] = None
w1_a: Optional[torch.Tensor] = None
w1_b: Optional[torch.Tensor] = None
w2: Optional[torch.Tensor] = None
w2_a: Optional[torch.Tensor] = None
w2_b: Optional[torch.Tensor] = None
t2: Optional[torch.Tensor] = None
bias: Optional[torch.Tensor] = None
org_module: torch.nn.Module
def __init__(self, lora_name: str, name: str, rank=4, alpha=1.0):
self.lora_name = lora_name
self.name = name
self.scale = alpha / rank if (alpha and rank) else 1.0
def forward(self, lora, input_h):
if type(self.org_module) == torch.nn.Conv2d:
op = torch.nn.functional.conv2d
extra_args = dict(
stride=self.org_module.stride,
padding=self.org_module.padding,
dilation=self.org_module.dilation,
groups=self.org_module.groups,
)
else:
op = torch.nn.functional.linear
extra_args = {}
w1 = self.w1
if w1 is None:
w1 = self.w1_a @ self.w1_b
w2 = self.w2
if w2 is None:
if self.t2 is None:
w2 = self.w2_a @ self.w2_b
else:
w2 = torch.einsum('i j k l, i p, j r -> p r k l', self.t2, self.w2_a, self.w2_b)
if len(w2.shape) == 4:
w1 = w1.unsqueeze(2).unsqueeze(2)
w2 = w2.contiguous()
weight = torch.kron(w1, w2).reshape(self.org_module.weight.shape)
bias = self.bias if self.bias is not None else 0
return op(
*input_h,
(weight + bias).view(self.org_module.weight.shape),
None,
**extra_args
) * lora.multiplier * self.scale
class LoRAModuleWrapper:
unet: UNet2DConditionModel
@ -178,22 +111,12 @@ class LoRAModuleWrapper:
self.applied_loras = {}
self.loaded_loras = {}
self.UNET_TARGET_REPLACE_MODULE = [
"Transformer2DModel",
"Attention",
"ResnetBlock2D",
"Downsample2D",
"Upsample2D",
"SpatialTransformer",
]
self.TEXT_ENCODER_TARGET_REPLACE_MODULE = [
"ResidualAttentionBlock",
"CLIPAttention",
"CLIPMLP",
]
self.UNET_TARGET_REPLACE_MODULE = ["Transformer2DModel", "Attention", "ResnetBlock2D", "Downsample2D", "Upsample2D", "SpatialTransformer"]
self.TEXT_ENCODER_TARGET_REPLACE_MODULE = ["ResidualAttentionBlock", "CLIPAttention", "CLIPMLP"]
self.LORA_PREFIX_UNET = "lora_unet"
self.LORA_PREFIX_TEXT_ENCODER = "lora_te"
def find_modules(
prefix, root_module: torch.nn.Module, target_replace_modules
) -> dict[str, torch.nn.Module]:
@ -224,6 +147,7 @@ class LoRAModuleWrapper:
self.LORA_PREFIX_UNET, unet, self.UNET_TARGET_REPLACE_MODULE
)
def lora_forward_hook(self, name):
wrapper = self
@ -235,7 +159,7 @@ class LoRAModuleWrapper:
layer = lora.layers.get(name, None)
if layer is None:
continue
output += layer.forward(lora, input_h)
output = layer.forward(lora, input_h, output)
return output
return lora_forward
@ -256,7 +180,6 @@ class LoRAModuleWrapper:
def clear_loaded_loras(self):
self.loaded_loras.clear()
class LoRA:
name: str
layers: dict[str, LoRALayer]
@ -282,6 +205,7 @@ class LoRA:
state_dict_groupped[stem] = dict()
state_dict_groupped[stem][leaf] = value
for stem, values in state_dict_groupped.items():
if stem.startswith(self.wrapper.LORA_PREFIX_TEXT_ENCODER):
wrapped = self.wrapper.text_modules.get(stem, None)
@ -302,59 +226,34 @@ class LoRA:
if "alpha" in values:
alpha = values["alpha"].item()
if (
"bias_indices" in values
and "bias_values" in values
and "bias_size" in values
):
if "bias_indices" in values and "bias_values" in values and "bias_size" in values:
bias = torch.sparse_coo_tensor(
values["bias_indices"],
values["bias_values"],
tuple(values["bias_size"]),
).to(device=self.device, dtype=self.dtype)
# lora and locon
if "lora_down.weight" in values:
value_down = values["lora_down.weight"]
value_mid = values.get("lora_mid.weight", None)
value_up = values["lora_up.weight"]
value_mid = values.get("lora_mid.weight", None)
value_up = values["lora_up.weight"]
if type(wrapped) == torch.nn.Conv2d:
if value_mid is not None:
layer_down = torch.nn.Conv2d(
value_down.shape[1], value_down.shape[0], (1, 1), bias=False
)
layer_mid = torch.nn.Conv2d(
value_mid.shape[1],
value_mid.shape[0],
wrapped.kernel_size,
wrapped.stride,
wrapped.padding,
bias=False,
)
layer_down = torch.nn.Conv2d(value_down.shape[1], value_down.shape[0], (1, 1), bias=False)
layer_mid = torch.nn.Conv2d(value_mid.shape[1], value_mid.shape[0], wrapped.kernel_size, wrapped.stride, wrapped.padding, bias=False)
else:
layer_down = torch.nn.Conv2d(
value_down.shape[1],
value_down.shape[0],
wrapped.kernel_size,
wrapped.stride,
wrapped.padding,
bias=False,
)
layer_mid = None
layer_down = torch.nn.Conv2d(value_down.shape[1], value_down.shape[0], wrapped.kernel_size, wrapped.stride, wrapped.padding, bias=False)
layer_mid = None
layer_up = torch.nn.Conv2d(
value_up.shape[1], value_up.shape[0], (1, 1), bias=False
)
layer_up = torch.nn.Conv2d(value_up.shape[1], value_up.shape[0], (1, 1), bias=False)
elif type(wrapped) == torch.nn.Linear:
layer_down = torch.nn.Linear(
value_down.shape[1], value_down.shape[0], bias=False
)
layer_mid = None
layer_up = torch.nn.Linear(
value_up.shape[1], value_up.shape[0], bias=False
)
layer_down = torch.nn.Linear(value_down.shape[1], value_down.shape[0], bias=False)
layer_mid = None
layer_up = torch.nn.Linear(value_up.shape[1], value_up.shape[0], bias=False)
else:
print(
@ -362,90 +261,52 @@ class LoRA:
)
return
with torch.no_grad():
layer_down.weight.copy_(value_down)
if layer_mid is not None:
layer_mid.weight.copy_(value_mid)
layer_up.weight.copy_(value_up)
layer_down.to(device=self.device, dtype=self.dtype)
if layer_mid is not None:
layer_mid.to(device=self.device, dtype=self.dtype)
layer_up.to(device=self.device, dtype=self.dtype)
rank = value_down.shape[0]
layer = LoRALayer(self.name, stem, rank, alpha)
# layer.bias = bias # TODO: find and debug lora/locon with bias
#layer.bias = bias # TODO: find and debug lora/locon with bias
layer.down = layer_down
layer.mid = layer_mid
layer.up = layer_up
# loha
elif "hada_w1_b" in values:
rank = values["hada_w1_b"].shape[0]
layer = LoHALayer(self.name, stem, rank, alpha)
layer.org_module = wrapped
layer.bias = bias
layer.w1_a = values["hada_w1_a"].to(
device=self.device, dtype=self.dtype
)
layer.w1_b = values["hada_w1_b"].to(
device=self.device, dtype=self.dtype
)
layer.w2_a = values["hada_w2_a"].to(
device=self.device, dtype=self.dtype
)
layer.w2_b = values["hada_w2_b"].to(
device=self.device, dtype=self.dtype
)
layer.w1_a = values["hada_w1_a"].to(device=self.device, dtype=self.dtype)
layer.w1_b = values["hada_w1_b"].to(device=self.device, dtype=self.dtype)
layer.w2_a = values["hada_w2_a"].to(device=self.device, dtype=self.dtype)
layer.w2_b = values["hada_w2_b"].to(device=self.device, dtype=self.dtype)
if "hada_t1" in values:
layer.t1 = values["hada_t1"].to(
device=self.device, dtype=self.dtype
)
layer.t1 = values["hada_t1"].to(device=self.device, dtype=self.dtype)
else:
layer.t1 = None
if "hada_t2" in values:
layer.t2 = values["hada_t2"].to(
device=self.device, dtype=self.dtype
)
layer.t2 = values["hada_t2"].to(device=self.device, dtype=self.dtype)
else:
layer.t2 = None
# lokr
elif "lokr_w1_b" in values or "lokr_w1" in values:
if "lokr_w1_b" in values:
rank = values["lokr_w1_b"].shape[0]
elif "lokr_w2_b" in values:
rank = values["lokr_w2_b"].shape[0]
else:
rank = None # unscaled
layer = LoKRLayer(self.name, stem, rank, alpha)
layer.org_module = wrapped
layer.bias = bias
if "lokr_w1" in values:
layer.w1 = values["lokr_w1"].to(device=self.device, dtype=self.dtype)
else:
layer.w1_a = values["lokr_w1_a"].to(device=self.device, dtype=self.dtype)
layer.w1_b = values["lokr_w1_b"].to(device=self.device, dtype=self.dtype)
if "lokr_w2" in values:
layer.w2 = values["lokr_w2"].to(device=self.device, dtype=self.dtype)
else:
layer.w2_a = values["lokr_w2_a"].to(device=self.device, dtype=self.dtype)
layer.w2_b = values["lokr_w2_b"].to(device=self.device, dtype=self.dtype)
if "lokr_t2" in values:
layer.t2 = values["lokr_t2"].to(device=self.device, dtype=self.dtype)
else:
print(
f">> Encountered unknown lora layer module in {self.name}: {stem} - {type(wrapped).__name__}"
@ -456,25 +317,14 @@ class LoRA:
class KohyaLoraManager:
def __init__(self, pipe):
self.vector_length_cache_path = self.lora_path / '.vectorlength.cache'
def __init__(self, pipe, lora_path):
self.unet = pipe.unet
self.lora_path = lora_path
self.wrapper = LoRAModuleWrapper(pipe.unet, pipe.text_encoder)
self.text_encoder = pipe.text_encoder
self.device = torch.device(choose_torch_device())
self.dtype = pipe.unet.dtype
@classmethod
@property
def lora_path(cls)->Path:
return Path(global_lora_models_dir())
@classmethod
@property
def vector_length_cache_path(cls)->Path:
return cls.lora_path / '.vectorlength.cache'
def load_lora_module(self, name, path_file, multiplier: float = 1.0):
print(f" | Found lora {name} at {path_file}")
if path_file.suffix == ".safetensors":
@ -482,9 +332,6 @@ class KohyaLoraManager:
else:
checkpoint = torch.load(path_file, map_location="cpu")
if not self.check_model_compatibility(checkpoint):
raise IncompatibleModelException
lora = LoRA(name, self.device, self.dtype, self.wrapper, multiplier)
lora.load_from_dict(checkpoint)
self.wrapper.loaded_loras[name] = lora
@ -492,14 +339,12 @@ class KohyaLoraManager:
return lora
def apply_lora_model(self, name, mult: float = 1.0):
path_file = None
for suffix in ["ckpt", "safetensors", "pt"]:
path_files = [x for x in Path(self.lora_path).glob(f"**/{name}.{suffix}")]
if len(path_files):
path_file = path_files[0]
path_file = Path(self.lora_path, f"{name}.{suffix}")
if path_file.exists():
print(f" | Loading lora {path_file.name} with weight {mult}")
break
if not path_file:
if not path_file.exists():
print(f" ** Unable to find lora: {name}")
return
@ -510,89 +355,13 @@ class KohyaLoraManager:
lora.multiplier = mult
self.wrapper.applied_loras[name] = lora
def unload_applied_lora(self, lora_name: str) -> bool:
"""If the indicated LoRA has previously been applied then
unload it and return True. Return False if the LoRA was
not previously applied (for status reporting)
"""
def unload_applied_lora(self, lora_name: str):
if lora_name in self.wrapper.applied_loras:
del self.wrapper.applied_loras[lora_name]
return True
return False
def unload_lora(self, lora_name: str) -> bool:
def unload_lora(self, lora_name: str):
if lora_name in self.wrapper.loaded_loras:
del self.wrapper.loaded_loras[lora_name]
return True
return False
def clear_loras(self):
self.wrapper.clear_applied_loras()
def check_model_compatibility(self, checkpoint) -> bool:
"""Checks whether the LoRA checkpoint is compatible with the token vector
length of the model that this manager is associated with.
"""
model_token_vector_length = (
self.text_encoder.get_input_embeddings().weight.data[0].shape[0]
)
lora_token_vector_length = self.vector_length_from_checkpoint(checkpoint)
return model_token_vector_length == lora_token_vector_length
@staticmethod
def vector_length_from_checkpoint(checkpoint: dict) -> int:
"""Return the vector token length for the passed LoRA checkpoint object.
This is used to determine which SD model version the LoRA was based on.
768 -> SDv1
1024-> SDv2
"""
key1 = "lora_te_text_model_encoder_layers_0_mlp_fc1.lora_down.weight"
key2 = "lora_te_text_model_encoder_layers_0_self_attn_k_proj.hada_w1_a"
lora_token_vector_length = (
checkpoint[key1].shape[1]
if key1 in checkpoint
else checkpoint[key2].shape[0]
if key2 in checkpoint
else 768
)
return lora_token_vector_length
@classmethod
def vector_length_from_checkpoint_file(self, checkpoint_path: Path) -> int:
with LoraVectorLengthCache(self.vector_length_cache_path) as cache:
if str(checkpoint_path) not in cache:
if checkpoint_path.suffix == ".safetensors":
checkpoint = load_file(
checkpoint_path.absolute().as_posix(), device="cpu"
)
else:
checkpoint = torch.load(checkpoint_path, map_location="cpu")
cache[str(checkpoint_path)] = KohyaLoraManager.vector_length_from_checkpoint(
checkpoint
)
return cache[str(checkpoint_path)]
class LoraVectorLengthCache(object):
def __init__(self, cache_path: Path):
self.cache_path = cache_path
self.lock = FileLock(Path(cache_path.parent, ".cachelock"))
self.cache = {}
def __enter__(self):
self.lock.acquire(timeout=10)
try:
if self.cache_path.exists():
with open(self.cache_path, "r") as json_file:
self.cache = json.load(json_file)
except Timeout:
print(
"** Can't acquire lock on lora vector length cache. Operations will be slower"
)
except (json.JSONDecodeError, OSError):
self.cache_path.unlink()
return self.cache
def __exit__(self, type, value, traceback):
with open(self.cache_path, "w") as json_file:
json.dump(self.cache, json_file)
self.lock.release()


@ -1,101 +1,66 @@
import os
from diffusers import StableDiffusionPipeline
from pathlib import Path
from diffusers import UNet2DConditionModel, StableDiffusionPipeline
from ldm.invoke.globals import global_lora_models_dir
from .kohya_lora_manager import KohyaLoraManager, IncompatibleModelException
from .kohya_lora_manager import KohyaLoraManager
from typing import Optional, Dict
class LoraCondition:
name: str
weight: float
def __init__(self,
name,
weight: float = 1.0,
unet: UNet2DConditionModel=None, # for diffusers format LoRAs
kohya_manager: Optional[KohyaLoraManager]=None, # for KohyaLoraManager-compatible LoRAs
):
def __init__(self, name, weight: float = 1.0, kohya_manager: Optional[KohyaLoraManager]=None):
self.name = name
self.weight = weight
self.kohya_manager = kohya_manager
self.unet = unet
def __call__(self):
def __call__(self, model):
# TODO: make model able to load from huggingface, rather then just local files
path = Path(global_lora_models_dir(), self.name)
if path.is_dir():
if not self.unet:
print(f" ** Unable to load diffusers-format LoRA {self.name}: unet is None")
return
if self.unet.load_attn_procs:
if model.load_attn_procs:
file = Path(path, "pytorch_lora_weights.bin")
if file.is_file():
print(f">> Loading LoRA: {path}")
self.unet.load_attn_procs(path.absolute().as_posix())
model.load_attn_procs(path.absolute().as_posix())
else:
print(f" ** Unable to find valid LoRA at: {path}")
else:
print(" ** Invalid Model to load LoRA")
elif self.kohya_manager:
try:
self.kohya_manager.apply_lora_model(self.name,self.weight)
except IncompatibleModelException:
print(f" ** LoRA {self.name} is incompatible with this model; will generate without the LoRA applied.")
self.kohya_manager.apply_lora_model(self.name,self.weight)
else:
print(" ** Unable to load LoRA")
def unload(self):
if self.kohya_manager and self.kohya_manager.unload_applied_lora(self.name):
if self.kohya_manager:
print(f'>> unloading LoRA {self.name}')
self.kohya_manager.unload_applied_lora(self.name)
class LoraManager:
def __init__(self, pipe: StableDiffusionPipeline):
def __init__(self, pipe):
# Kohya class handles lora not generated through diffusers
self.kohya = KohyaLoraManager(pipe)
self.unet = pipe.unet
self.kohya = KohyaLoraManager(pipe, global_lora_models_dir())
def set_loras_conditions(self, lora_weights: list):
conditions = []
if len(lora_weights) > 0:
for lora in lora_weights:
conditions.append(LoraCondition(lora.model, lora.weight, self.unet, self.kohya))
conditions.append(LoraCondition(lora.model, lora.weight, self.kohya))
if len(conditions) > 0:
return conditions
return None
def list_compatible_loras(self)->Dict[str, Path]:
'''
List all the LoRAs in the global lora directory that
are compatible with the current model. Return a dictionary
of the lora basename and its path.
'''
model_length = self.kohya.text_encoder.get_input_embeddings().weight.data[0].shape[0]
return self.list_loras(model_length)
@staticmethod
def list_loras(token_vector_length:int=None)->Dict[str, Path]:
'''List the LoRAS in the global lora directory.
If token_vector_length is provided, then only return
LoRAS that have the indicated length:
768: v1 models
1024: v2 models
'''
@classmethod
def list_loras(self)->Dict[str, Path]:
path = Path(global_lora_models_dir())
models_found = dict()
for root,_,files in os.walk(path):
for x in files:
name = Path(x).stem
suffix = Path(x).suffix
if suffix not in [".ckpt", ".pt", ".safetensors"]:
continue
path = Path(root,x)
if token_vector_length is None:
models_found[name]=Path(root,x) # unconditional addition
elif token_vector_length == KohyaLoraManager.vector_length_from_checkpoint_file(path):
models_found[name]=Path(root,x) # conditional on the base model matching
if suffix in [".ckpt", ".pt", ".safetensors"]:
models_found[name]=Path(root,x)
return models_found


@ -3,16 +3,14 @@ from dataclasses import dataclass
from pathlib import Path
from typing import Optional, Union
import warnings
with warnings.catch_warnings():
warnings.filterwarnings("ignore", category=UserWarning)
import safetensors.torch
import torch
import safetensors.torch
import torch
from picklescan.scanner import scan_file_path
from transformers import CLIPTextModel, CLIPTokenizer
from compel.embeddings_provider import BaseTextualInversionManager
from ldm.invoke.concepts_lib import get_hf_concepts_lib
from ldm.invoke.concepts_lib import HuggingFaceConceptsLibrary
@dataclass
class TextualInversion:
@ -36,7 +34,7 @@ class TextualInversionManager(BaseTextualInversionManager):
self.tokenizer = tokenizer
self.text_encoder = text_encoder
self.full_precision = full_precision
self.hf_concepts_library = get_hf_concepts_lib()
self.hf_concepts_library = HuggingFaceConceptsLibrary()
self.trigger_to_sourcefile = dict()
default_textual_inversions: list[TextualInversion] = []
self.textual_inversions = default_textual_inversions


@ -32,9 +32,9 @@ dependencies = [
"albumentations",
"click",
"clip_anytorch",
"compel~=1.1.5",
"compel~=1.1.0",
"datasets",
"diffusers[torch]~=0.16.1",
"diffusers[torch]~=0.14",
"dnspython==2.2.1",
"einops",
"eventlet",
@ -76,7 +76,7 @@ dependencies = [
"taming-transformers-rom1504",
"test-tube>=0.7.5",
"torch-fidelity",
"torch~=2.0.0",
"torch~=1.13.1",
"torchmetrics",
"torchvision>=0.14.1",
"transformers~=4.26",
@ -108,7 +108,7 @@ requires-python = ">=3.9, <3.11"
"test" = ["pytest-cov", "pytest>6.0.0"]
"xformers" = [
"triton; sys_platform=='linux'",
"xformers~=0.0.19; sys_platform!='darwin'",
"xformers~=0.0.16; sys_platform!='darwin'",
]
[project.scripts]