final tidying before marking PR as ready for review

- Replace AnyModelLoader with ModelLoaderRegistry - Fix type check errors in multiple files - Remove apparently unneeded `get_model_config_enum()` method from model manager - Remove last vestiges of old model manager - Updated tests and documentation resolve conflict with seamless.py
2024-08-30 20:32:17 +00:00 · 2024-02-18 17:27:42 +11:00 · 2024-02-18 17:27:42 +11:00 · 4191ca1a46
commit 4191ca1a46
parent ab46865e5b
74 changed files with 672 additions and 10362 deletions
--- a/docs/contributing/MODEL_MANAGER.md
+++ b/docs/contributing/MODEL_MANAGER.md
@ -1531,23 +1531,29 @@ Here is a typical initialization pattern:
 ```
 from invokeai.app.services.config import InvokeAIAppConfig
-from invokeai.app.services.model_records import ModelRecordServiceBase
+from invokeai.app.services.model_load import ModelLoadService, ModelLoaderRegistry
 from invokeai.app.services.model_load import ModelLoadService
 config = InvokeAIAppConfig.get_config()
-store = ModelRecordServiceBase.open(config)
+ram_cache = ModelCache(
-loader = ModelLoadService(config, store)
+	max_cache_size=config.ram_cache_size, max_vram_cache_size=config.vram_cache_size, logger=logger
 )
 convert_cache = ModelConvertCache(
 	cache_path=config.models_convert_cache_path, max_size=config.convert_cache_size
 )
 loader = ModelLoadService(
 	app_config=config,
 	ram_cache=ram_cache,
 	convert_cache=convert_cache,
 	registry=ModelLoaderRegistry
 )
 ```
-Note that we are relying on the contents of the application
+### load_model(model_config, [submodel_type], [context]) -> LoadedModel
 configuration to choose the implementation of
 `ModelRecordServiceBase`.
-### load_model_by_key(key, [submodel_type], [context]) -> LoadedModel
+The `load_model()` method takes an `AnyModelConfig` returned by
-
+`ModelRecordService.get_model()` and returns the corresponding loaded
-The `load_model_by_key()` method receives the unique key that
+model.  It loads the model into memory, gets the model ready for use,
-identifies the model.  It loads the model into memory, gets the model
+and returns a `LoadedModel` object.
 ready for use, and returns a `LoadedModel` object.
 The optional second argument, `submodel_type`, is a `SubModelType` string
 enum, such as "vae". It is mandatory when used with a main model, and
@ -1593,25 +1599,6 @@ with model_info as vae:
 - `ModelNotFoundException`  -- key in database but model not found at path
 - `NotImplementedException` -- the loader doesn't know how to load this type of model
 ### load_model_by_attr(model_name, base_model, model_type, [submodel], [context]) -> LoadedModel
 This is similar to `load_model_by_key`, but instead it accepts the
 combination of the model's name, type and base, which it passes to the
 model record config store for retrieval. If successful, this method
 returns a `LoadedModel`. It can raise the following exceptions:
 ```
 UnknownModelException -- model with these attributes not known
 NotImplementedException -- the loader doesn't know how to load this type of model
 ValueError -- more than one model matches this combination of base/type/name
 ```
 ### load_model_by_config(config, [submodel], [context]) -> LoadedModel
 This method takes an `AnyModelConfig` returned by
 ModelRecordService.get_model() and returns the corresponding loaded
 model. It may raise a `NotImplementedException`.
 ### Emitting model loading events
 When the `context` argument is passed to `load_model_*()`, it will
@ -1656,7 +1643,7 @@ onnx models.
 To install a new loader, place it in
 `invokeai/backend/model_manager/load/model_loaders`. Inherit from
-`ModelLoader` and use the `@AnyModelLoader.register()` decorator to
+`ModelLoader` and use the `@ModelLoaderRegistry.register()` decorator to
 indicate what type of models the loader can handle.
 Here is a complete example from `generic_diffusers.py`, which is able
@ -1674,12 +1661,11 @@ from invokeai.backend.model_manager import (
    ModelType,
    SubModelType,
 )
-from ..load_base import AnyModelLoader
+from .. import ModelLoader, ModelLoaderRegistry
 from ..load_default import ModelLoader
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.CLIPVision, format=ModelFormat.Diffusers)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.CLIPVision, format=ModelFormat.Diffusers)
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.T2IAdapter, format=ModelFormat.Diffusers)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.T2IAdapter, format=ModelFormat.Diffusers)
 class GenericDiffusersLoader(ModelLoader):
    """Class to load simple diffusers models."""
@ -1728,3 +1714,74 @@ model. It does whatever it needs to do to get the model into diffusers
 format, and returns the Path of the resulting model. (The path should
 ordinarily be the same as `output_path`.)
 ## The ModelManagerService object
 For convenience, the API provides a `ModelManagerService` object which
 gives a single point of access to the major model manager
 services. This object is created at initialization time and can be
 found in the global `ApiDependencies.invoker.services.model_manager`
 object, or in `context.services.model_manager` from within an
 invocation.
 In the examples below, we have retrieved the manager using:
 ```
 mm = ApiDependencies.invoker.services.model_manager
 ```
 The following properties and methods will be available:
 ### mm.store
 This retrieves the `ModelRecordService` associated with the
 manager. Example:
 ```
 configs = mm.store.get_model_by_attr(name='stable-diffusion-v1-5')
 ```
 ### mm.install
 This retrieves the `ModelInstallService` associated with the manager.
 Example:
 ```
 job = mm.install.heuristic_import('https://civitai.com/models/58390/detail-tweaker-lora-lora')
 ```
 ### mm.load
 This retrieves the `ModelLoadService` associated with the manager. Example:
 ```
 configs = mm.store.get_model_by_attr(name='stable-diffusion-v1-5')
 assert len(configs) > 0
 loaded_model = mm.load.load_model(configs[0])
 ```
 The model manager also offers a few convenience shortcuts for loading
 models:
 ### mm.load_model_by_config(model_config, [submodel], [context]) -> LoadedModel
 Same as `mm.load.load_model()`.
 ### mm.load_model_by_attr(model_name, base_model, model_type, [submodel], [context]) -> LoadedModel
 This accepts the combination of the model's name, type and base, which
 it passes to the model record config store for retrieval. If a unique
 model config is found, this method returns a `LoadedModel`. It can
 raise the following exceptions:
 ```
 UnknownModelException -- model with these attributes not known
 NotImplementedException -- the loader doesn't know how to load this type of model
 ValueError -- more than one model matches this combination of base/type/name
 ```
 ### mm.load_model_by_key(key, [submodel], [context]) -> LoadedModel
 This method takes a model key, looks it up using the
 `ModelRecordServiceBase` object in `mm.store`, and passes the returned
 model configuration to `load_model_by_config()`.  It may raise a
 `NotImplementedException`.
--- a/invokeai/app/api/routers/model_manager_v2.py
+++ b/invokeai/app/api/routers/model_manager_v2.py
@ -35,7 +35,7 @@ from invokeai.backend.model_manager.metadata import AnyModelRepoMetadata
 from ..dependencies import ApiDependencies
-model_manager_v2_router = APIRouter(prefix="/v2/models", tags=["model_manager_v2"])
+model_manager_router = APIRouter(prefix="/v2/models", tags=["model_manager"])
 class ModelsList(BaseModel):
@ -135,7 +135,7 @@ example_model_metadata = {
 ##############################################################################
-@model_manager_v2_router.get(
+@model_manager_router.get(
    "/",
    operation_id="list_model_records",
 )
@ -164,7 +164,7 @@ async def list_model_records(
    return ModelsList(models=found_models)
-@model_manager_v2_router.get(
+@model_manager_router.get(
    "/i/{key}",
    operation_id="get_model_record",
    responses={
@ -188,7 +188,7 @@ async def get_model_record(
        raise HTTPException(status_code=404, detail=str(e))
-@model_manager_v2_router.get("/summary", operation_id="list_model_summary")
+@model_manager_router.get("/summary", operation_id="list_model_summary")
 async def list_model_summary(
    page: int = Query(default=0, description="The page to get"),
    per_page: int = Query(default=10, description="The number of models per page"),
@ -200,7 +200,7 @@ async def list_model_summary(
    return results
-@model_manager_v2_router.get(
+@model_manager_router.get(
    "/meta/i/{key}",
    operation_id="get_model_metadata",
    responses={
@ -223,7 +223,7 @@ async def get_model_metadata(
    return result
-@model_manager_v2_router.get(
+@model_manager_router.get(
    "/tags",
    operation_id="list_tags",
 )
@ -234,7 +234,7 @@ async def list_tags() -> Set[str]:
    return result
-@model_manager_v2_router.get(
+@model_manager_router.get(
    "/tags/search",
    operation_id="search_by_metadata_tags",
 )
@ -247,7 +247,7 @@ async def search_by_metadata_tags(
    return ModelsList(models=results)
-@model_manager_v2_router.patch(
+@model_manager_router.patch(
    "/i/{key}",
    operation_id="update_model_record",
    responses={
@ -281,7 +281,7 @@ async def update_model_record(
    return model_response
-@model_manager_v2_router.delete(
+@model_manager_router.delete(
    "/i/{key}",
    operation_id="del_model_record",
    responses={
@ -311,7 +311,7 @@ async def del_model_record(
        raise HTTPException(status_code=404, detail=str(e))
-@model_manager_v2_router.post(
+@model_manager_router.post(
    "/i/",
    operation_id="add_model_record",
    responses={
@ -349,7 +349,7 @@ async def add_model_record(
    return result
-@model_manager_v2_router.post(
+@model_manager_router.post(
    "/heuristic_import",
    operation_id="heuristic_import_model",
    responses={
@ -416,7 +416,7 @@ async def heuristic_import(
    return result
-@model_manager_v2_router.post(
+@model_manager_router.post(
    "/install",
    operation_id="import_model",
    responses={
@ -516,7 +516,7 @@ async def import_model(
    return result
-@model_manager_v2_router.get(
+@model_manager_router.get(
    "/import",
    operation_id="list_model_install_jobs",
 )
@ -544,7 +544,7 @@ async def list_model_install_jobs() -> List[ModelInstallJob]:
    return jobs
-@model_manager_v2_router.get(
+@model_manager_router.get(
    "/import/{id}",
    operation_id="get_model_install_job",
    responses={
@ -564,7 +564,7 @@ async def get_model_install_job(id: int = Path(description="Model install id"))
        raise HTTPException(status_code=404, detail=str(e))
-@model_manager_v2_router.delete(
+@model_manager_router.delete(
    "/import/{id}",
    operation_id="cancel_model_install_job",
    responses={
@ -583,7 +583,7 @@ async def cancel_model_install_job(id: int = Path(description="Model install job
    installer.cancel_job(job)
-@model_manager_v2_router.patch(
+@model_manager_router.patch(
    "/import",
    operation_id="prune_model_install_jobs",
    responses={
@ -597,7 +597,7 @@ async def prune_model_install_jobs() -> Response:
    return Response(status_code=204)
-@model_manager_v2_router.patch(
+@model_manager_router.patch(
    "/sync",
    operation_id="sync_models_to_config",
    responses={
@ -616,7 +616,7 @@ async def sync_models_to_config() -> Response:
    return Response(status_code=204)
-@model_manager_v2_router.put(
+@model_manager_router.put(
    "/convert/{key}",
    operation_id="convert_model",
    responses={
@ -694,7 +694,7 @@ async def convert_model(
    return new_config
-@model_manager_v2_router.put(
+@model_manager_router.put(
    "/merge",
    operation_id="merge",
    responses={
--- a/invokeai/app/api/routers/models.py
+++ b/invokeai/app/api/routers/models.py
@ -1,426 +0,0 @@
 # Copyright (c) 2023 Kyle Schouviller (https://github.com/kyle0654), 2023 Kent Keirsey (https://github.com/hipsterusername), 2023 Lincoln D. Stein
 import pathlib
 from typing import Annotated, List, Literal, Optional, Union
 from fastapi import Body, Path, Query, Response
 from fastapi.routing import APIRouter
 from pydantic import BaseModel, ConfigDict, Field, TypeAdapter
 from starlette.exceptions import HTTPException
 from invokeai.backend.model_management import BaseModelType, MergeInterpolationMethod, ModelType
 from invokeai.backend.model_management.models import (
    OPENAPI_MODEL_CONFIGS,
    InvalidModelException,
    ModelNotFoundException,
    SchedulerPredictionType,
 )
 from ..dependencies import ApiDependencies
 # Router that collects every version-1 model endpoint declared in this module;
 # all routes registered on it live under the "/v1/models" prefix.
 models_router = APIRouter(prefix="/v1/models", tags=["models"])
 # Response aliases: each one is the union of all config classes listed in
 # OPENAPI_MODEL_CONFIGS. Where a TypeAdapter is paired with an alias, the
 # handlers call its validate_python() to turn the raw record returned by the
 # model manager into a member of that union.
 UpdateModelResponse = Union[tuple(OPENAPI_MODEL_CONFIGS)]
 UpdateModelResponseValidator = TypeAdapter(UpdateModelResponse)
 ImportModelResponse = Union[tuple(OPENAPI_MODEL_CONFIGS)]
 ImportModelResponseValidator = TypeAdapter(ImportModelResponse)
 ConvertModelResponse = Union[tuple(OPENAPI_MODEL_CONFIGS)]
 ConvertModelResponseValidator = TypeAdapter(ConvertModelResponse)
 # No dedicated validator is declared for the merge response; merge_models()
 # reuses ConvertModelResponseValidator, which wraps the same union.
 MergeModelResponse = Union[tuple(OPENAPI_MODEL_CONFIGS)]
 # NOTE(review): not referenced by any handler visible in this module -- confirm before relying on it.
 ImportModelAttributes = Union[tuple(OPENAPI_MODEL_CONFIGS)]
 class ModelsList(BaseModel):
    """Response envelope for `list_models`: a list of model configuration records."""

    # Each entry is one of the config classes listed in OPENAPI_MODEL_CONFIGS.
    models: list[Union[tuple(OPENAPI_MODEL_CONFIGS)]]
    # pydantic option: enum-typed fields are populated with the enum's value
    # rather than the enum member itself.
    model_config = ConfigDict(use_enum_values=True)
 # Validates the {"models": [...]} dict built by list_models() into a ModelsList.
 ModelsListValidator = TypeAdapter(ModelsList)
@models_router.get(
    "/",
    operation_id="list_models",
    responses={200: {"model": ModelsList}},
)
async def list_models(
    base_models: Optional[List[BaseModelType]] = Query(default=None, description="Base models to include"),
    model_type: Optional[ModelType] = Query(default=None, description="The type of model to get"),
) -> ModelsList:
    """Gets a list of models"""
    # The docstring above is published by FastAPI as the endpoint description,
    # so it is kept verbatim; implementation notes live in comments instead.
    manager = ApiDependencies.invoker.services.model_manager

    if not base_models:
        # No base-model filter supplied (None or empty): one unfiltered query.
        found = manager.list_models(None, model_type)
    else:
        # One query per requested base model, results concatenated in request order.
        found = [
            record
            for base in base_models
            for record in manager.list_models(base, model_type)
        ]

    # Validate the raw records into the typed response envelope.
    return ModelsListValidator.validate_python({"models": found})
@models_router.patch(
    "/{base_model}/{model_type}/{model_name}",
    operation_id="update_model",
    responses={
        200: {"description": "The model was updated successfully"},
        400: {"description": "Bad request"},
        404: {"description": "The model could not be found"},
        409: {"description": "There is already a model corresponding to the new name"},
    },
    status_code=200,
    response_model=UpdateModelResponse,
)
async def update_model(
    base_model: BaseModelType = Path(description="Base model"),
    model_type: ModelType = Path(description="The type of model"),
    model_name: str = Path(description="model name"),
    info: Union[tuple(OPENAPI_MODEL_CONFIGS)] = Body(description="Model configuration"),
) -> UpdateModelResponse:
    """Update model contents with a new config. If the model name or base fields are changed, then the model is renamed."""
    # Error mapping: ModelNotFoundException -> 404, ValueError -> 409,
    # any other exception -> 400.
    logger = ApiDependencies.invoker.services.logger

    try:
        manager = ApiDependencies.invoker.services.model_manager

        # Snapshot the record before any change so a path move can be detected.
        record_before = manager.list_model(
            model_name=model_name,
            base_model=base_model,
            model_type=model_type,
        )

        # A differing name or base in the payload means a rename was requested.
        if info.model_name != model_name or info.base_model != base_model:
            manager.rename_model(
                base_model=base_model,
                model_type=model_type,
                model_name=model_name,
                new_name=info.model_name,
                new_base=info.base_model,
            )
            logger.info(f"Successfully renamed {base_model.value}/{model_name}=>{info.base_model}/{info.model_name}")

            # From here on, address the model by its new identity.
            model_name = info.model_name
            base_model = info.base_model
            record_after = manager.list_model(
                model_name=model_name,
                base_model=base_model,
                model_type=model_type,
            )
            path_after = record_after.get("path")
            if path_after != record_before.get("path"):
                # model manager moved model path during rename - don't overwrite it
                info.path = path_after

        # replace empty string values with None/null to avoid phenomenon of vae: ''
        # (every falsy value, not only "", is mapped to None)
        attributes = {field: (value or None) for field, value in info.model_dump().items()}

        manager.update_model(
            model_name=model_name,
            base_model=base_model,
            model_type=model_type,
            model_attributes=attributes,
        )

        # Re-read the stored record and validate it into the response type.
        updated_record = manager.list_model(
            model_name=model_name,
            base_model=base_model,
            model_type=model_type,
        )
        return UpdateModelResponseValidator.validate_python(updated_record)
    except ModelNotFoundException as err:
        raise HTTPException(status_code=404, detail=str(err))
    except ValueError as err:
        logger.error(str(err))
        raise HTTPException(status_code=409, detail=str(err))
    except Exception as err:
        logger.error(str(err))
        raise HTTPException(status_code=400, detail=str(err))
@models_router.post(
    "/import",
    operation_id="import_model",
    responses={
        201: {"description": "The model imported successfully"},
        404: {"description": "The model could not be found"},
        415: {"description": "Unrecognized file/folder format"},
        424: {"description": "The model appeared to import successfully, but could not be found in the model manager"},
        409: {"description": "There is already a model corresponding to this path or repo_id"},
    },
    status_code=201,
    response_model=ImportModelResponse,
)
async def import_model(
    location: str = Body(description="A model path, repo_id or URL to import"),
    prediction_type: Optional[Literal["v_prediction", "epsilon", "sample"]] = Body(
        description="Prediction type for SDv2 checkpoints and rare SDv1 checkpoints",
        default=None,
    ),
) -> ImportModelResponse:
    """Add a model using its local path, repo_id, or remote URL. Model characteristics will be probed and configured automatically"""
    # Error mapping: ModelNotFoundException -> 404, InvalidModelException -> 415,
    # ValueError -> 409. A missing install result is also reported as 415.
    logger = ApiDependencies.invoker.services.logger

    # Drop surrounding quotes/spaces that tend to come along with pasted paths.
    location = location.strip("\"' ")

    # Lookup table from the enum's string value to the enum member.
    by_value = {member.value: member for member in SchedulerPredictionType}

    def pick_prediction_type(x):
        # The argument supplied by the importer is ignored; the answer is
        # always the prediction type chosen by the API caller (None if unset).
        return by_value.get(prediction_type)

    try:
        manager = ApiDependencies.invoker.services.model_manager
        installed = manager.heuristic_import(
            items_to_import={location},
            prediction_type_helper=pick_prediction_type,
        )

        info = installed.get(location)
        if not info:
            logger.error("Import failed")
            raise HTTPException(status_code=415)

        logger.info(f"Successfully imported {location}, got {info}")
        record = manager.list_model(
            model_name=info.name,
            base_model=info.base_model,
            model_type=info.model_type,
        )
        return ImportModelResponseValidator.validate_python(record)
    except ModelNotFoundException as err:
        logger.error(str(err))
        raise HTTPException(status_code=404, detail=str(err))
    except InvalidModelException as err:
        logger.error(str(err))
        raise HTTPException(status_code=415)
    except ValueError as err:
        logger.error(str(err))
        raise HTTPException(status_code=409, detail=str(err))
@models_router.post(
    "/add",
    operation_id="add_model",
    responses={
        201: {"description": "The model added successfully"},
        404: {"description": "The model could not be found"},
        424: {"description": "The model appeared to add successfully, but could not be found in the model manager"},
        409: {"description": "There is already a model corresponding to this path or repo_id"},
    },
    status_code=201,
    response_model=ImportModelResponse,
)
async def add_model(
    info: Union[tuple(OPENAPI_MODEL_CONFIGS)] = Body(description="Model configuration"),
) -> ImportModelResponse:
    """Add a model using the configuration information appropriate for its type. Only local models can be added by path"""
    # Error mapping: ModelNotFoundException -> 404, ValueError -> 409.
    logger = ApiDependencies.invoker.services.logger

    try:
        manager = ApiDependencies.invoker.services.model_manager

        # Register the model under the name/base/type carried by the payload.
        manager.add_model(
            info.model_name,
            info.base_model,
            info.model_type,
            model_attributes=info.model_dump(),
        )
        logger.info(f"Successfully added {info.model_name}")

        # Read the stored record back and validate it into the response type.
        stored = manager.list_model(
            model_name=info.model_name,
            base_model=info.base_model,
            model_type=info.model_type,
        )
        return ImportModelResponseValidator.validate_python(stored)
    except ModelNotFoundException as err:
        logger.error(str(err))
        raise HTTPException(status_code=404, detail=str(err))
    except ValueError as err:
        logger.error(str(err))
        raise HTTPException(status_code=409, detail=str(err))
@models_router.delete(
    "/{base_model}/{model_type}/{model_name}",
    operation_id="del_model",
    responses={
        204: {"description": "Model deleted successfully"},
        404: {"description": "Model not found"},
    },
    status_code=204,
    response_model=None,
)
async def delete_model(
    base_model: BaseModelType = Path(description="Base model"),
    model_type: ModelType = Path(description="The type of model"),
    model_name: str = Path(description="model name"),
) -> Response:
    """Delete Model"""
    # An unknown model is reported to the client as 404.
    logger = ApiDependencies.invoker.services.logger

    try:
        manager = ApiDependencies.invoker.services.model_manager
        manager.del_model(model_name, base_model=base_model, model_type=model_type)
    except ModelNotFoundException as err:
        logger.error(str(err))
        raise HTTPException(status_code=404, detail=str(err))

    # Deletion succeeded: log it and answer with an empty 204.
    logger.info(f"Deleted model: {model_name}")
    return Response(status_code=204)
@models_router.put(
    "/convert/{base_model}/{model_type}/{model_name}",
    operation_id="convert_model",
    responses={
        200: {"description": "Model converted successfully"},
        400: {"description": "Bad request"},
        404: {"description": "Model not found"},
    },
    status_code=200,
    response_model=ConvertModelResponse,
)
async def convert_model(
    base_model: BaseModelType = Path(description="Base model"),
    model_type: ModelType = Path(description="The type of model"),
    model_name: str = Path(description="model name"),
    convert_dest_directory: Optional[str] = Query(
        default=None, description="Save the converted model to the designated directory"
    ),
) -> ConvertModelResponse:
    """Convert a checkpoint model into a diffusers model, optionally saving to the indicated destination directory, or `models` if none."""
    # Error mapping: ModelNotFoundException -> 404, ValueError -> 400.
    logger = ApiDependencies.invoker.services.logger

    try:
        logger.info(f"Converting model: {model_name}")

        # An empty or missing directory means "let the model manager decide".
        if convert_dest_directory:
            destination = pathlib.Path(convert_dest_directory)
        else:
            destination = None

        manager = ApiDependencies.invoker.services.model_manager
        manager.convert_model(
            model_name,
            base_model=base_model,
            model_type=model_type,
            convert_dest_directory=destination,
        )

        # Re-read the converted model's record and validate it for the response.
        converted = manager.list_model(model_name, base_model=base_model, model_type=model_type)
        return ConvertModelResponseValidator.validate_python(converted)
    except ModelNotFoundException as err:
        raise HTTPException(status_code=404, detail=f"Model '{model_name}' not found: {str(err)}")
    except ValueError as err:
        raise HTTPException(status_code=400, detail=str(err))
@models_router.get(
    "/search",
    operation_id="search_for_models",
    responses={
        200: {"description": "Directory searched successfully"},
        404: {"description": "Invalid directory path"},
    },
    status_code=200,
    response_model=List[pathlib.Path],
)
async def search_for_models(
    search_path: pathlib.Path = Query(description="Directory path to search for models"),
) -> List[pathlib.Path]:
    # Delegates the search to the model manager once the path is known to be
    # a directory; anything else is rejected with 404.
    if search_path.is_dir():
        manager = ApiDependencies.invoker.services.model_manager
        return manager.search_for_models(search_path)

    raise HTTPException(
        status_code=404,
        detail=f"The search path '{search_path}' does not exist or is not directory",
    )
@models_router.get(
    "/ckpt_confs",
    operation_id="list_ckpt_configs",
    responses={
        200: {"description": "paths retrieved successfully"},
    },
    status_code=200,
    response_model=List[pathlib.Path],
)
async def list_ckpt_configs() -> List[pathlib.Path]:
    """Return a list of the legacy checkpoint configuration files stored in `ROOT/configs/stable-diffusion`, relative to ROOT."""
    # Pure pass-through: the model manager produces the list of paths.
    manager = ApiDependencies.invoker.services.model_manager
    config_paths = manager.list_checkpoint_configs()
    return config_paths
@models_router.post(
    "/sync",
    operation_id="sync_to_config",
    responses={
        201: {"description": "synchronization successful"},
    },
    status_code=201,
    response_model=bool,
)
async def sync_to_config() -> bool:
    """Call after making changes to models.yaml, autoimport directories or models directory to synchronize
    in-memory data structures with disk data structures."""
    # The response body is always True; a failure surfaces as whatever
    # exception the model manager raises.
    manager = ApiDependencies.invoker.services.model_manager
    manager.sync_to_config()
    return True
 # There's some weird pydantic-fastapi behaviour that requires this to be a separate class
 # TODO: After a few updates, see if it works inside the route operation handler?
 class MergeModelsBody(BaseModel):
    """Request body for `merge_models`: which models to merge and how."""

    # Names of the models to merge; validation enforces between two and three entries.
    model_names: List[str] = Field(description="model name", min_length=2, max_length=3)
    # Name for the merged model; merge_models() falls back to the source
    # names joined with "+" when this is empty.
    merged_model_name: Optional[str] = Field(description="Name of destination model")
    alpha: Optional[float] = Field(description="Alpha weighting strength to apply to 2d and 3d models", default=0.5)
    interp: Optional[MergeInterpolationMethod] = Field(description="Interpolation method")
    force: Optional[bool] = Field(
        description="Force merging of models created with different versions of diffusers",
        default=False,
    )
    merge_dest_directory: Optional[str] = Field(
        description="Save the merged model to the designated directory (with 'merged_model_name' appended)",
        default=None,
    )
    # Presumably clears pydantic's protected "model_" namespace so the
    # `model_names` field does not trigger a naming warning -- confirm against pydantic docs.
    model_config = ConfigDict(protected_namespaces=())
@models_router.put(
    "/merge/{base_model}",
    operation_id="merge_models",
    responses={
        # Fixed: this description was copied from the convert endpoint.
        200: {"description": "Model merged successfully"},
        400: {"description": "Incompatible models"},
        404: {"description": "One or more models not found"},
    },
    status_code=200,
    response_model=MergeModelResponse,
)
async def merge_models(
    body: Annotated[MergeModelsBody, Body(description="Model configuration", embed=True)],
    base_model: BaseModelType = Path(description="Base model"),
) -> MergeModelResponse:
    """Merge two or three models into a new model, optionally saving it to the indicated destination directory."""
    # The docstring is published by FastAPI as the endpoint description. It
    # previously read "Convert a checkpoint model into a diffusers model",
    # a copy-paste from convert_model that mislabelled this endpoint.
    #
    # Parameters:
    #   body       -- merge settings (source model names, destination name,
    #                 alpha, interpolation method, force flag, destination dir).
    #   base_model -- base model shared by the models being merged.
    # Returns the validated configuration record of the merged model.
    # Error mapping: ModelNotFoundException -> 404, ValueError -> 400.
    logger = ApiDependencies.invoker.services.logger

    try:
        logger.info(
            f"Merging models: {body.model_names} into {body.merge_dest_directory or '<MODELS>'}/{body.merged_model_name}"
        )

        # An empty or missing directory means "let the model manager decide".
        dest = pathlib.Path(body.merge_dest_directory) if body.merge_dest_directory else None

        manager = ApiDependencies.invoker.services.model_manager
        result = manager.merge_models(
            model_names=body.model_names,
            base_model=base_model,
            # Default name: the source model names joined with "+".
            merged_model_name=body.merged_model_name or "+".join(body.model_names),
            alpha=body.alpha,
            interp=body.interp,
            force=body.force,
            merge_dest_directory=dest,
        )

        # Look the merged model up by the name the manager reports; the lookup
        # uses ModelType.Main as the model type.
        model_raw = manager.list_model(
            result.name,
            base_model=base_model,
            model_type=ModelType.Main,
        )
        # ConvertModelResponseValidator wraps the same union of config classes
        # as MergeModelResponse, so it doubles as the merge validator.
        return ConvertModelResponseValidator.validate_python(model_raw)
    except ModelNotFoundException:
        raise HTTPException(
            status_code=404,
            detail=f"One or more of the models '{body.model_names}' not found",
        )
    except ValueError as e:
        raise HTTPException(status_code=400, detail=str(e))
--- a/invokeai/app/api_app.py
+++ b/invokeai/app/api_app.py
@ -48,7 +48,7 @@ if True:  # hack to make flake8 happy with imports coming after setting up the c
        boards,
        download_queue,
        images,
-        model_manager_v2,
+        model_manager,
        session_queue,
        sessions,
        utilities,
@ -113,7 +113,7 @@ async def shutdown_event() -> None:
 app.include_router(sessions.session_router, prefix="/api")
 app.include_router(utilities.utilities_router, prefix="/api")
-app.include_router(model_manager_v2.model_manager_v2_router, prefix="/api")
+app.include_router(model_manager.model_manager_router, prefix="/api")
 app.include_router(download_queue.download_queue_router, prefix="/api")
 app.include_router(images.images_router, prefix="/api")
 app.include_router(boards.boards_router, prefix="/api")
@ -175,21 +175,23 @@ def custom_openapi() -> dict[str, Any]:
        invoker_schema["class"] = "invocation"
        openapi_schema["components"]["schemas"][f"{output_type_title}"]["class"] = "output"
-    from invokeai.backend.model_management.models import get_model_config_enums
+    # This code no longer seems to be necessary?
    # Leave it here just in case
    #
    # from invokeai.backend.model_manager import get_model_config_formats
    # formats = get_model_config_formats()
    # for model_config_name, enum_set in formats.items():
-    for model_config_format_enum in set(get_model_config_enums()):
+    #     if model_config_name in openapi_schema["components"]["schemas"]:
-        name = model_config_format_enum.__qualname__
+    #         # print(f"Config with name {name} already defined")
    #         continue
-        if name in openapi_schema["components"]["schemas"]:
+    #     openapi_schema["components"]["schemas"][model_config_name] = {
-            # print(f"Config with name {name} already defined")
+    #         "title": model_config_name,
-            continue
+    #         "description": "An enumeration.",
-
+    #         "type": "string",
-        openapi_schema["components"]["schemas"][name] = {
+    #         "enum": [v.value for v in enum_set],
-            "title": name,
+    #     }
            "description": "An enumeration.",
            "type": "string",
            "enum": [v.value for v in model_config_format_enum],
        }
    app.openapi_schema = openapi_schema
    return app.openapi_schema
--- a/invokeai/app/invocations/compel.py
+++ b/invokeai/app/invocations/compel.py
@ -18,15 +18,15 @@ from invokeai.app.services.model_records import UnknownModelException
 from invokeai.app.services.shared.invocation_context import InvocationContext
 from invokeai.app.util.ti_utils import extract_ti_triggers_from_prompt
 from invokeai.backend.lora import LoRAModelRaw
 from invokeai.backend.model_patcher import ModelPatcher
 from invokeai.backend.textual_inversion import TextualInversionModelRaw
 from invokeai.backend.model_manager import ModelType
 from invokeai.backend.model_patcher import ModelPatcher
 from invokeai.backend.stable_diffusion.diffusion.conditioning_data import (
    BasicConditioningInfo,
    ConditioningFieldData,
    ExtraConditioningInfo,
    SDXLConditioningInfo,
 )
 from invokeai.backend.textual_inversion import TextualInversionModelRaw
 from invokeai.backend.util.devices import torch_dtype
 from .baseinvocation import (
--- a/invokeai/app/services/config/config_base.py
+++ b/invokeai/app/services/config/config_base.py
@ -68,7 +68,7 @@ class InvokeAISettings(BaseSettings):
        return OmegaConf.to_yaml(conf)
    @classmethod
-    def add_parser_arguments(cls, parser) -> None:
+    def add_parser_arguments(cls, parser: ArgumentParser) -> None:
        """Dynamically create arguments for a settings parser."""
        if "type" in get_type_hints(cls):
            settings_stanza = get_args(get_type_hints(cls)["type"])[0]
--- a/invokeai/app/services/invocation_stats/invocation_stats_base.py
+++ b/invokeai/app/services/invocation_stats/invocation_stats_base.py
@ -29,8 +29,8 @@ writes to the system log is stored in InvocationServices.performance_statistics.
 """
 from abc import ABC, abstractmethod
 from contextlib import AbstractContextManager
 from pathlib import Path
 from typing import Iterator
 from invokeai.app.invocations.baseinvocation import BaseInvocation
 from invokeai.app.services.invocation_stats.invocation_stats_common import InvocationStatsSummary
@ -40,18 +40,17 @@ class InvocationStatsServiceBase(ABC):
    "Abstract base class for recording node memory/time performance statistics"
    @abstractmethod
-    def __init__(self):
+    def __init__(self) -> None:
        """
        Initialize the InvocationStatsService and reset counters to zero
        """
        pass
    @abstractmethod
    def collect_stats(
        self,
        invocation: BaseInvocation,
        graph_execution_state_id: str,
-    ) -> AbstractContextManager:
+    ) -> Iterator[None]:
        """
        Return a context object that will capture the statistics on the execution
        of the invocation. Use it in a `with` statement placed around the code that executes the invocation.
@ -61,7 +60,7 @@ class InvocationStatsServiceBase(ABC):
        pass
    @abstractmethod
-    def reset_stats(self, graph_execution_state_id: str):
+    def reset_stats(self, graph_execution_state_id: str) -> None:
        """
        Reset all statistics for the indicated graph.
        :param graph_execution_state_id: The id of the session whose stats to reset.
@ -70,7 +69,7 @@ class InvocationStatsServiceBase(ABC):
        pass
    @abstractmethod
-    def log_stats(self, graph_execution_state_id: str):
+    def log_stats(self, graph_execution_state_id: str) -> None:
        """
        Write out the accumulated statistics to the log or somewhere else.
        :param graph_execution_state_id: The id of the session whose stats to log.
--- a/invokeai/app/services/model_install/model_install_base.py
+++ b/invokeai/app/services/model_install/model_install_base.py
@ -14,7 +14,7 @@ from typing_extensions import Annotated
 from invokeai.app.services.config import InvokeAIAppConfig
 from invokeai.app.services.download import DownloadJob, DownloadQueueServiceBase
-from invokeai.app.services.events import EventServiceBase
+from invokeai.app.services.events.events_base import EventServiceBase
 from invokeai.app.services.invoker import Invoker
 from invokeai.app.services.model_records import ModelRecordServiceBase
 from invokeai.backend.model_manager import AnyModelConfig, ModelRepoVariant
--- a/invokeai/app/services/model_load/model_load_base.py
+++ b/invokeai/app/services/model_load/model_load_base.py
@ -5,7 +5,7 @@ from abc import ABC, abstractmethod
 from typing import Optional
 from invokeai.app.services.shared.invocation_context import InvocationContextData
-from invokeai.backend.model_manager import AnyModel, AnyModelConfig, BaseModelType, ModelType, SubModelType
+from invokeai.backend.model_manager import AnyModel, AnyModelConfig, SubModelType
 from invokeai.backend.model_manager.load import LoadedModel
 from invokeai.backend.model_manager.load.convert_cache import ModelConvertCacheBase
 from invokeai.backend.model_manager.load.model_cache.model_cache_base import ModelCacheBase
@ -15,23 +15,7 @@ class ModelLoadServiceBase(ABC):
    """Wrapper around AnyModelLoader."""
    @abstractmethod
-    def load_model_by_key(
+    def load_model(
        self,
        key: str,
        submodel_type: Optional[SubModelType] = None,
        context_data: Optional[InvocationContextData] = None,
    ) -> LoadedModel:
        """
        Given a model's key, load it and return the LoadedModel object.
        :param key: Key of model config to be fetched.
        :param submodel: For main (pipeline models), the submodel to fetch.
        :param context_data: Invocation context data used for event reporting
        """
        pass
    @abstractmethod
    def load_model_by_config(
        self,
        model_config: AnyModelConfig,
        submodel_type: Optional[SubModelType] = None,
@ -44,34 +28,6 @@ class ModelLoadServiceBase(ABC):
        :param submodel: For main (pipeline models), the submodel to fetch.
        :param context_data: Invocation context data used for event reporting
        """
        pass
    @abstractmethod
    def load_model_by_attr(
        self,
        model_name: str,
        base_model: BaseModelType,
        model_type: ModelType,
        submodel: Optional[SubModelType] = None,
        context_data: Optional[InvocationContextData] = None,
    ) -> LoadedModel:
        """
        Given a model's attributes, search the database for it and, if found, load and return the LoadedModel object.

        This is provided for API compatibility with the get_model() method
        in the original model manager. However, note that LoadedModel is
        not the same as the original ModelInfo that was returned.

        :param model_name: Name of the model to be fetched.
        :param base_model: Base model
        :param model_type: Type of the model
        :param submodel: For main (pipeline models), the submodel to fetch
        :param context_data: The invocation context data.

        Exceptions: UnknownModelException -- model with these attributes not known
                    NotImplementedException -- a model loader was not provided at initialization time
                    ValueError -- more than one model matches this combination
        """
    @property
    @abstractmethod
--- a/invokeai/app/services/model_load/model_load_default.py
+++ b/invokeai/app/services/model_load/model_load_default.py
@ -1,15 +1,18 @@
 # Copyright (c) 2024 Lincoln D. Stein and the InvokeAI Team
 """Implementation of model loader service."""
-from typing import Optional
+from typing import Optional, Type
 from invokeai.app.services.config import InvokeAIAppConfig
 from invokeai.app.services.invocation_processor.invocation_processor_common import CanceledException
 from invokeai.app.services.invoker import Invoker
 from invokeai.app.services.model_records import ModelRecordServiceBase, UnknownModelException
 from invokeai.app.services.shared.invocation_context import InvocationContextData
-from invokeai.backend.model_manager import AnyModel, AnyModelConfig, BaseModelType, ModelType, SubModelType
+from invokeai.backend.model_manager import AnyModel, AnyModelConfig, SubModelType
-from invokeai.backend.model_manager.load import AnyModelLoader, LoadedModel, ModelCache, ModelConvertCache
+from invokeai.backend.model_manager.load import (
    LoadedModel,
    ModelLoaderRegistry,
    ModelLoaderRegistryBase,
 )
 from invokeai.backend.model_manager.load.convert_cache import ModelConvertCacheBase
 from invokeai.backend.model_manager.load.model_cache.model_cache_base import ModelCacheBase
 from invokeai.backend.util.logging import InvokeAILogger
@ -18,25 +21,23 @@ from .model_load_base import ModelLoadServiceBase
 class ModelLoadService(ModelLoadServiceBase):
-    """Wrapper around AnyModelLoader."""
+    """Wrapper around ModelLoaderRegistry."""
    def __init__(
-            self,
+        self,
-            app_config: InvokeAIAppConfig,
+        app_config: InvokeAIAppConfig,
-            record_store: ModelRecordServiceBase,
+        ram_cache: ModelCacheBase[AnyModel],
-            ram_cache: ModelCacheBase[AnyModel],
+        convert_cache: ModelConvertCacheBase,
-            convert_cache: ModelConvertCacheBase,
+        registry: Optional[Type[ModelLoaderRegistryBase]] = ModelLoaderRegistry,
    ):
        """Initialize the model load service."""
        logger = InvokeAILogger.get_logger(self.__class__.__name__)
        logger.setLevel(app_config.log_level.upper())
-        self._store = record_store
+        self._logger = logger
-        self._any_loader = AnyModelLoader(
+        self._app_config = app_config
-            app_config=app_config,
+        self._ram_cache = ram_cache
-            logger=logger,
+        self._convert_cache = convert_cache
-            ram_cache=ram_cache,
+        self._registry = registry
            convert_cache=convert_cache,
        )
    def start(self, invoker: Invoker) -> None:
        self._invoker = invoker
@ -44,63 +45,14 @@ class ModelLoadService(ModelLoadServiceBase):
    @property
    def ram_cache(self) -> ModelCacheBase[AnyModel]:
        """Return the RAM cache used by this loader."""
-        return self._any_loader.ram_cache
+        return self._ram_cache
    @property
    def convert_cache(self) -> ModelConvertCacheBase:
        """Return the checkpoint convert cache used by this loader."""
-        return self._any_loader.convert_cache
+        return self._convert_cache
-    def load_model_by_key(
+    def load_model(
        self,
        key: str,
        submodel_type: Optional[SubModelType] = None,
        context_data: Optional[InvocationContextData] = None,
    ) -> LoadedModel:
        """
        Given a model's key, load it and return the LoadedModel object.
        :param key: Key of model config to be fetched.
        :param submodel: For main (pipeline models), the submodel to fetch.
        :param context: Invocation context used for event reporting
        """
        config = self._store.get_model(key)
        return self.load_model_by_config(config, submodel_type, context_data)
    def load_model_by_attr(
        self,
        model_name: str,
        base_model: BaseModelType,
        model_type: ModelType,
        submodel: Optional[SubModelType] = None,
        context_data: Optional[InvocationContextData] = None,
    ) -> LoadedModel:
        """
        Given a model's attributes, search the database for it and, if found, load and return the LoadedModel object.

        This is provided for API compatibility with the get_model() method
        in the original model manager. However, note that LoadedModel is
        not the same as the original ModelInfo that was returned.

        :param model_name: Name of the model to be fetched.
        :param base_model: Base model
        :param model_type: Type of the model
        :param submodel: For main (pipeline models), the submodel to fetch
        :param context_data: Invocation context data used for event reporting.

        Exceptions: UnknownModelException -- no model with these attributes is known
                    ValueError -- more than one model matches this combination
        """
        configs = self._store.search_by_attr(model_name, base_model, model_type)
        if len(configs) == 0:
            raise UnknownModelException(f"{base_model}/{model_type}/{model_name}: Unknown model")
        if len(configs) > 1:
            raise ValueError(f"{base_model}/{model_type}/{model_name}: More than one model matches.")
        # Forward context_data as well: without it the key-based loader has no
        # context to report load events for attribute-based lookups.
        return self.load_model_by_key(configs[0].key, submodel, context_data)
    def load_model_by_config(
        self,
        model_config: AnyModelConfig,
        submodel_type: Optional[SubModelType] = None,
@ -118,7 +70,15 @@ class ModelLoadService(ModelLoadServiceBase):
                context_data=context_data,
                model_config=model_config,
            )
-        loaded_model = self._any_loader.load_model(model_config, submodel_type)
+
        implementation, model_config, submodel_type = self._registry.get_implementation(model_config, submodel_type)  # type: ignore
        loaded_model: LoadedModel = implementation(
            app_config=self._app_config,
            logger=self._logger,
            ram_cache=self._ram_cache,
            convert_cache=self._convert_cache,
        ).load_model(model_config, submodel_type)
        if context_data:
            self._emit_load_event(
                context_data=context_data,
--- a/invokeai/app/services/model_manager/init.py
+++ b/invokeai/app/services/model_manager/init.py
@ -3,7 +3,7 @@
 from invokeai.backend.model_manager import AnyModel, AnyModelConfig, BaseModelType, ModelType, SubModelType
 from invokeai.backend.model_manager.load import LoadedModel
-from .model_manager_default import ModelManagerServiceBase, ModelManagerService
+from .model_manager_default import ModelManagerService, ModelManagerServiceBase
 __all__ = [
    "ModelManagerServiceBase",
--- a/invokeai/app/services/model_manager/model_manager_base.py
+++ b/invokeai/app/services/model_manager/model_manager_base.py
@ -1,10 +1,14 @@
 # Copyright (c) 2023 Lincoln D. Stein and the InvokeAI Team
 from abc import ABC, abstractmethod
 from typing import Optional
 from typing_extensions import Self
 from invokeai.app.services.invoker import Invoker
 from invokeai.app.services.shared.invocation_context import InvocationContextData
 from invokeai.backend.model_manager.config import AnyModelConfig, BaseModelType, ModelType, SubModelType
 from invokeai.backend.model_manager.load.load_base import LoadedModel
 from ..config import InvokeAIAppConfig
 from ..download import DownloadQueueServiceBase
@ -65,3 +69,32 @@ class ModelManagerServiceBase(ABC):
    @abstractmethod
    def stop(self, invoker: Invoker) -> None:
        pass
    @abstractmethod
    def load_model_by_config(
        self,
        model_config: AnyModelConfig,
        submodel_type: Optional[SubModelType] = None,
        context_data: Optional[InvocationContextData] = None,
    ) -> LoadedModel:
        """
        Load the model described by a configuration record.

        :param model_config: Configuration of the model to load.
        :param submodel_type: For main (pipeline) models, the submodel to fetch.
        :param context_data: Invocation context data used for event reporting.
        """
    @abstractmethod
    def load_model_by_key(
        self,
        key: str,
        submodel_type: Optional[SubModelType] = None,
        context_data: Optional[InvocationContextData] = None,
    ) -> LoadedModel:
        """
        Load the model whose configuration is stored under the given key.

        :param key: Key of the model config to be fetched.
        :param submodel_type: For main (pipeline) models, the submodel to fetch.
        :param context_data: Invocation context data used for event reporting.
        """
    @abstractmethod
    def load_model_by_attr(
        self,
        model_name: str,
        base_model: BaseModelType,
        model_type: ModelType,
        submodel: Optional[SubModelType] = None,
        context_data: Optional[InvocationContextData] = None,
    ) -> LoadedModel:
        """
        Load the model identified by its name, base model and type.

        :param model_name: Name of the model to be fetched.
        :param base_model: Base model.
        :param model_type: Type of the model.
        :param submodel: For main (pipeline) models, the submodel to fetch.
        :param context_data: Invocation context data used for event reporting.
        """
--- a/invokeai/app/services/model_manager/model_manager_default.py
+++ b/invokeai/app/services/model_manager/model_manager_default.py
@ -1,10 +1,14 @@
 # Copyright (c) 2023 Lincoln D. Stein and the InvokeAI Team
 """Implementation of ModelManagerServiceBase."""
 from typing import Optional
 from typing_extensions import Self
 from invokeai.app.services.invoker import Invoker
-from invokeai.backend.model_manager.load import ModelCache, ModelConvertCache
+from invokeai.app.services.shared.invocation_context import InvocationContextData
 from invokeai.backend.model_manager import AnyModelConfig, BaseModelType, LoadedModel, ModelType, SubModelType
 from invokeai.backend.model_manager.load import ModelCache, ModelConvertCache, ModelLoaderRegistry
 from invokeai.backend.util.logging import InvokeAILogger
 from ..config import InvokeAIAppConfig
@ -12,7 +16,7 @@ from ..download import DownloadQueueServiceBase
 from ..events.events_base import EventServiceBase
 from ..model_install import ModelInstallService, ModelInstallServiceBase
 from ..model_load import ModelLoadService, ModelLoadServiceBase
-from ..model_records import ModelRecordServiceBase
+from ..model_records import ModelRecordServiceBase, UnknownModelException
 from .model_manager_base import ModelManagerServiceBase
@ -58,6 +62,56 @@ class ModelManagerService(ModelManagerServiceBase):
            if hasattr(service, "stop"):
                service.stop(invoker)
    def load_model_by_config(
        self,
        model_config: AnyModelConfig,
        submodel_type: Optional[SubModelType] = None,
        context_data: Optional[InvocationContextData] = None,
    ) -> LoadedModel:
        """
        Load the model described by ``model_config`` via the load service.

        :param model_config: Configuration of the model to load.
        :param submodel_type: For main (pipeline) models, the submodel to fetch.
        :param context_data: Invocation context data, passed through to the loader.
        """
        loader = self.load
        return loader.load_model(model_config, submodel_type, context_data)
    def load_model_by_key(
        self,
        key: str,
        submodel_type: Optional[SubModelType] = None,
        context_data: Optional[InvocationContextData] = None,
    ) -> LoadedModel:
        """
        Look up a model config by key in the record store, then load it.

        :param key: Key of the model config to be fetched.
        :param submodel_type: For main (pipeline) models, the submodel to fetch.
        :param context_data: Invocation context data, passed through to the loader.
        """
        model_config = self.store.get_model(key)
        return self.load.load_model(model_config, submodel_type, context_data)
    def load_model_by_attr(
        self,
        model_name: str,
        base_model: BaseModelType,
        model_type: ModelType,
        submodel: Optional[SubModelType] = None,
        context_data: Optional[InvocationContextData] = None,
    ) -> LoadedModel:
        """
        Search the record store for a model by its attributes and load it.

        This exists for API compatibility with the get_model() method of the
        original model manager. Note that the returned LoadedModel is not the
        same as the ModelInfo object the original method returned.

        :param model_name: Name of the model to be fetched.
        :param base_model: Base model.
        :param model_type: Type of the model.
        :param submodel: For main (pipeline) models, the submodel to fetch.
        :param context_data: Invocation context data, passed through to the loader.

        Exceptions: UnknownModelException -- no model matches these attributes
                    ValueError -- more than one model matches this combination
        """
        matches = self.store.search_by_attr(model_name, base_model, model_type)
        match_count = len(matches)
        # Exactly one match is required; reject the two failure cases up front.
        if match_count == 0:
            raise UnknownModelException(f"{base_model}/{model_type}/{model_name}: Unknown model")
        if match_count > 1:
            raise ValueError(f"{base_model}/{model_type}/{model_name}: More than one model matches.")
        return self.load.load_model(matches[0], submodel, context_data)
    @classmethod
    def build_model_manager(
        cls,
@ -82,9 +136,9 @@ class ModelManagerService(ModelManagerServiceBase):
        )
        loader = ModelLoadService(
            app_config=app_config,
            record_store=model_record_service,
            ram_cache=ram_cache,
            convert_cache=convert_cache,
            registry=ModelLoaderRegistry,
        )
        installer = ModelInstallService(
            app_config=app_config,
--- a/invokeai/app/services/shared/invocation_context.py
+++ b/invokeai/app/services/shared/invocation_context.py
@ -281,7 +281,7 @@ class ModelsInterface(InvocationContextInterface):
        # The model manager emits events as it loads the model. It needs the context data to build
        # the event payloads.
-        return self._services.model_manager.load.load_model_by_key(
+        return self._services.model_manager.load_model_by_key(
            key=key, submodel_type=submodel_type, context_data=self._context_data
        )
@ -296,7 +296,7 @@ class ModelsInterface(InvocationContextInterface):
        :param model_type: Type of the model
        :param submodel: For main (pipeline models), the submodel to fetch
        """
-        return self._services.model_manager.load.load_model_by_attr(
+        return self._services.model_manager.load_model_by_attr(
            model_name=model_name,
            base_model=base_model,
            model_type=model_type,
--- a/invokeai/backend/install/migrate_to_3.py
+++ b/invokeai/backend/install/migrate_to_3.py
@ -1,591 +0,0 @@
 """
 Migrate the models directory and models.yaml file from an existing
 InvokeAI 2.3 installation to 3.0.0.
 """
 import argparse
 import os
 import shutil
 import warnings
 from dataclasses import dataclass
 from pathlib import Path
 from typing import Union
 import diffusers
 import transformers
 import yaml
 from diffusers import AutoencoderKL, StableDiffusionPipeline
 from diffusers.pipelines.stable_diffusion.safety_checker import StableDiffusionSafetyChecker
 from omegaconf import DictConfig, OmegaConf
 from transformers import AutoFeatureExtractor, BertTokenizerFast, CLIPTextModel, CLIPTokenizer
 import invokeai.backend.util.logging as logger
 from invokeai.app.services.config import InvokeAIAppConfig
 from invokeai.backend.model_management import ModelManager
 from invokeai.backend.model_management.model_probe import BaseModelType, ModelProbe, ModelProbeInfo, ModelType
 # Module-level side effects: suppress all Python warnings and limit the
 # transformers and diffusers loggers to error-level output.
 warnings.filterwarnings("ignore")
 transformers.logging.set_verbosity_error()
 diffusers.logging.set_verbosity_error()
 # holder for paths that we will migrate
@dataclass
 class ModelPaths:
    """Holder for the source paths that will be migrated."""

    # Old models directory; files located beneath it are copied into the new models tree.
    models: Path
    # Directories scanned for models by MigrateTo3.migrate_tuning_models().
    embeddings: Path
    loras: Path
    controlnets: Path
 class MigrateTo3(object):
    def __init__(
        self,
        from_root: Path,
        to_models: Path,
        model_manager: ModelManager,
        src_paths: ModelPaths,
    ):
        """
        Store the migration endpoints.

        :param from_root: Root directory of the installation being migrated.
        :param to_models: Destination models directory.
        :param model_manager: Model manager used to check for and register models.
        :param src_paths: Source directories to migrate from.
        """
        self.src_paths = src_paths
        self.mgr = model_manager
        self.dest_models = to_models
        self.root_directory = from_root
    @classmethod
    def initialize_yaml(cls, yaml_file: Path):
        """
        Overwrite ``yaml_file`` with a document holding only the version metadata.

        :param yaml_file: Path of the YAML file to (re)create.
        """
        header = {"__metadata__": {"version": "3.0.0"}}
        with open(yaml_file, "w") as stream:
            stream.write(yaml.dump(header))
    def create_directory_structure(self):
        """
        Create the skeleton of the destination models folder.

        One ``<base>/<type>`` directory is created for every combination of
        the two Stable Diffusion base models and the five model types listed
        below, followed by a top-level ``core`` directory. Existing
        directories are left untouched.
        """
        bases = (BaseModelType.StableDiffusion1, BaseModelType.StableDiffusion2)
        kinds = (
            ModelType.Main,
            ModelType.Vae,
            ModelType.Lora,
            ModelType.ControlNet,
            ModelType.TextualInversion,
        )
        targets = [self.dest_models / base.value / kind.value for base in bases for kind in kinds]
        targets.append(self.dest_models / "core")
        for target in targets:
            target.mkdir(parents=True, exist_ok=True)
    @staticmethod
    def copy_file(src: Path, dest: Path):
        """
        Copy a single file, logging what happens.

        Nothing is copied when ``dest`` already exists. A failed copy is
        logged as an error and not re-raised.

        :param src: File to copy.
        :param dest: Destination path.
        """
        if not dest.exists():
            logger.info(f"Copying {str(src)} to {str(dest)}")
            try:
                shutil.copy(src, dest)
            except Exception as err:
                # Best effort: report the failure and carry on.
                logger.error(f"COPY FAILED: {str(err)}")
        else:
            logger.info(f"Skipping existing {str(dest)}")
    @staticmethod
    def copy_dir(src: Path, dest: Path):
        """
        Recursively copy a directory tree, logging what happens.

        Nothing is copied when ``dest`` already exists. A failed copy is
        logged as an error and not re-raised.

        :param src: Directory to copy.
        :param dest: Destination path.
        """
        if not dest.exists():
            logger.info(f"Copying {str(src)} to {str(dest)}")
            try:
                shutil.copytree(src, dest)
            except Exception as err:
                # Best effort: report the failure and carry on.
                logger.error(f"COPY FAILED: {str(err)}")
        else:
            logger.info(f"Skipping existing {str(dest)}")
    def migrate_models(self, src_dir: Path):
        """
        Walk ``src_dir`` recursively (following symlinks) and copy every model found.

        Each directory and file is probed; anything the probe recognizes is
        copied to the destination subdirectory chosen by
        ``_model_probe_to_path``. Errors on an individual entry are logged and
        the walk continues.

        :param src_dir: Directory tree to scan.
        """
        copied_dirs = set()
        for root, dirs, files in os.walk(src_dir, followlinks=True):
            for dirname in dirs:
                try:
                    candidate = Path(root, dirname)
                    probe = ModelProbe().heuristic_probe(candidate)
                    if probe:
                        self.copy_dir(candidate, self._model_probe_to_path(probe) / candidate.name)
                        copied_dirs.add(candidate)
                except KeyboardInterrupt:
                    raise
                except Exception as err:
                    logger.error(str(err))
            for filename in files:
                try:
                    # Raw learned_embeds.bin / pytorch_lora_weights.bin files are never
                    # copied on their own; they travel as part of a directory copy.
                    if filename in {"learned_embeds.bin", "pytorch_lora_weights.bin"}:
                        continue
                    candidate = Path(root, filename)
                    # Files directly inside a directory that was copied as a model
                    # have already been handled by that tree copy.
                    if candidate.parent in copied_dirs:
                        continue
                    probe = ModelProbe().heuristic_probe(candidate)
                    if probe:
                        self.copy_file(candidate, self._model_probe_to_path(probe) / filename)
                except KeyboardInterrupt:
                    raise
                except Exception as err:
                    logger.error(str(err))
    def migrate_support_models(self):
        """
        Copy the clipseg, upscaler, and face restoration models to their new
        locations under ``core`` in the destination models directory.

        Source directories that do not exist are silently skipped.
        """
        new_root = self.dest_models
        relocations = (
            ("models/clipseg", "core/misc/clipseg"),
            ("models/realesrgan", "core/upscaling/realesrgan"),
        )
        for old_rel, new_rel in relocations:
            if (self.root_directory / old_rel).exists():
                self.copy_dir(self.root_directory / old_rel, new_root / new_rel)
        for restorer in ["codeformer", "gfpgan"]:
            old_dir = self.root_directory / "models" / restorer
            if not old_dir.exists():
                continue
            self.copy_dir(old_dir, new_root / f"core/face_restoration/{restorer}")
    def migrate_tuning_models(self):
        """
        Migrate the embeddings, loras and controlnets directories to their new homes.

        Unset (falsy) source paths are skipped silently; paths that are not
        directories are skipped with a log message.
        """
        sources = (self.src_paths.embeddings, self.src_paths.loras, self.src_paths.controlnets)
        for source in sources:
            if not source:
                continue
            if not source.is_dir():
                logger.info(f"{source} directory not found; skipping")
                continue
            logger.info(f"Scanning {source}")
            self.migrate_models(source)
    def migrate_conversion_models(self):
        """
        Migrate all the models that are needed by the ckpt_to_diffusers conversion
        script.

        Every model is loaded with the old root's ``models/hub`` directory as
        cache and saved beneath ``<dest_models>/core/convert``. Any exception
        other than KeyboardInterrupt is logged and ends the migration of the
        remaining conversion models without propagating.
        """
        dest_directory = self.dest_models
        kwargs = {
            "cache_dir": self.root_directory / "models/hub",
        }

        try:
            logger.info("Migrating core tokenizers and text encoders")
            target_dir = dest_directory / "core" / "convert"

            self._migrate_pretrained(
                BertTokenizerFast, repo_id="bert-base-uncased", dest=target_dir / "bert-base-uncased", **kwargs
            )

            # sd-1
            repo_id = "openai/clip-vit-large-patch14"
            self._migrate_pretrained(
                CLIPTokenizer, repo_id=repo_id, dest=target_dir / "clip-vit-large-patch14", **kwargs
            )
            # The text encoder shares the tokenizer's directory, which exists by now,
            # so force=True is required or the save would be skipped.
            self._migrate_pretrained(
                CLIPTextModel, repo_id=repo_id, dest=target_dir / "clip-vit-large-patch14", force=True, **kwargs
            )

            # sd-2
            repo_id = "stabilityai/stable-diffusion-2"
            self._migrate_pretrained(
                CLIPTokenizer,
                repo_id=repo_id,
                dest=target_dir / "stable-diffusion-2-clip" / "tokenizer",
                **{"subfolder": "tokenizer", **kwargs},
            )
            self._migrate_pretrained(
                CLIPTextModel,
                repo_id=repo_id,
                dest=target_dir / "stable-diffusion-2-clip" / "text_encoder",
                **{"subfolder": "text_encoder", **kwargs},
            )

            # VAE
            logger.info("Migrating stable diffusion VAE")
            self._migrate_pretrained(
                AutoencoderKL, repo_id="stabilityai/sd-vae-ft-mse", dest=target_dir / "sd-vae-ft-mse", **kwargs
            )

            # safety checking
            logger.info("Migrating safety checker")
            repo_id = "CompVis/stable-diffusion-safety-checker"
            self._migrate_pretrained(
                AutoFeatureExtractor, repo_id=repo_id, dest=target_dir / "stable-diffusion-safety-checker", **kwargs
            )
            # Same situation as the CLIP text encoder above: the feature extractor
            # has just created this directory, so without force=True the checker
            # itself would be skipped and never written.
            self._migrate_pretrained(
                StableDiffusionSafetyChecker,
                repo_id=repo_id,
                dest=target_dir / "stable-diffusion-safety-checker",
                force=True,
                **kwargs,
            )
        except KeyboardInterrupt:
            raise
        except Exception as e:
            logger.error(str(e))
    def _model_probe_to_path(self, info: ModelProbeInfo) -> Path:
        """Return ``<dest_models>/<base type>/<model type>`` for the probed model."""
        base_dir = Path(self.dest_models) / info.base_type.value
        return base_dir / info.model_type.value
    def _migrate_pretrained(self, model_class, repo_id: str, dest: Path, force: bool = False, **kwargs):
        """
        Load a pretrained model and save it at ``dest``.

        :param model_class: Class whose ``from_pretrained`` is used to load the model.
        :param repo_id: Repository id passed to ``from_pretrained``.
        :param dest: Destination directory.
        :param force: When true, save even if ``dest`` already exists.
        :param kwargs: Extra keyword arguments forwarded to ``from_pretrained``.
        """
        if not dest.exists() or force:
            loaded = model_class.from_pretrained(repo_id, **kwargs)
            self._save_pretrained(loaded, dest, overwrite=force)
            return
        logger.info(f"Skipping existing {dest}")
    def _save_pretrained(self, model, dest: Path, overwrite: bool = False):
        """
        Save ``model`` at ``dest`` in safetensors format.

        :param model: Object exposing ``save_pretrained``.
        :param dest: Destination directory.
        :param overwrite: When true, save directly into ``dest``. Otherwise save
            into a sibling ``<name>.downloading`` directory and rename it to
            ``dest`` once the save has finished.
        """
        if overwrite:
            model.save_pretrained(dest, safe_serialization=True)
            return
        staging = dest.with_name(f"{dest.name}.downloading")
        model.save_pretrained(staging, safe_serialization=True)
        staging.replace(dest)
    def _download_vae(self, repo_id: str, subfolder: str = None) -> Path:
        """
        Load a VAE from ``repo_id`` and save it into the destination models tree.

        :param repo_id: Repository id of the form ``owner/name``.
        :param subfolder: Optional subfolder forwarded to ``from_pretrained``.
        :return: Directory the VAE was saved to.
        """
        hub_cache = self.root_directory / "models/hub"
        vae = AutoencoderKL.from_pretrained(repo_id, cache_dir=hub_cache, subfolder=subfolder)
        info = ModelProbe().heuristic_probe(vae)
        # Unpacking enforces exactly one "/" in the repo id.
        _owner, model_name = repo_id.split("/")
        target_name = self.unique_name(model_name, info)
        dest = self._model_probe_to_path(info) / target_name
        vae.save_pretrained(dest, safe_serialization=True)
        return dest
    def _vae_path(self, vae: Union[str, dict]) -> Path:
        """
        Convert a 2.3 VAE stanza to a straight path.

        :param vae: Either a path string, or a DictConfig stanza carrying a
            ``path`` or a ``repo_id`` (plus optional ``subfolder``) entry.
        :return: Path of the VAE. VAEs that end up inside the destination
            models directory are returned relative to it, prefixed with
            ``models``; VAEs outside the old models directory are left where
            they are and returned unchanged.
        :raises AssertionError: if no path can be derived from ``vae``.
        """
        vae_path = None
        # First get a path
        if isinstance(vae, str):
            vae_path = vae
        elif isinstance(vae, DictConfig):
            if p := vae.get("path"):
                vae_path = p
            elif repo_id := vae.get("repo_id"):
                if repo_id == "stabilityai/sd-vae-ft-mse":  # this guy is already downloaded
                    # Wrap in Path so this exit honours the declared return type
                    # like every other exit of the method.
                    return Path("models/core/convert/sd-vae-ft-mse")
                vae_path = self._download_vae(repo_id, vae.get("subfolder"))

        assert vae_path is not None, "Couldn't find VAE for this model"

        # if the VAE is in the old models directory, then we must move it into the new
        # one. VAEs outside of this directory can stay where they are.
        vae_path = Path(vae_path)
        if vae_path.is_relative_to(self.src_paths.models):
            info = ModelProbe().heuristic_probe(vae_path)
            dest = self._model_probe_to_path(info) / vae_path.name
            if not dest.exists():
                if vae_path.is_dir():
                    self.copy_dir(vae_path, dest)
                else:
                    self.copy_file(vae_path, dest)
            vae_path = dest

        if vae_path.is_relative_to(self.dest_models):
            rel_path = vae_path.relative_to(self.dest_models)
            return Path("models", rel_path)
        return vae_path
    def migrate_repo_id(self, repo_id: str, model_name: str = None, **extra_config):
        """
        Migrate a locally-cached diffusers pipeline identified with a repo_id.

        Returns without doing anything when the hub cache holds no snapshot
        with a ``model_index.json`` for the repo, when the pipeline cannot be
        probed, or when a model of the same name, base and type already exists.

        :param repo_id: Repository id of the form ``owner/name``.
        :param model_name: Name to register the model under; defaults to the repo name.
        :param extra_config: Extra settings forwarded to ``_add_model``.
        """
        models_root = self.dest_models
        hub_cache = self.root_directory / "models/hub"
        load_options = {
            "cache_dir": hub_cache,
            "safety_checker": None,
        }

        owner, repo_name = repo_id.split("/")
        model_name = model_name or repo_name
        cached_repo = hub_cache / "--".join(["models", owner, repo_name])

        if not any(cached_repo.glob("snapshots/**/model_index.json")):
            return

        revisions = [ref.name for ref in cached_repo.glob("refs/*")]

        # if an fp16 is available we use that
        # NOTE: revisions[0] raises IndexError when the refs directory is empty.
        if len(revisions) > 1 and "fp16" in revisions:
            revision = "fp16"
        else:
            revision = revisions[0]
        pipeline = StableDiffusionPipeline.from_pretrained(repo_id, revision=revision, **load_options)

        info = ModelProbe().heuristic_probe(pipeline)
        if not info:
            return

        if self.mgr.model_exists(model_name, info.base_type, info.model_type):
            logger.warning(f"A model named {model_name} already exists at the destination. Skipping migration.")
            return

        saved_to = self._model_probe_to_path(info) / model_name
        self._save_pretrained(pipeline, saved_to)

        self._add_model(model_name, info, Path("models", saved_to.relative_to(models_root)), **extra_config)
    def migrate_path(self, location: Path, model_name: str = None, **extra_config):
        """
        Migrate a model that models.yaml references through 'weights' or 'path'.

        :param location: Location of the model; joined onto the root directory
        :param model_name: Name to register the model under; defaults to the stem of the location
        :param extra_config: Additional attributes passed through to ``_add_model()``

        Returns without doing anything when the location cannot be probed or
        when a model of the same name/base/type already exists.
        """
        # handle relative paths
        location = self.root_directory / location
        if not model_name:
            model_name = location.stem

        info = ModelProbe().heuristic_probe(location)
        if not info:
            return
        if self.mgr.model_exists(model_name, info.base_type, info.model_type):
            logger.warning(f"A model named {model_name} already exists at the destination. Skipping migration.")
            return

        # uh oh, weights is in the old models directory - move it into the new one
        if Path(location).is_relative_to(self.src_paths.models):
            subpath = (info.base_type.value, info.model_type.value, location.name)
            dest = Path(self.dest_models, *subpath)
            copy = self.copy_dir if location.is_dir() else self.copy_file
            copy(location, dest)
            # from here on refer to the copy, relative to the "models" directory
            location = Path("models", *subpath)

        self._add_model(model_name, info, location, **extra_config)
    def _add_model(self, model_name: str, info: ModelProbeInfo, location: Path, **extra_config):
        """
        Register a migrated model with the model manager.

        Only models probed as ``ModelType.Main`` are registered; any other
        type is silently ignored. Entries in ``extra_config`` are merged last
        and therefore override the attributes derived from ``info``.
        """
        if info.model_type != ModelType.Main:
            return

        attributes = {
            "path": str(location),
            "description": f"A {info.base_type.value} {info.model_type.value} model",
            "model_format": info.format,
            "variant": info.variant_type.value,
        }
        attributes.update(extra_config)

        self.mgr.add_model(
            model_name=model_name,
            base_model=info.base_type,
            model_type=info.model_type,
            clobber=True,
            model_attributes=attributes,
        )
    def migrate_defined_models(self):
        """
        Migrate every model stanza found in the old configs/models.yaml.

        For each stanza the optional 'vae', 'config' and 'description' entries
        are collected and passed through to the migration call. The stanza is
        then migrated by 'repo_id', 'weights' or 'path', whichever is set
        first in that order. A failure while migrating one stanza is logged
        and does not stop the others; KeyboardInterrupt is re-raised.
        """
        # find any models referred to in old models.yaml
        legacy_conf = OmegaConf.load(self.root_directory / "configs/models.yaml")
        for model_name, stanza in legacy_conf.items():
            try:
                passthru_args = {}

                vae = stanza.get("vae")
                if vae:
                    # a missing VAE is not fatal: warn and migrate the model without it
                    try:
                        passthru_args["vae"] = str(self._vae_path(vae))
                    except Exception as e:
                        logger.warning(f'Could not find a VAE matching "{vae}" for model "{model_name}"')
                        logger.warning(str(e))

                for option in ("config", "description"):
                    setting = stanza.get(option)
                    if setting:
                        passthru_args[option] = setting

                repo_id = stanza.get("repo_id")
                if repo_id:
                    logger.info(f"Migrating diffusers model {model_name}")
                    self.migrate_repo_id(repo_id, model_name, **passthru_args)
                    continue

                weights = stanza.get("weights")
                if weights:
                    logger.info(f"Migrating checkpoint model {model_name}")
                    self.migrate_path(Path(weights), model_name, **passthru_args)
                    continue

                path = stanza.get("path")
                if path:
                    logger.info(f"Migrating diffusers model {model_name}")
                    self.migrate_path(Path(path), model_name, **passthru_args)
            except KeyboardInterrupt:
                raise
            except Exception as e:
                logger.error(str(e))
    def migrate(self):
        """
        Run the whole migration: create the destination directory structure,
        then migrate the support, conversion, tuning and models.yaml-defined
        models, in that order.
        """
        steps = (
            self.create_directory_structure,
            # the configure script is doing this
            self.migrate_support_models,
            self.migrate_conversion_models,
            self.migrate_tuning_models,
            self.migrate_defined_models,
        )
        for step in steps:
            step()
 def _parse_legacy_initfile(root: Path, initfile: Path) -> ModelPaths:
    """
    Read the model directories configured in a legacy init file.

    The file is fed to argparse through its "@file" mechanism. Only the
    embedding (--embedding_directory / --embedding_path) and LoRA
    (--lora_directory) options are recognized; every other option is ignored.

    Returns a ModelPaths whose entries are all joined onto `root`. The models
    and controlnets entries are always "models" and "controlnets".
    """
    init_parser = argparse.ArgumentParser(fromfile_prefix_chars="@")
    init_parser.add_argument(
        "--embedding_directory",
        "--embedding_path",
        dest="embedding_path",
        type=Path,
        default=Path("embeddings"),
    )
    init_parser.add_argument("--lora_directory", dest="lora_path", type=Path, default=Path("loras"))
    known, _ignored = init_parser.parse_known_args([f"@{str(initfile)}"])

    # values may have been written with surrounding double quotes in the init file
    embedding_dir = str(known.embedding_path).strip('"')
    lora_dir = str(known.lora_path).strip('"')

    return ModelPaths(
        models=root / "models",
        embeddings=root / embedding_dir,
        loras=root / lora_dir,
        controlnets=root / "controlnets",
    )
 def _parse_legacy_yamlfile(root: Path, initfile: Path) -> ModelPaths:
    """
    Read the model directories from the InvokeAI.Paths section of a yaml
    configuration file.

    Returns a ModelPaths whose entries are joined onto `root`. An entry whose
    configured value is empty is set to None; an entry that is missing from
    the file falls back to its default directory name.
    """
    # Don't use the config object because it is unforgiving of version updates
    # Just use omegaconf directly
    configured = OmegaConf.load(initfile).InvokeAI.Paths

    def under_root(key, default):
        directory = configured.get(key, default)
        return root / directory if directory else None

    return ModelPaths(
        models=under_root("models_dir", "models"),
        embeddings=under_root("embedding_dir", "embeddings"),
        loras=under_root("lora_dir", "loras"),
        controlnets=under_root("controlnet_dir", "controlnets"),
    )
 def get_legacy_embeddings(root: Path) -> ModelPaths:
    """
    Locate the configuration file in `root` and return the model paths it
    defines.

    "invokeai.init" takes precedence over "invokeai.yaml". Returns None when
    neither file exists.
    """
    initfile = root / "invokeai.init"
    if initfile.exists():
        return _parse_legacy_initfile(root, initfile)

    yamlfile = root / "invokeai.yaml"
    if yamlfile.exists():
        return _parse_legacy_yamlfile(root, yamlfile)

    return None
 def do_migrate(src_directory: Path, dest_directory: Path):
    """
    Migrate models from src to dest InvokeAI root directories

    The new configuration and models tree are first built under the temporary
    names "configs/models.yaml.3" and "models.3" inside `dest_directory`.
    Once the migration has run, the previous files are moved aside as
    "models.orig" / "configs/models.yaml.orig" under `src_directory` and the
    temporary names are renamed to their final ones.
    """
    config_file = dest_directory / "configs" / "models.yaml.3"
    dest_models = dest_directory / "models.3"
    version_3 = (dest_directory / "models" / "core").exists()
    # Here we create the destination models.yaml file.
    # If we are writing into a version 3 directory and the
    # file already exists, then we write into a copy of it to
    # avoid deleting its previous customizations. Otherwise we
    # create a new empty one.
    if version_3:  # write into the dest directory
        try:
            shutil.copy(dest_directory / "configs" / "models.yaml", config_file)
        except Exception:
            MigrateTo3.initialize_yaml(config_file)
        mgr = ModelManager(config_file)  # important to initialize BEFORE moving the models directory
        (dest_directory / "models").replace(dest_models)
    else:
        MigrateTo3.initialize_yaml(config_file)
        mgr = ModelManager(config_file)
    paths = get_legacy_embeddings(src_directory)
    migrator = MigrateTo3(from_root=src_directory, to_models=dest_models, model_manager=mgr, src_paths=paths)
    migrator.migrate()
    print("Migration successful.")
    # Report the paths the backups were actually moved to. The messages used
    # to name dest_directory although the files go under src_directory, which
    # is misleading whenever the two roots differ.
    if not version_3:
        models_backup = src_directory / "models.orig"
        (dest_directory / "models").replace(models_backup)
        print(f"Original models directory moved to {models_backup}")
    yaml_backup = src_directory / "configs" / "models.yaml.orig"
    (dest_directory / "configs" / "models.yaml").replace(yaml_backup)
    print(f"Original models.yaml file moved to {yaml_backup}")
    # drop the temporary ".3" suffix from the freshly built config and models tree
    config_file.replace(config_file.with_suffix(""))
    dest_models.replace(dest_models.with_suffix(""))
 def main():
    """
    Command-line entry point for the migration script.

    Parses --from-directory / --to-directory, validates both roots,
    initializes the destination root when it is not set up yet and then runs
    do_migrate(). Invalid arguments are reported through the argument parser,
    which prints the usage message and exits.
    """
    parser = argparse.ArgumentParser(
        prog="invokeai-migrate3",
        description="""
 This will copy and convert the models directory and the configs/models.yaml from the InvokeAI 2.3 format
 '--from-directory' root to the InvokeAI 3.0 '--to-directory' root. These may be abbreviated '--from' and '--to'.
 The old models directory and config file will be renamed 'models.orig' and 'models.yaml.orig' respectively.
 It is safe to provide the same directory for both arguments, but it is better to use the invokeai_configure
 script, which will perform a full upgrade in place.""",
    )
    parser.add_argument(
        "--from-directory",
        dest="src_root",
        type=Path,
        required=True,
        help='Source InvokeAI 2.3 root directory (containing "invokeai.init" or "invokeai.yaml")',
    )
    parser.add_argument(
        "--to-directory",
        dest="dest_root",
        type=Path,
        required=True,
        help='Destination InvokeAI 3.0 directory (containing "invokeai.yaml")',
    )
    args = parser.parse_args()
    src_root = args.src_root
    dest_root = args.dest_root

    # Validate explicitly instead of with `assert`: assertions are removed when
    # Python runs with -O, which would silently skip these checks.
    if not src_root.is_dir():
        parser.error(f"{src_root} is not a valid directory")
    if not (src_root / "models").is_dir():
        parser.error(f"{src_root} does not contain a 'models' subdirectory")
    if not (src_root / "models" / "hub").exists():
        parser.error(f"{src_root} does not contain a version 2.3 models directory")
    if not ((src_root / "invokeai.init").exists() or (src_root / "invokeai.yaml").exists()):
        parser.error(f"{src_root} does not contain an InvokeAI init file.")
    if not dest_root.is_dir():
        parser.error(f"{dest_root} is not a valid directory")

    config = InvokeAIAppConfig.get_config()
    config.parse_args(["--root", str(dest_root)])
    # TODO: revisit - don't rely on invokeai.yaml to exist yet!
    dest_is_setup = (dest_root / "models/core").exists() and (dest_root / "databases").exists()
    if not dest_is_setup:
        from invokeai.backend.install.invokeai_configure import initialize_rootdir

        initialize_rootdir(dest_root, True)
    do_migrate(src_root, dest_root)
 # Run the migration only when this file is executed as a script, not on import.
 if __name__ == "__main__":
    main()
--- a/invokeai/backend/install/model_install_backend.py
+++ b/invokeai/backend/install/model_install_backend.py
@ -1,637 +0,0 @@
 """
 Utility (backend) functions used by model_install.py
 """
 import os
 import re
 import shutil
 import warnings
 from dataclasses import dataclass, field
 from pathlib import Path
 from tempfile import TemporaryDirectory
 from typing import Callable, Dict, List, Optional, Set, Union
 import requests
 import torch
 from diffusers import DiffusionPipeline
 from diffusers import logging as dlogging
 from huggingface_hub import HfApi, HfFolder, hf_hub_url
 from omegaconf import OmegaConf
 from tqdm import tqdm
 import invokeai.configs as configs
 from invokeai.app.services.config import InvokeAIAppConfig
 from invokeai.backend.model_management import AddModelResult, BaseModelType, ModelManager, ModelType, ModelVariantType
 from invokeai.backend.model_management.model_probe import ModelProbe, ModelProbeInfo, SchedulerPredictionType
 from invokeai.backend.util import download_with_resume
 from invokeai.backend.util.devices import choose_torch_device, torch_dtype
 from ..util.logging import InvokeAILogger
 warnings.filterwarnings("ignore")
 # --------------------------globals-----------------------
 # Application configuration and logger, both obtained once at import time.
 config = InvokeAIAppConfig.get_config()
 logger = InvokeAILogger.get_logger(name="InvokeAI")
 # the initial "configs" dir is now bundled in the `invokeai.configs` package
 Dataset_path = Path(configs.__path__[0]) / "INITIAL_MODELS.yaml"
 # Comment header text for a models configuration file.
 # NOTE(review): not referenced in the visible part of this module - confirm where it is used.
 Config_preamble = """
 # This file describes the alternative machine learning models
 # available to InvokeAI script.
 #
 # To add a new model, follow the examples below. Each
 # model requires a model config file, a weights file,
 # and the width and height of the images it
 # was trained on.
 """
 # Legacy checkpoint configuration file names.
 # SD-1 / SD-2:        base model -> variant -> scheduler prediction type -> file name
 # SDXL / SDXL refiner: base model -> variant -> file name (no prediction-type level)
 LEGACY_CONFIGS = {
    BaseModelType.StableDiffusion1: {
        ModelVariantType.Normal: {
            SchedulerPredictionType.Epsilon: "v1-inference.yaml",
            SchedulerPredictionType.VPrediction: "v1-inference-v.yaml",
        },
        ModelVariantType.Inpaint: {
            SchedulerPredictionType.Epsilon: "v1-inpainting-inference.yaml",
            SchedulerPredictionType.VPrediction: "v1-inpainting-inference-v.yaml",
        },
    },
    BaseModelType.StableDiffusion2: {
        ModelVariantType.Normal: {
            SchedulerPredictionType.Epsilon: "v2-inference.yaml",
            SchedulerPredictionType.VPrediction: "v2-inference-v.yaml",
        },
        ModelVariantType.Inpaint: {
            SchedulerPredictionType.Epsilon: "v2-inpainting-inference.yaml",
            SchedulerPredictionType.VPrediction: "v2-inpainting-inference-v.yaml",
        },
    },
    BaseModelType.StableDiffusionXL: {
        ModelVariantType.Normal: "sd_xl_base.yaml",
    },
    BaseModelType.StableDiffusionXLRefiner: {
        ModelVariantType.Normal: "sd_xl_refiner.yaml",
    },
 }
@dataclass
 class InstallSelections:
    """The models a caller wants installed and removed, as consumed by ModelInstall.install()."""

    # Sources to install; each entry is handed to ModelInstall.heuristic_import()
    # (a local path, a repo_id or a URL).
    install_models: List[str] = field(default_factory=list)
    # Model keys to delete; each entry is split with the model manager's parse_key().
    remove_models: List[str] = field(default_factory=list)
@dataclass
 class ModelLoadInfo:
    """
    Uniform description of one model, as built by ModelInstall.all_models()
    from an INITIAL_MODELS.yaml stanza and/or an installed model record.
    """

    # The three components of the model key.
    name: str
    model_type: ModelType
    base_type: BaseModelType
    # Where the model comes from: a path or a repo_id.
    path: Optional[Path] = None
    repo_id: Optional[str] = None
    # When both subfolder and repo_id are set, all_models() appends ":<subfolder>" to repo_id.
    subfolder: Optional[str] = None
    description: str = ""
    # Set to True by all_models() for models reported by the model manager.
    installed: bool = False
    recommended: bool = False
    default: bool = False
    # Sources (keys of ModelInstall.reverse_paths) that ModelInstall._add_required_models()
    # schedules for installation alongside this model.
    requires: Optional[List[str]] = field(default_factory=list)
 class ModelInstall(object):
    def __init__(
        self,
        config: InvokeAIAppConfig,
        prediction_type_helper: Optional[Callable[[Path], SchedulerPredictionType]] = None,
        model_manager: Optional[ModelManager] = None,
        access_token: Optional[str] = None,
        civitai_api_key: Optional[str] = None,
    ):
        """
        :param config: Application configuration
        :param prediction_type_helper: Optional callable handed to the model probe
        :param model_manager: Model manager to use; by default one is created from config.model_conf_path
        :param access_token: HuggingFace access token; defaults to the token stored by HfFolder
        :param civitai_api_key: CivitAI API key; defaults to config.civitai_api_key
        """
        self.config = config
        if model_manager:
            self.mgr = model_manager
        else:
            self.mgr = ModelManager(config.model_conf_path)
        self.datasets = OmegaConf.load(Dataset_path)
        self.prediction_helper = prediction_type_helper
        self.access_token = access_token if access_token else HfFolder.get_token()
        self.civitai_api_key = civitai_api_key if civitai_api_key else config.civitai_api_key
        # maps each starter model's path/repo_id back to its key in self.datasets
        self.reverse_paths = self._reverse_paths(self.datasets)
    def all_models(self) -> Dict[str, ModelLoadInfo]:
        """
        Return dict of model_key=>ModelLoadInfo objects.
        This method consolidates and simplifies the entries in both
        models.yaml and INITIAL_MODELS.yaml so that they can
        be treated uniformly. It also sorts the models alphabetically
        by their name, to improve the display somewhat.

        Entries reported by the model manager are flagged as installed.
        Note that the name, base_type and model_type parsed from each key are
        also written back into the corresponding stanza of self.datasets.
        """
        model_dict = {}
        # first populate with the entries in INITIAL_MODELS.yaml
        for key, value in self.datasets.items():
            name, base, model_type = ModelManager.parse_key(key)
            value["name"] = name
            value["base_type"] = base
            value["model_type"] = model_type
            model_info = ModelLoadInfo(**value)
            if model_info.subfolder and model_info.repo_id:
                model_info.repo_id += f":{model_info.subfolder}"
            model_dict[key] = model_info
        # supplement with entries in models.yaml
        for md in self.mgr.list_models():
            base = md["base_model"]
            model_type = md["model_type"]
            name = md["model_name"]
            key = ModelManager.create_key(name, base, model_type)
            if key in model_dict:
                model_dict[key].installed = True
            else:
                model_dict[key] = ModelLoadInfo(
                    name=name,
                    base_type=base,
                    model_type=model_type,
                    # Take the path from the installed record itself. This used to
                    # read `value`, the variable left over from the loop above, so
                    # every entry got the last dataset stanza's path.
                    path=md.get("path"),
                    installed=True,
                )
        return dict(sorted(model_dict.items(), key=lambda item: item[1].name.lower()))
    def _is_autoloaded(self, model_info: dict) -> bool:
        path = model_info.get("path")
        if not path:
            return False
        for autodir in ["autoimport_dir", "lora_dir", "embedding_dir", "controlnet_dir"]:
            if autodir_path := getattr(self.config, autodir):
                autodir_path = self.config.root_path / autodir_path
                if Path(path).is_relative_to(autodir_path):
                    return True
        return False
    def list_models(self, model_type):
        installed = self.mgr.list_models(model_type=model_type)
        print()
        print(f"Installed models of type `{model_type}`:")
        print(f"{'Model Key':50} Model Path")
        for i in installed:
            print(f"{'/'.join([i['base_model'],i['model_type'],i['model_name']]):50} {i['path']}")
        print()
    # logic here a little reversed to maintain backward compatibility
    def starter_models(self, all_models: bool = False) -> Set[str]:
        """
        Return the keys of the starter models listed in INITIAL_MODELS.yaml.

        By default only main and VAE models are returned; pass
        all_models=True to get every key.
        """
        default_types = [ModelType.Main, ModelType.Vae]
        selected = set()
        for key, _stanza in self.datasets.items():
            _name, _base, model_type = ModelManager.parse_key(key)
            if not all_models and model_type not in default_types:
                continue
            selected.add(key)
        return selected
    def recommended_models(self) -> Set[str]:
        """Return the keys of all starter models (of any type) flagged "recommended"."""
        recommended = set()
        for key in self.starter_models(all_models=True):
            if self.datasets[key].get("recommended", False):
                recommended.add(key)
        return recommended
    def default_model(self) -> str:
        """
        Return the key of a starter model flagged "default".

        Raises IndexError when no starter model carries that flag.
        """
        flagged = []
        for key in self.starter_models():
            if self.datasets[key].get("default", False):
                flagged.append(key)
        return flagged[0]
    def install(self, selections: InstallSelections):
        """
        Remove and install the models named in `selections`, then commit the
        model manager.

        Models to remove are deleted first. The install list is then pruned of
        starter models that are already installed and extended with the
        requirements of the remaining ones (both modify
        selections.install_models in place). ValueError and KeyError raised
        while installing a single model are logged and do not stop the run.

        The diffusers logging verbosity is lowered for the duration of the
        call and is restored even if an unexpected exception escapes.
        """
        verbosity = dlogging.get_verbosity()  # quench NSFW nags
        dlogging.set_verbosity_error()
        try:
            job = 1
            jobs = len(selections.remove_models) + len(selections.install_models)
            # remove requested models
            for key in selections.remove_models:
                name, base, mtype = self.mgr.parse_key(key)
                logger.info(f"Deleting {mtype} model {name} [{job}/{jobs}]")
                try:
                    self.mgr.del_model(name, base, mtype)
                except FileNotFoundError as e:
                    logger.warning(e)
                job += 1
            # add requested models
            self._remove_installed(selections.install_models)
            self._add_required_models(selections.install_models)
            for path in selections.install_models:
                logger.info(f"Installing {path} [{job}/{jobs}]")
                try:
                    self.heuristic_import(path)
                except (ValueError, KeyError) as e:
                    logger.error(str(e))
                job += 1
        finally:
            # always put the global diffusers verbosity back
            dlogging.set_verbosity(verbosity)
        self.mgr.commit()
    def heuristic_import(
        self,
        model_path_id_or_url: Union[str, Path],
        models_installed: Set[Path] = None,
    ) -> Dict[str, AddModelResult]:
        """
        :param model_path_id_or_url: A Path to a local model to import, or a string representing its repo_id or URL
        :param models_installed: Set of installed models, used for recursive invocation
        Returns a set of dict objects corresponding to newly-created stanzas in models.yaml.
        """
        if not models_installed:
            models_installed = {}
        model_path_id_or_url = str(model_path_id_or_url).strip("\"' ")
        # A little hack to allow nested routines to retrieve info on the requested ID
        self.current_id = model_path_id_or_url
        path = Path(model_path_id_or_url)
        # fix relative paths
        if path.exists() and not path.is_absolute():
            path = path.absolute()  # make relative to current WD
        # checkpoint file, or similar
        if path.is_file():
            models_installed.update({str(path): self._install_path(path)})
        # folders style or similar
        elif path.is_dir() and any(
            (path / x).exists()
            for x in {
                "config.json",
                "model_index.json",
                "learned_embeds.bin",
                "pytorch_lora_weights.bin",
                "pytorch_lora_weights.safetensors",
            }
        ):
            models_installed.update({str(model_path_id_or_url): self._install_path(path)})
        # recursive scan
        elif path.is_dir():
            for child in path.iterdir():
                self.heuristic_import(child, models_installed=models_installed)
        # huggingface repo
        elif len(str(model_path_id_or_url).split("/")) == 2:
            models_installed.update({str(model_path_id_or_url): self._install_repo(str(model_path_id_or_url))})
        # a URL
        elif str(model_path_id_or_url).startswith(("http:", "https:", "ftp:")):
            models_installed.update({str(model_path_id_or_url): self._install_url(model_path_id_or_url)})
        else:
            raise KeyError(f"{str(model_path_id_or_url)} is not recognized as a local path, repo ID or URL. Skipping")
        return models_installed
    def _remove_installed(self, model_list: List[str]):
        all_models = self.all_models()
        models_to_remove = []
        for path in model_list:
            key = self.reverse_paths.get(path)
            if key and all_models[key].installed:
                models_to_remove.append(path)
        for path in models_to_remove:
            logger.warning(f"{path} already installed. Skipping")
            model_list.remove(path)
    def _add_required_models(self, model_list: List[str]):
        additional_models = []
        all_models = self.all_models()
        for path in model_list:
            if not (key := self.reverse_paths.get(path)):
                continue
            for requirement in all_models[key].requires:
                requirement_key = self.reverse_paths.get(requirement)
                if not all_models[requirement_key].installed:
                    additional_models.append(requirement)
        model_list.extend(additional_models)
    # install a model from a local path. The optional info parameter is there to prevent
    # the model from being probed twice in the event that it has already been probed.
    def _install_path(self, path: Path, info: ModelProbeInfo = None) -> AddModelResult:
        info = info or ModelProbe().heuristic_probe(path, self.prediction_helper)
        if not info:
            logger.warning(f"Unable to parse format of {path}")
            return None
        model_name = path.stem if path.is_file() else path.name
        if self.mgr.model_exists(model_name, info.base_type, info.model_type):
            raise ValueError(f'A model named "{model_name}" is already installed.')
        attributes = self._make_attributes(path, info)
        return self.mgr.add_model(
            model_name=model_name,
            base_model=info.base_type,
            model_type=info.model_type,
            model_attributes=attributes,
        )
    def _install_url(self, url: str) -> Optional[AddModelResult]:
        """
        Download a model from a URL into the models directory and install it.

        The file is downloaded into a temporary staging directory inside the
        models directory, probed, moved to <models>/<base>/<type>/<filename>
        and then registered via _install_path().

        Returns None, after logging, if the download fails or the downloaded
        file cannot be probed.
        """
        from urllib.parse import urlparse

        # Only send the CivitAI API key to CivitAI itself. Matching the whole
        # URL against a pattern would also hit other hosts whose URL merely
        # contains "civitai.com", leaking the key to them.
        hostname = (urlparse(url).hostname or "").lower()
        civit_url = hostname == "civitai.com" or hostname.endswith(".civitai.com")
        with TemporaryDirectory(dir=self.config.models_path) as staging:
            location = download_with_resume(
                url, Path(staging), access_token=self.civitai_api_key if civit_url else None
            )
            if not location:
                logger.error(f"Unable to download {url}. Skipping.")
                return None
            info = ModelProbe().heuristic_probe(location, self.prediction_helper)
            if not info:
                logger.warning(f"Unable to parse format of {location}")
                return None
            dest = self.config.models_path / info.base_type.value / info.model_type.value / location.name
            dest.parent.mkdir(parents=True, exist_ok=True)
            models_path = shutil.move(location, dest)
        # staged version will be garbage-collected at this time
        return self._install_path(Path(models_path), info)
    def _install_repo(self, repo_id: str) -> AddModelResult:
        """
        Download a model from a HuggingFace repository and install it.

        :param repo_id: "owner/name", optionally followed by ":subfolder" to select a subfolder of the repo

        The repo's file listing decides what is downloaded: a full pipeline
        (model_index.json), an ONNX model (unet/model.onnx), or one of several
        standalone layouts (LoRA, VAE/ControlNet weights, embeddings,
        IP-Adapter, CLIP Vision). The download goes to a temporary staging
        directory, is probed, copied to <models>/<base>/<type>/<name>
        (replacing an existing directory) and registered via _install_path().

        Returns an empty dict, after logging a warning, if the repo layout is
        not recognized or the downloaded model cannot be probed.
        """
        # hack to recover models stored in subfolders --
        # Required to get the "v2" model of monster-labs/control_v1p_sd15_qrcode_monster
        subfolder = None
        if match := re.match(r"^([^/]+/[^/]+):(\w+)$", repo_id):
            repo_id = match.group(1)
            subfolder = match.group(2)
        hinfo = HfApi().model_info(repo_id)
        # we try to figure out how to download this most economically
        # list all the files in the repo
        files = [x.rfilename for x in hinfo.siblings]
        if subfolder:
            files = [x for x in files if x.startswith(f"{subfolder}/")]
        prefix = f"{subfolder}/" if subfolder else ""
        location = None
        with TemporaryDirectory(dir=self.config.models_path) as staging:
            staging = Path(staging)
            if f"{prefix}model_index.json" in files:
                location = self._download_hf_pipeline(repo_id, staging, subfolder=subfolder)  # pipeline
            elif f"{prefix}unet/model.onnx" in files:
                # `files` already holds full repo-relative paths, so no subfolder is
                # passed. It must still be given explicitly: _download_hf_model()
                # declares it without a default, and omitting it raised TypeError.
                location = self._download_hf_model(repo_id, files, staging, subfolder=None)
            else:
                for suffix in ["safetensors", "bin"]:
                    if f"{prefix}pytorch_lora_weights.{suffix}" in files:
                        location = self._download_hf_model(
                            repo_id, [f"pytorch_lora_weights.{suffix}"], staging, subfolder=subfolder
                        )  # LoRA
                        break
                    elif (
                        self.config.precision == "float16" and f"{prefix}diffusion_pytorch_model.fp16.{suffix}" in files
                    ):  # vae, controlnet or some other standalone
                        files = ["config.json", f"diffusion_pytorch_model.fp16.{suffix}"]
                        location = self._download_hf_model(repo_id, files, staging, subfolder=subfolder)
                        break
                    elif f"{prefix}diffusion_pytorch_model.{suffix}" in files:
                        files = ["config.json", f"diffusion_pytorch_model.{suffix}"]
                        location = self._download_hf_model(repo_id, files, staging, subfolder=subfolder)
                        break
                    elif f"{prefix}learned_embeds.{suffix}" in files:
                        location = self._download_hf_model(
                            repo_id, [f"learned_embeds.{suffix}"], staging, subfolder=subfolder
                        )
                        break
                    elif (
                        f"{prefix}image_encoder.txt" in files and f"{prefix}ip_adapter.{suffix}" in files
                    ):  # IP-Adapter
                        files = ["image_encoder.txt", f"ip_adapter.{suffix}"]
                        location = self._download_hf_model(repo_id, files, staging, subfolder=subfolder)
                        break
                    elif f"{prefix}model.{suffix}" in files and f"{prefix}config.json" in files:
                        # This elif-condition is pretty fragile, but it is intended to handle CLIP Vision models hosted
                        # by InvokeAI for use with IP-Adapters.
                        files = ["config.json", f"model.{suffix}"]
                        location = self._download_hf_model(repo_id, files, staging, subfolder=subfolder)
                        break
            if not location:
                logger.warning(f"Could not determine type of repo {repo_id}. Skipping install.")
                return {}
            info = ModelProbe().heuristic_probe(location, self.prediction_helper)
            if not info:
                logger.warning(f"Could not probe {location}. Skipping install.")
                return {}
            dest = (
                self.config.models_path
                / info.base_type.value
                / info.model_type.value
                / self._get_model_name(repo_id, location)
            )
            # a previous copy at the destination is replaced wholesale
            if dest.exists():
                shutil.rmtree(dest)
            shutil.copytree(location, dest)
            return self._install_path(dest, info)
    def _get_model_name(self, path_name: str, location: Path) -> str:
        """
        Calculate a name for the model - primitive implementation.
        """
        if key := self.reverse_paths.get(path_name):
            (name, base, mtype) = ModelManager.parse_key(key)
            return name
        elif location.is_dir():
            return location.name
        else:
            return location.stem
    def _make_attributes(self, path: Path, info: ModelProbeInfo) -> dict:
        """
        Build the attribute dict used to register the model at `path`.

        The dict always holds "path" (relative to the models directory when
        the model lies inside it), "description" and "model_format". Main and
        ONNX models also get "variant". Checkpoint-format main/ONNX and
        ControlNet models get "config": a .yaml file sitting next to the
        checkpoint if there is one, otherwise a legacy configuration chosen
        from the probe results.
        """
        model_name = path.name if path.is_dir() else path.stem
        description = f"{info.base_type.value} {info.model_type.value} model {model_name}"
        # starter models carry their own description in INITIAL_MODELS.yaml
        if (key := self.reverse_paths.get(self.current_id)) and key in self.datasets:
            description = self.datasets[key].get("description") or description

        attributes = {
            "path": str(self.relative_to_root(path, self.config.models_path)),
            "description": str(description),
            "model_format": info.format,
        }
        is_checkpoint = info.format == "checkpoint"
        legacy_conf = None

        if info.model_type in (ModelType.Main, ModelType.ONNX):
            attributes["variant"] = info.variant_type
            if is_checkpoint:
                try:
                    sidecar = path.with_suffix(".yaml")
                    if sidecar.exists():
                        legacy_conf = str(self.relative_to_root(sidecar))
                    else:
                        conf_name = LEGACY_CONFIGS[info.base_type][info.variant_type]
                        # SD-1 and SD-2 are further keyed by scheduler prediction type
                        if info.base_type in [BaseModelType.StableDiffusion1, BaseModelType.StableDiffusion2]:
                            conf_name = conf_name[info.prediction_type]
                        legacy_conf = Path(self.config.legacy_conf_dir, conf_name)
                except KeyError:
                    legacy_conf = Path(self.config.legacy_conf_dir, "v1-inference.yaml")  # best guess

        if info.model_type == ModelType.ControlNet and is_checkpoint:
            sidecar = path.with_suffix(".yaml")
            if sidecar.exists():
                legacy_conf = str(self.relative_to_root(sidecar))
            else:
                cldm_name = "cldm_v15.yaml" if info.base_type == BaseModelType("sd-1") else "cldm_v21.yaml"
                legacy_conf = Path(self.config.root_path, "configs/controlnet", cldm_name)

        if legacy_conf:
            attributes["config"] = str(legacy_conf)
        return attributes
    def relative_to_root(self, path: Path, root: Optional[Path] = None) -> Path:
        root = root or self.config.root_path
        if path.is_relative_to(root):
            return path.relative_to(root)
        else:
            return path
    def _download_hf_pipeline(self, repo_id: str, staging: Path, subfolder: str = None) -> Path:
        """
        Load a diffusers pipeline with from_pretrained() and write it to the
        staging area with save_pretrained().

        The fp16 variant is tried first when the torch dtype chosen for the
        current device is float16, otherwise the default variant is tried
        first; the other variant serves as the fallback.

        Returns the directory the pipeline was saved to (staging/<repo name>),
        or None, after logging an error, if neither variant could be loaded.
        """
        _, name = repo_id.split("/")
        precision = torch_dtype(choose_torch_device())
        if precision == torch.float16:
            variants = ["fp16", None]
        else:
            variants = [None, "fp16"]

        pipeline = None
        for variant in variants:
            try:
                pipeline = DiffusionPipeline.from_pretrained(
                    repo_id,
                    variant=variant,
                    torch_dtype=precision,
                    safety_checker=None,
                    subfolder=subfolder,
                )
            except Exception as e:  # most errors are due to fp16 not being present. Fix this to catch other errors
                if "fp16" not in str(e):
                    print(e)
                continue
            if pipeline:
                break

        if not pipeline:
            logger.error(f"Diffusers model {repo_id} could not be downloaded. Skipping.")
            return None

        destination = staging / name
        pipeline.save_pretrained(destination, safe_serialization=True)
        return destination
    def _download_hf_model(self, repo_id: str, files: List[str], staging: Path, subfolder: None) -> Path:
        _, name = repo_id.split("/")
        location = staging / name
        paths = []
        for filename in files:
            filePath = Path(filename)
            p = hf_download_with_resume(
                repo_id,
                model_dir=location / filePath.parent,
                model_name=filePath.name,
                access_token=self.access_token,
                subfolder=filePath.parent / subfolder if subfolder else filePath.parent,
            )
            if p:
                paths.append(p)
            else:
                logger.warning(f"Could not download {filename} from {repo_id}.")
        return location if len(paths) > 0 else None
    @classmethod
    def _reverse_paths(cls, datasets) -> dict:
        """
        Reverse mapping from repo_id/path to destination name.
        """
        return {v.get("path") or v.get("repo_id"): k for k, v in datasets.items()}
 # -------------------------------------
 def yes_or_no(prompt: str, default_yes=True):
    """
    Ask a yes/no question on stdin and return the answer as a bool.

    An empty reply selects the default. With a "yes" default, any reply that does not
    start with "n"/"N" counts as yes; with a "no" default, only replies starting with
    "y"/"Y" count as yes.
    """
    fallback = "y" if default_yes else "n"
    answer = input(f"{prompt} [{fallback}] ") or fallback
    first = answer[0]
    return first not in ("n", "N") if default_yes else first in ("y", "Y")
 # ---------------------------------------------
 def hf_download_from_pretrained(model_class: object, model_name: str, destination: Path, **kwargs):
    """
    Load `model_name` via `model_class.from_pretrained()` and save it to `destination`.

    A filter is added to the "InvokeAI" logger that drops records whose message contains
    "fp16 is not a valid". Extra keyword arguments are forwarded to `from_pretrained()`.
    Returns `destination`.
    """

    def _drop_fp16_noise(record):
        return "fp16 is not a valid" not in record.getMessage()

    log = InvokeAILogger.get_logger("InvokeAI")
    log.addFilter(_drop_fp16_noise)
    loaded = model_class.from_pretrained(model_name, resume_download=True, **kwargs)
    loaded.save_pretrained(destination, safe_serialization=True)
    return destination
 # ---------------------------------------------
 def hf_download_with_resume(
    repo_id: str,
    model_dir: str,
    model_name: str,
    model_dest: Optional[Path] = None,
    access_token: Optional[str] = None,
    subfolder: Optional[str] = None,
 ) -> Optional[Path]:
    """
    Download one file from a HuggingFace repo, resuming a partial download when possible.

    If the destination file already exists, a Range request is sent for the bytes that
    are still missing and the reply is appended to the file.

    :param repo_id: Repository to download from.
    :param model_dir: Directory to create (if needed) and download into.
    :param model_name: File name inside the repo; also the default destination file name.
    :param model_dest: Explicit destination file; defaults to `model_dir/model_name`.
    :param access_token: Optional token sent as a Bearer authorization header.
    :param subfolder: Optional repo subfolder passed to hf_hub_url().
    :return: The destination path on success (or if the file was already complete),
        None if the file was not found, the server answered with an error status,
        or writing the file failed.
    """
    model_dest = model_dest or Path(os.path.join(model_dir, model_name))
    os.makedirs(model_dir, exist_ok=True)
    url = hf_hub_url(repo_id, model_name, subfolder=subfolder)
    header = {"Authorization": f"Bearer {access_token}"} if access_token else {}
    open_mode = "wb"
    exist_size = 0
    if os.path.exists(model_dest):
        exist_size = os.path.getsize(model_dest)
        header["Range"] = f"bytes={exist_size}-"
        open_mode = "ab"
    # The response is used as a context manager so the streamed connection is released on every exit path.
    with requests.get(url, headers=header, stream=True) as resp:
        if resp.status_code == 416:  # "range not satisfiable", which means nothing to return
            logger.info(f"{model_name}: complete file found. Skipping.")
            return model_dest
        if resp.status_code == 404:
            logger.warning("File not found")
            return None
        if resp.status_code not in (200, 206):
            # Any other status carries an error body; writing it would corrupt the model file.
            logger.warning(f"{model_name}: {resp.reason}")
            return None
        if resp.status_code == 200 and exist_size > 0:
            # The server ignored the Range header and is sending the whole file:
            # start over instead of appending a full copy to the partial file.
            exist_size = 0
            open_mode = "wb"
        total = int(resp.headers.get("content-length", 0))
        if exist_size > 0:
            logger.info(f"{model_name}: partial file found. Resuming...")
        else:
            logger.info(f"{model_name}: Downloading...")
        try:
            with (
                open(model_dest, open_mode) as file,
                tqdm(
                    desc=model_name,
                    initial=exist_size,
                    total=total + exist_size,
                    unit="iB",
                    unit_scale=True,
                    unit_divisor=1000,
                ) as bar,
            ):
                for data in resp.iter_content(chunk_size=1024):
                    size = file.write(data)
                    bar.update(size)
        except Exception as e:
            logger.error(f"An error occurred while downloading {model_name}: {str(e)}")
            return None
    return model_dest
--- a/invokeai/backend/ip_adapter/ip_adapter.py
+++ b/invokeai/backend/ip_adapter/ip_adapter.py
@ -9,8 +9,8 @@ from transformers import CLIPImageProcessor, CLIPVisionModelWithProjection
 from invokeai.backend.ip_adapter.ip_attention_weights import IPAttentionWeights
 from .resampler import Resampler
 from ..raw_model import RawModel
 from .resampler import Resampler
 class ImageProjModel(torch.nn.Module):
--- a/invokeai/backend/lora.py
+++ b/invokeai/backend/lora.py
@ -10,6 +10,7 @@ from safetensors.torch import load_file
 from typing_extensions import Self
 from invokeai.backend.model_manager import BaseModelType
 from .raw_model import RawModel
@ -366,6 +367,7 @@ class IA3Layer(LoRALayerBase):
 AnyLoRALayer = Union[LoRALayer, LoHALayer, LoKRLayer, FullLayer, IA3Layer]
 class LoRAModelRaw(RawModel):  # (torch.nn.Module):
    _name: str
    layers: Dict[str, AnyLoRALayer]
--- a/invokeai/backend/model_management_OLD/README.md
+++ b/invokeai/backend/model_management_OLD/README.md
@ -1,27 +0,0 @@
 # Model Cache
 ## `glibc` Memory Allocator Fragmentation
 Python (and PyTorch) rely on the memory allocator from the C Standard Library (`libc`). On Linux, with the GNU C Standard Library implementation (`glibc`), our memory access patterns have been observed to cause severe memory fragmentation. This fragmentation results in large amounts of memory that has been freed but can't be released back to the OS. Loading models from disk and moving them between CPU/CUDA seem to be the operations that contribute most to the fragmentation. This memory fragmentation issue can result in OOM crashes during frequent model switching, even if `max_cache_size` is set to a reasonable value (e.g. an OOM crash with `max_cache_size=16` on a system with 32GB of RAM).
 This problem may also exist on other OSes, and other `libc` implementations. But, at the time of writing, it has only been investigated on Linux with `glibc`.
 To better understand how the `glibc` memory allocator works, see these references:
 - Basics: https://www.gnu.org/software/libc/manual/html_node/The-GNU-Allocator.html
 - Details: https://sourceware.org/glibc/wiki/MallocInternals
 Note the differences between memory allocated as chunks in an arena vs. memory allocated with `mmap`. Under `glibc`'s default configuration, most model tensors get allocated as chunks in an arena making them vulnerable to the problem of fragmentation.
 We can work around this memory fragmentation issue by setting the following env var:
 ```bash
 # Force blocks >1MB to be allocated with `mmap` so that they are released to the system immediately when they are freed.
 MALLOC_MMAP_THRESHOLD_=1048576
 ```
 See the following references for more information about the `malloc` tunable parameters:
 - https://www.gnu.org/software/libc/manual/html_node/Malloc-Tunable-Parameters.html
 - https://www.gnu.org/software/libc/manual/html_node/Memory-Allocation-Tunables.html
 - https://man7.org/linux/man-pages/man3/mallopt.3.html
 The model cache emits debug logs that provide visibility into the state of the `libc` memory allocator. See the `LibcUtil` class for more info on how these `libc` malloc stats are collected.
--- a/invokeai/backend/model_management_OLD/init.py
+++ b/invokeai/backend/model_management_OLD/init.py
@ -1,20 +0,0 @@
 # ruff: noqa: I001, F401
 """
 Initialization file for invokeai.backend.model_management
 """
 # This import must be first
 from .model_manager import AddModelResult, LoadedModelInfo, ModelManager, SchedulerPredictionType
 from .lora import ModelPatcher, ONNXModelPatcher
 from .model_cache import ModelCache
 from .models import (
    BaseModelType,
    DuplicateModelException,
    ModelNotFoundException,
    ModelType,
    ModelVariantType,
    SubModelType,
 )
 # This import must be last
 from .model_merge import MergeInterpolationMethod, ModelMerger
--- a/invokeai/backend/model_management_OLD/convert_ckpt_to_diffusers.py
+++ b/invokeai/backend/model_management_OLD/convert_ckpt_to_diffusers.py
--- a/invokeai/backend/model_management_OLD/detect_baked_in_vae.py
+++ b/invokeai/backend/model_management_OLD/detect_baked_in_vae.py
@ -1,31 +0,0 @@
 # Copyright (c) 2024 Lincoln Stein and the InvokeAI Development Team
 """
 This module exports the function has_baked_in_sdxl_vae().
 It returns True if an SDXL checkpoint model contains a VAE other than the original
 SDXL 1.0 VAE (the original VAE doesn't work properly in fp16 mode).
 """
 import hashlib
 from pathlib import Path
 from safetensors.torch import load_file
 SDXL_1_0_VAE_HASH = "bc40b16c3a0fa4625abdfc01c04ffc21bf3cefa6af6c7768ec61eb1f1ac0da51"
 def has_baked_in_sdxl_vae(checkpoint_path: Path) -> bool:
    """Return True when the hash of the checkpoint's VAE weights differs from the SDXL 1.0 VAE hash."""
    return _vae_hash(checkpoint_path) != SDXL_1_0_VAE_HASH
 def _vae_hash(checkpoint_path: Path) -> str:
    """
    Compute a SHA-256 hex digest over the checkpoint's "first_stage_model." entries.

    For every matching key, the key and the str() of its value are fed into the
    digest, in the order the keys appear in the loaded checkpoint.
    """
    state_dict = load_file(checkpoint_path, device="cpu")
    digest = hashlib.sha256()
    for name, tensor in state_dict.items():
        if not name.startswith("first_stage_model."):
            continue
        digest.update(name.encode("UTF-8"))
        digest.update(str(tensor).encode("UTF-8"))
    return digest.hexdigest()
--- a/invokeai/backend/model_management_OLD/lora.py
+++ b/invokeai/backend/model_management_OLD/lora.py
@ -1,582 +0,0 @@
 from __future__ import annotations
 import pickle
 from contextlib import contextmanager
 from pathlib import Path
 from typing import Any, Dict, List, Optional, Tuple, Union
 import numpy as np
 import torch
 from compel.embeddings_provider import BaseTextualInversionManager
 from diffusers.models import UNet2DConditionModel
 from safetensors.torch import load_file
 from transformers import CLIPTextModel, CLIPTokenizer
 from invokeai.app.shared.models import FreeUConfig
 from invokeai.backend.model_management.model_load_optimizations import skip_torch_weight_init
 from .models.lora import LoRAModel
 """
 loras = [
    (lora_model1, 0.7),
    (lora_model2, 0.4),
 ]
 with LoRAHelper.apply_lora_unet(unet, loras):
    # unet with applied loras
 # unmodified unet
 """
 # TODO: rename smth like ModelPatcher and add TI method?
 class ModelPatcher:
    """
    Context managers that temporarily patch a model and undo the patch on exit.

    Covers LoRA weights, textual inversion (TI) embeddings, clip skip and FreeU.
    """

    @staticmethod
    def _resolve_lora_key(model: torch.nn.Module, lora_key: str, prefix: str) -> Tuple[str, torch.nn.Module]:
        """
        Resolve a flattened LoRA key to the submodule of `model` it refers to.

        After `prefix` is stripped, the key is split on "_". Because submodule names may
        themselves contain underscores, parts are joined back together until
        `get_submodule()` succeeds at each level.

        Returns a tuple of (dotted module key, module).
        Raises Exception if `lora_key` does not start with `prefix`.
        """
        assert "." not in lora_key
        if not lora_key.startswith(prefix):
            raise Exception(f"lora_key with invalid prefix: {lora_key}, {prefix}")
        module = model
        module_key = ""
        key_parts = lora_key[len(prefix) :].split("_")
        submodule_name = key_parts.pop(0)
        while len(key_parts) > 0:
            try:
                module = module.get_submodule(submodule_name)
                module_key += "." + submodule_name
                submodule_name = key_parts.pop(0)
            except Exception:
                # No submodule with this name: extend the candidate name with the next part and retry.
                submodule_name += "_" + key_parts.pop(0)
        module = module.get_submodule(submodule_name)
        module_key = (module_key + "." + submodule_name).lstrip(".")
        return (module_key, module)

    @classmethod
    @contextmanager
    def apply_lora_unet(
        cls,
        unet: UNet2DConditionModel,
        loras: List[Tuple[LoRAModel, float]],
    ):
        """Apply the LoRA layers whose keys start with "lora_unet_" to `unet` for the duration of the context."""
        with cls.apply_lora(unet, loras, "lora_unet_"):
            yield

    @classmethod
    @contextmanager
    def apply_lora_text_encoder(
        cls,
        text_encoder: CLIPTextModel,
        loras: List[Tuple[LoRAModel, float]],
    ):
        """Apply the LoRA layers whose keys start with "lora_te_" to `text_encoder` for the duration of the context."""
        with cls.apply_lora(text_encoder, loras, "lora_te_"):
            yield

    @classmethod
    @contextmanager
    def apply_sdxl_lora_text_encoder(
        cls,
        text_encoder: CLIPTextModel,
        loras: List[Tuple[LoRAModel, float]],
    ):
        """Apply the LoRA layers whose keys start with "lora_te1_" to `text_encoder` for the duration of the context."""
        with cls.apply_lora(text_encoder, loras, "lora_te1_"):
            yield

    @classmethod
    @contextmanager
    def apply_sdxl_lora_text_encoder2(
        cls,
        text_encoder: CLIPTextModel,
        loras: List[Tuple[LoRAModel, float]],
    ):
        """Apply the LoRA layers whose keys start with "lora_te2_" to `text_encoder` for the duration of the context."""
        with cls.apply_lora(text_encoder, loras, "lora_te2_"):
            yield

    @classmethod
    @contextmanager
    def apply_lora(
        cls,
        model: torch.nn.Module,
        loras: List[Tuple[LoRAModel, float]],  # THIS IS INCORRECT. IT IS ACTUALLY A LoRAModelRaw
        prefix: str,
    ):
        """
        Add the weighted LoRA layer weights to the matching module weights of `model`.

        Only layers whose key starts with `prefix` are applied. A CPU copy of every
        touched module weight is taken before its first modification and copied back
        when the context exits, including on error.
        """
        original_weights = {}
        try:
            with torch.no_grad():
                for lora, lora_weight in loras:
                    # assert lora.device.type == "cpu"
                    for layer_key, layer in lora.layers.items():
                        if not layer_key.startswith(prefix):
                            continue
                        # TODO(ryand): A non-negligible amount of time is currently spent resolving LoRA keys. This
                        # should be improved in the following ways:
                        # 1. The key mapping could be more-efficiently pre-computed. This would save time every time a
                        #    LoRA model is applied.
                        # 2. From an API perspective, there's no reason that the `ModelPatcher` should be aware of the
                        #    intricacies of Stable Diffusion key resolution. It should just expect the input LoRA
                        #    weights to have valid keys.
                        module_key, module = cls._resolve_lora_key(model, layer_key, prefix)
                        # All of the LoRA weight calculations will be done on the same device as the module weight.
                        # (Performance will be best if this is a CUDA device.)
                        device = module.weight.device
                        dtype = module.weight.dtype
                        if module_key not in original_weights:
                            original_weights[module_key] = module.weight.detach().to(device="cpu", copy=True)
                        layer_scale = layer.alpha / layer.rank if (layer.alpha and layer.rank) else 1.0
                        # We intentionally move to the target device first, then cast. Experimentally, this was found to
                        # be significantly faster for 16-bit CPU tensors being moved to a CUDA device than doing the
                        # same thing in a single call to '.to(...)'.
                        layer.to(device=device)
                        layer.to(dtype=torch.float32)
                        # TODO(ryand): Using torch.autocast(...) over explicit casting may offer a speed benefit on CUDA
                        # devices here. Experimentally, it was found to be very slow on CPU. More investigation needed.
                        layer_weight = layer.get_weight(module.weight) * (lora_weight * layer_scale)
                        layer.to(device="cpu")
                        if module.weight.shape != layer_weight.shape:
                            # TODO: debug on lycoris
                            layer_weight = layer_weight.reshape(module.weight.shape)
                        module.weight += layer_weight.to(dtype=dtype)
            yield  # wait for context manager exit
        finally:
            with torch.no_grad():
                for module_key, weight in original_weights.items():
                    model.get_submodule(module_key).weight.copy_(weight)

    @classmethod
    @contextmanager
    def apply_ti(
        cls,
        tokenizer: CLIPTokenizer,
        text_encoder: CLIPTextModel,
        ti_list: List[Tuple[str, Any]],
    ) -> Tuple[CLIPTokenizer, TextualInversionManager]:
        """
        Temporarily add textual inversion embeddings to `text_encoder`.

        A copy of `tokenizer` receives one trigger token per embedding row
        ("<name>", "<name-!pad-1>", ...), the text encoder's token embeddings are resized
        to hold them, and the rows are written into the input embedding matrix.

        Yields (patched tokenizer copy, TextualInversionManager). On exit the token
        embeddings are resized back to their initial count if any tokens were added.

        Raises RuntimeError if a trigger token cannot be found after being added, and
        ValueError if an embedding row's shape does not match the model's token embedding shape.
        """
        init_tokens_count = None
        new_tokens_added = None
        # TODO: This is required since Transformers 4.32 see
        # https://github.com/huggingface/transformers/pull/25088
        # More information by NVIDIA:
        # https://docs.nvidia.com/deeplearning/performance/dl-performance-matrix-multiplication/index.html#requirements-tc
        # This value might need to be changed in the future and take the GPUs model into account as there seem
        # to be ideal values for different GPUS. This value is temporary!
        # For references to the current discussion please see https://github.com/invoke-ai/InvokeAI/pull/4817
        pad_to_multiple_of = 8
        try:
            # HACK: The CLIPTokenizer API does not include a way to remove tokens after calling add_tokens(...). As a
            # workaround, we create a full copy of `tokenizer` so that its original behavior can be restored after
            # exiting this `apply_ti(...)` context manager.
            #
            # In a previous implementation, the deep copy was obtained with `ti_tokenizer = copy.deepcopy(tokenizer)`,
            # but a pickle roundtrip was found to be much faster (1 sec vs. 0.05 secs).
            ti_tokenizer = pickle.loads(pickle.dumps(tokenizer))
            ti_manager = TextualInversionManager(ti_tokenizer)
            init_tokens_count = text_encoder.resize_token_embeddings(None, pad_to_multiple_of).num_embeddings

            def _get_trigger(ti_name, index):
                # Row 0 uses the plain name; further rows get a "-!pad-<index>" suffix.
                trigger = ti_name
                if index > 0:
                    trigger += f"-!pad-{index}"
                return f"<{trigger}>"

            def _get_ti_embedding(model_embeddings, ti):
                # for SDXL models, select the embedding that matches the text encoder's dimensions
                if ti.embedding_2 is not None:
                    return (
                        ti.embedding_2
                        if ti.embedding_2.shape[1] == model_embeddings.weight.data[0].shape[0]
                        else ti.embedding
                    )
                else:
                    return ti.embedding

            # modify tokenizer
            new_tokens_added = 0
            for ti_name, ti in ti_list:
                ti_embedding = _get_ti_embedding(text_encoder.get_input_embeddings(), ti)
                for i in range(ti_embedding.shape[0]):
                    new_tokens_added += ti_tokenizer.add_tokens(_get_trigger(ti_name, i))
            # Modify text_encoder.
            # resize_token_embeddings(...) constructs a new torch.nn.Embedding internally. Initializing the weights of
            # this embedding is slow and unnecessary, so we wrap this step in skip_torch_weight_init() to save some
            # time.
            with skip_torch_weight_init():
                text_encoder.resize_token_embeddings(init_tokens_count + new_tokens_added, pad_to_multiple_of)
            model_embeddings = text_encoder.get_input_embeddings()
            for ti_name, ti in ti_list:
                ti_embedding = _get_ti_embedding(text_encoder.get_input_embeddings(), ti)
                ti_tokens = []
                for i in range(ti_embedding.shape[0]):
                    embedding = ti_embedding[i]
                    trigger = _get_trigger(ti_name, i)
                    token_id = ti_tokenizer.convert_tokens_to_ids(trigger)
                    if token_id == ti_tokenizer.unk_token_id:
                        raise RuntimeError(f"Unable to find token id for token '{trigger}'")
                    if model_embeddings.weight.data[token_id].shape != embedding.shape:
                        raise ValueError(
                            f"Cannot load embedding for {trigger}. It was trained on a model with token dimension"
                            f" {embedding.shape[0]}, but the current model has token dimension"
                            f" {model_embeddings.weight.data[token_id].shape[0]}."
                        )
                    model_embeddings.weight.data[token_id] = embedding.to(
                        device=text_encoder.device, dtype=text_encoder.dtype
                    )
                    ti_tokens.append(token_id)
                # Record the extra tokens of a multi-row embedding under its first token.
                if len(ti_tokens) > 1:
                    ti_manager.pad_tokens[ti_tokens[0]] = ti_tokens[1:]
            yield ti_tokenizer, ti_manager
        finally:
            if init_tokens_count and new_tokens_added:
                text_encoder.resize_token_embeddings(init_tokens_count, pad_to_multiple_of)

    @classmethod
    @contextmanager
    def apply_clip_skip(
        cls,
        text_encoder: CLIPTextModel,
        clip_skip: int,
    ):
        """
        Remove the last `clip_skip` layers of `text_encoder.text_model.encoder.layers`
        for the duration of the context and re-append them in their original order on exit.
        """
        skipped_layers = []
        try:
            for _i in range(clip_skip):
                skipped_layers.append(text_encoder.text_model.encoder.layers.pop(-1))
            yield
        finally:
            while len(skipped_layers) > 0:
                text_encoder.text_model.encoder.layers.append(skipped_layers.pop())

    @classmethod
    @contextmanager
    def apply_freeu(
        cls,
        unet: UNet2DConditionModel,
        freeu_config: Optional[FreeUConfig] = None,
    ):
        """
        Enable FreeU on `unet` with the b1/b2/s1/s2 values of `freeu_config` for the
        duration of the context. Does nothing when `freeu_config` is None.
        """
        did_apply_freeu = False
        try:
            if freeu_config is not None:
                unet.enable_freeu(b1=freeu_config.b1, b2=freeu_config.b2, s1=freeu_config.s1, s2=freeu_config.s2)
                did_apply_freeu = True
            yield
        finally:
            if did_apply_freeu:
                unet.disable_freeu()
 class TextualInversionModel:
    """Holds the embedding tensor(s) read from a textual inversion file."""

    embedding: torch.Tensor  # [n, 768]|[n, 1280]
    embedding_2: Optional[torch.Tensor] = None  # [n, 768]|[n, 1280]   - for SDXL models

    @classmethod
    def from_checkpoint(
        cls,
        file_path: Union[str, Path],
        device: Optional[torch.device] = None,
        dtype: Optional[torch.dtype] = None,
    ):
        """
        Load a textual inversion embedding from `file_path`.

        ".safetensors" files are read with load_file(), everything else with torch.load().
        The embedding is picked according to the keys found in the state dict:
        "string_to_param" (first entry), "emb_params", "clip_g"/"clip_l" (stored as
        `embedding`/`embedding_2`), or otherwise the first value of the state dict.

        `device` and `dtype` are accepted but not used by this method.

        Raises ValueError if the fallback value is not a tensor.
        """
        if not isinstance(file_path, Path):
            file_path = Path(file_path)
        result = cls()  # TODO:
        if file_path.suffix == ".safetensors":
            state_dict = load_file(file_path.absolute().as_posix(), device="cpu")
        else:
            # NOTE(review): torch.load() unpickles the file; only use it on files from trusted sources.
            state_dict = torch.load(file_path, map_location="cpu")
        # both v1 and v2 format embeddings
        # difference mostly in metadata
        if "string_to_param" in state_dict:
            if len(state_dict["string_to_param"]) > 1:
                print(
                    f'Warn: Embedding "{file_path.name}" contains multiple tokens, which is not supported. The first'
                    " token will be used."
                )
            result.embedding = next(iter(state_dict["string_to_param"].values()))
        # v3 (easynegative)
        elif "emb_params" in state_dict:
            result.embedding = state_dict["emb_params"]
        # v5(sdxl safetensors file)
        elif "clip_g" in state_dict and "clip_l" in state_dict:
            result.embedding = state_dict["clip_g"]
            result.embedding_2 = state_dict["clip_l"]
        # v4(diffusers bin files)
        else:
            result.embedding = next(iter(state_dict.values()))
            # Validate before touching `.shape`, so a non-tensor value yields the intended ValueError.
            if not isinstance(result.embedding, torch.Tensor):
                raise ValueError(f"Invalid embeddings file: {file_path.name}")
            if len(result.embedding.shape) == 1:
                result.embedding = result.embedding.unsqueeze(0)
        return result
 class TextualInversionManager(BaseTextualInversionManager):
    """Expands textual inversion trigger tokens into their full token sequences."""

    pad_tokens: Dict[int, List[int]]
    tokenizer: CLIPTokenizer

    def __init__(self, tokenizer: CLIPTokenizer):
        self.tokenizer = tokenizer
        self.pad_tokens = {}

    def expand_textual_inversion_token_ids_if_necessary(self, token_ids: list[int]) -> list[int]:
        """
        Insert the registered pad tokens after every token id that has them.

        `token_ids` is returned as-is when no pad tokens are registered. The result is
        truncated to the tokenizer's first max model input size minus 2.

        Raises ValueError if `token_ids` starts with the bos token or ends with the eos token.
        """
        if not self.pad_tokens:
            return token_ids
        if token_ids[0] == self.tokenizer.bos_token_id:
            raise ValueError("token_ids must not start with bos_token_id")
        if token_ids[-1] == self.tokenizer.eos_token_id:
            raise ValueError("token_ids must not end with eos_token_id")
        expanded = []
        for tid in token_ids:
            expanded.append(tid)
            expanded.extend(self.pad_tokens.get(tid, ()))
        # Do not exceed the max model input size.
        # The -2 compensates for compel.embeddings_provider.get_token_ids(),
        # which first removes and then adds back the start and end tokens.
        limit = list(self.tokenizer.max_model_input_sizes.values())[0] - 2
        return expanded[:limit]
 class ONNXModelPatcher:
    """
    Context managers that temporarily patch an IAIOnnxRuntimeModel with LoRA weights
    or textual inversion embeddings and restore the original tensors on exit.
    """

    from diffusers import OnnxRuntimeModel
    from .models.base import IAIOnnxRuntimeModel

    @classmethod
    @contextmanager
    def apply_lora_unet(
        cls,
        unet: OnnxRuntimeModel,
        loras: List[Tuple[LoRAModel, float]],
    ):
        """Apply the LoRA layers whose keys start with "lora_unet_" to `unet` for the duration of the context."""
        with cls.apply_lora(unet, loras, "lora_unet_"):
            yield

    @classmethod
    @contextmanager
    def apply_lora_text_encoder(
        cls,
        text_encoder: OnnxRuntimeModel,
        loras: List[Tuple[LoRAModel, float]],
    ):
        """Apply the LoRA layers whose keys start with "lora_te_" to `text_encoder` for the duration of the context."""
        with cls.apply_lora(text_encoder, loras, "lora_te_"):
            yield

    # based on
    # https://github.com/ssube/onnx-web/blob/ca2e436f0623e18b4cfe8a0363fcfcf10508acf7/api/onnx_web/convert/diffusion/lora.py#L323
    @classmethod
    @contextmanager
    def apply_lora(
        cls,
        model: IAIOnnxRuntimeModel,
        loras: List[Tuple[LoRAModel, float]],
        prefix: str,
    ):
        """
        Add the weighted LoRA layer weights to the matching tensors of `model`.

        The weights of all LoRAs targeting the same layer are summed first, then added
        to the Conv/Gemm or MatMul tensor whose node name matches the layer key.
        Layers without a matching node are ignored. Patched tensors are restored on exit.

        Raises Exception if `model` is not an IAIOnnxRuntimeModel.
        """
        from .models.base import IAIOnnxRuntimeModel

        if not isinstance(model, IAIOnnxRuntimeModel):
            raise Exception("Only IAIOnnxRuntimeModel models supported")
        orig_weights = {}
        try:
            blended_loras = {}
            for lora, lora_weight in loras:
                for layer_key, layer in lora.layers.items():
                    if not layer_key.startswith(prefix):
                        continue
                    layer.to(dtype=torch.float32)
                    layer_key = layer_key.replace(prefix, "")
                    # TODO: rewrite to pass original tensor weight(required by ia3)
                    layer_weight = layer.get_weight(None).detach().cpu().numpy() * lora_weight
                    # Membership test (not identity) so that several LoRAs on one layer accumulate.
                    if layer_key in blended_loras:
                        blended_loras[layer_key] += layer_weight
                    else:
                        blended_loras[layer_key] = layer_weight
            # Map normalized node names ("/" and "." replaced by "_") back to the real node names.
            node_names = {}
            for node in model.nodes.values():
                node_names[node.name.replace("/", "_").replace(".", "_").lstrip("_")] = node.name
            for layer_key, lora_weight in blended_loras.items():
                conv_key = layer_key + "_Conv"
                gemm_key = layer_key + "_Gemm"
                matmul_key = layer_key + "_MatMul"
                if conv_key in node_names or gemm_key in node_names:
                    if conv_key in node_names:
                        conv_node = model.nodes[node_names[conv_key]]
                    else:
                        conv_node = model.nodes[node_names[gemm_key]]
                    weight_name = [n for n in conv_node.input if ".weight" in n][0]
                    orig_weight = model.tensors[weight_name]
                    if orig_weight.shape[-2:] == (1, 1):
                        if lora_weight.shape[-2:] == (1, 1):
                            new_weight = orig_weight.squeeze((3, 2)) + lora_weight.squeeze((3, 2))
                        else:
                            new_weight = orig_weight.squeeze((3, 2)) + lora_weight
                        new_weight = np.expand_dims(new_weight, (2, 3))
                    else:
                        if orig_weight.shape != lora_weight.shape:
                            new_weight = orig_weight + lora_weight.reshape(orig_weight.shape)
                        else:
                            new_weight = orig_weight + lora_weight
                    orig_weights[weight_name] = orig_weight
                    model.tensors[weight_name] = new_weight.astype(orig_weight.dtype)
                elif matmul_key in node_names:
                    weight_node = model.nodes[node_names[matmul_key]]
                    matmul_name = [n for n in weight_node.input if "MatMul" in n][0]
                    orig_weight = model.tensors[matmul_name]
                    new_weight = orig_weight + lora_weight.transpose()
                    orig_weights[matmul_name] = orig_weight
                    model.tensors[matmul_name] = new_weight.astype(orig_weight.dtype)
                else:
                    # warn? err?
                    pass
            yield
        finally:
            # restore original weights
            for name, orig_weight in orig_weights.items():
                model.tensors[name] = orig_weight

    @classmethod
    @contextmanager
    def apply_ti(
        cls,
        tokenizer: CLIPTokenizer,
        text_encoder: IAIOnnxRuntimeModel,
        ti_list: List[Tuple[str, Any]],
    ) -> Tuple[CLIPTokenizer, TextualInversionManager]:
        """
        Temporarily add textual inversion embeddings to an ONNX text encoder.

        A copy of `tokenizer` receives one trigger token per embedding row, and the
        "text_model.embeddings.token_embedding.weight" tensor is replaced by a copy
        extended with the new rows. The original tensor is put back on exit.

        Yields (patched tokenizer copy, TextualInversionManager).

        Raises Exception if `text_encoder` is not an IAIOnnxRuntimeModel, RuntimeError
        if a trigger token cannot be found after being added, and ValueError if an
        embedding row's shape does not match the model's token embedding shape.
        """
        from .models.base import IAIOnnxRuntimeModel

        if not isinstance(text_encoder, IAIOnnxRuntimeModel):
            raise Exception("Only IAIOnnxRuntimeModel models supported")
        orig_embeddings = None
        try:
            # HACK: The CLIPTokenizer API does not include a way to remove tokens after calling add_tokens(...). As a
            # workaround, we create a full copy of `tokenizer` so that its original behavior can be restored after
            # exiting this `apply_ti(...)` context manager.
            #
            # In a previous implementation, the deep copy was obtained with `ti_tokenizer = copy.deepcopy(tokenizer)`,
            # but a pickle roundtrip was found to be much faster (1 sec vs. 0.05 secs).
            ti_tokenizer = pickle.loads(pickle.dumps(tokenizer))
            ti_manager = TextualInversionManager(ti_tokenizer)

            def _get_trigger(ti_name, index):
                # Row 0 uses the plain name; further rows get a "-!pad-<index>" suffix.
                trigger = ti_name
                if index > 0:
                    trigger += f"-!pad-{index}"
                return f"<{trigger}>"

            # modify text_encoder
            orig_embeddings = text_encoder.tensors["text_model.embeddings.token_embedding.weight"]

            def _get_ti_embedding(ti):
                # Pick the embedding whose row width matches the width of the model's embedding rows
                # (the rows are indexed by token id below, so the width is shape[1]).
                if ti.embedding_2 is not None and ti.embedding_2.shape[1] == orig_embeddings.shape[1]:
                    return ti.embedding_2
                return ti.embedding

            # modify tokenizer
            new_tokens_added = 0
            for ti_name, ti in ti_list:
                ti_embedding = _get_ti_embedding(ti)
                for i in range(ti_embedding.shape[0]):
                    new_tokens_added += ti_tokenizer.add_tokens(_get_trigger(ti_name, i))
            embeddings = np.concatenate(
                (np.copy(orig_embeddings), np.zeros((new_tokens_added, orig_embeddings.shape[1]))),
                axis=0,
            )
            for ti_name, ti in ti_list:
                # Look the embedding up again per TI instead of reusing the last one of the previous loop.
                ti_embedding = _get_ti_embedding(ti)
                ti_tokens = []
                for i in range(ti_embedding.shape[0]):
                    embedding = ti_embedding[i].detach().numpy()
                    trigger = _get_trigger(ti_name, i)
                    token_id = ti_tokenizer.convert_tokens_to_ids(trigger)
                    if token_id == ti_tokenizer.unk_token_id:
                        raise RuntimeError(f"Unable to find token id for token '{trigger}'")
                    if embeddings[token_id].shape != embedding.shape:
                        raise ValueError(
                            f"Cannot load embedding for {trigger}. It was trained on a model with token dimension"
                            f" {embedding.shape[0]}, but the current model has token dimension"
                            f" {embeddings[token_id].shape[0]}."
                        )
                    embeddings[token_id] = embedding
                    ti_tokens.append(token_id)
                # Record the extra tokens of a multi-row embedding under its first token.
                if len(ti_tokens) > 1:
                    ti_manager.pad_tokens[ti_tokens[0]] = ti_tokens[1:]
            text_encoder.tensors["text_model.embeddings.token_embedding.weight"] = embeddings.astype(
                orig_embeddings.dtype
            )
            yield ti_tokenizer, ti_manager
        finally:
            # restore
            if orig_embeddings is not None:
                text_encoder.tensors["text_model.embeddings.token_embedding.weight"] = orig_embeddings
--- a/invokeai/backend/model_management_OLD/memory_snapshot.py
+++ b/invokeai/backend/model_management_OLD/memory_snapshot.py
@ -1,99 +0,0 @@
 import gc
 from typing import Optional
 import psutil
 import torch
 from invokeai.backend.model_management.libc_util import LibcUtil, Struct_mallinfo2
 GB = 2**30  # 1 GB
 class MemorySnapshot:
    """Point-in-time record of RAM and VRAM usage. Every figure is a byte count."""
    def __init__(self, process_ram: int, vram: Optional[int], malloc_info: Optional[Struct_mallinfo2]):
        """Store the three measurements that make up a snapshot.
        Instances are normally obtained through `MemorySnapshot.capture()` rather than built by hand.
        Args:
            process_ram (int): CPU RAM used by the current process.
            vram (Optional[int]): VRAM used by torch, or None when it was not measured.
            malloc_info (Optional[Struct_mallinfo2]): Malloc info obtained from LibcUtil, or None when unavailable.
        """
        self.process_ram, self.vram, self.malloc_info = process_ram, vram, malloc_info
    @classmethod
    def capture(cls, run_garbage_collector: bool = True):
        """Measure current memory usage and wrap it in a MemorySnapshot.
        Note: This is an expensive call, especially when `run_garbage_collector` is True.
        Args:
            run_garbage_collector (bool, optional): When true, gc.collect() runs before the process RAM is read.
                Defaults to True.
        Returns:
            MemorySnapshot
        """
        if run_garbage_collector:
            gc.collect()
        # The psutil docs (https://psutil.readthedocs.io/en/latest/#psutil.Process.memory_info) list rss as
        # supported on all platforms.
        rss_bytes = psutil.Process().memory_info().rss
        # TODO: We could add support for mps.current_allocated_memory() as well. Leaving out for now until we have
        # time to test it properly.
        torch_vram = torch.cuda.memory_allocated() if torch.cuda.is_available() else None
        try:
            libc_stats = LibcUtil().mallinfo2()
        except (OSError, AttributeError):
            # OSError: expected in environments that do not have the 'libc.so.6' shared library.
            # AttributeError: expected in environments that have `libc.so.6` but lack `mallinfo2` (e.g. glibc < 2.33)
            # TODO: Does `mallinfo` work?
            libc_stats = None
        return cls(rss_bytes, torch_vram, libc_stats)
 def get_pretty_snapshot_diff(snapshot_1: Optional[MemorySnapshot], snapshot_2: Optional[MemorySnapshot]) -> str:
    """Render a line-per-metric, human-readable comparison of two `MemorySnapshot`s.
    Returns an empty string when either snapshot is None. The libc and VRAM sections are only included when
    both snapshots carry the corresponding measurement.
    """
    if snapshot_1 is None or snapshot_2 is None:
        return ""
    def get_msg_line(prefix: str, val1: int, val2: int):
        # One report row: label, signed delta, then before -> after, all expressed in GB.
        diff = val2 - val1
        return f"{prefix: <30} ({(diff/GB):+5.3f}): {(val1/GB):5.3f}GB -> {(val2/GB):5.3f}GB\n"
    rows = [get_msg_line("Process RAM", snapshot_1.process_ram, snapshot_2.process_ram)]
    before, after = snapshot_1.malloc_info, snapshot_2.malloc_info
    if before is not None and after is not None:
        rows.append(get_msg_line("libc mmap allocated", before.hblkhd, after.hblkhd))
        rows.append(get_msg_line("libc arena used", before.uordblks, after.uordblks))
        rows.append(get_msg_line("libc arena free", before.fordblks, after.fordblks))
        rows.append(get_msg_line("libc total allocated", before.arena + before.hblkhd, after.arena + after.hblkhd))
        rows.append(get_msg_line("libc total used", before.uordblks + before.hblkhd, after.uordblks + after.hblkhd))
    if snapshot_1.vram is not None and snapshot_2.vram is not None:
        rows.append(get_msg_line("VRAM", snapshot_1.vram, snapshot_2.vram))
    return "".join(rows)
--- a/invokeai/backend/model_management_OLD/model_cache.py
+++ b/invokeai/backend/model_management_OLD/model_cache.py
@ -1,553 +0,0 @@
 """
 Manage a RAM cache of diffusion/transformer models for fast switching.
 They are moved between GPU VRAM and CPU RAM as necessary. If the cache
 grows larger than a preset maximum, then the least recently used
 model will be cleared and (re)loaded from disk when next needed.
 The cache returns context manager generators designed to load the
 model into the GPU within the context, and unload outside the
 context. Use like this:
   cache = ModelCache(max_cache_size=7.5)
   with cache.get_model('runwayml/stable-diffusion-1-5') as SD1,
          cache.get_model('stabilityai/stable-diffusion-2') as SD2:
       do_something_in_GPU(SD1,SD2)
 """
 import gc
 import hashlib
 import math
 import os
 import sys
 import time
 from contextlib import suppress
 from dataclasses import dataclass, field
 from pathlib import Path
 from typing import Any, Dict, Optional, Type, Union, types
 import torch
 import invokeai.backend.util.logging as logger
 from invokeai.backend.model_management.memory_snapshot import MemorySnapshot, get_pretty_snapshot_diff
 from invokeai.backend.model_management.model_load_optimizations import skip_torch_weight_init
 from ..util.devices import choose_torch_device
 from .models import BaseModelType, ModelBase, ModelType, SubModelType
 if choose_torch_device() == torch.device("mps"):
    from torch import mps
 # Maximum size of the cache, in gigs
 # Default is roughly enough to hold three fp16 diffusers models in RAM simultaneously
 DEFAULT_MAX_CACHE_SIZE = 6.0
 # amount of GPU memory to hold in reserve for use by generations (GB)
 DEFAULT_MAX_VRAM_CACHE_SIZE = 2.75
 # actual size of a gig
 GIG = 1073741824
 # Size of a MB in bytes.
 MB = 2**20
@dataclass
class CacheStats:
    """Counters describing model-cache activity; every field starts at zero / empty."""
    # cache hits
    hits: int = 0
    # cache misses
    misses: int = 0
    # amount of cache used
    high_watermark: int = 0
    # number of models in cache
    in_cache: int = 0
    # number of models cleared to make space
    cleared: int = 0
    # total size of cache
    cache_size: int = 0
    # {submodel_key => size}
    loaded_model_sizes: Dict[str, int] = field(default_factory=dict)
 class ModelLocker:
    "Forward declaration"
    # Empty placeholder so the name exists at module level before the real definitions further down.
 class ModelCache:
    "Forward declaration"
    # Empty placeholder so `_CacheRecord` can annotate with this name; the full class is defined later.
 class _CacheRecord:
    """Bookkeeping entry for one cached model: its size, the owning cache and a lock counter."""
    size: int
    model: Any
    cache: ModelCache
    _locks: int
    def __init__(self, cache, model: Any, size: int):
        self._locks = 0
        self.cache = cache
        self.model = model
        self.size = size
    def lock(self):
        """Add one lock to the record."""
        self._locks = self._locks + 1
    def unlock(self):
        """Remove one lock; asserts that the count never drops below zero."""
        self._locks = self._locks - 1
        assert self._locks >= 0
    @property
    def locked(self):
        """True while at least one lock is held."""
        return self._locks > 0
    @property
    def loaded(self):
        """True when the model exposes a `device` that differs from the cache's storage device."""
        held = self.model
        if held is None or not hasattr(held, "device"):
            return False
        return held.device != self.cache.storage_device
 class ModelCache(object):
    def __init__(
        self,
        max_cache_size: float = DEFAULT_MAX_CACHE_SIZE,
        max_vram_cache_size: float = DEFAULT_MAX_VRAM_CACHE_SIZE,
        execution_device: torch.device = torch.device("cuda"),
        storage_device: torch.device = torch.device("cpu"),
        precision: torch.dtype = torch.float16,
        sequential_offload: bool = False,
        lazy_offloading: bool = True,
        sha_chunksize: int = 16777216,
        logger: types.ModuleType = logger,
        log_memory_usage: bool = False,
    ):
        """
        :param max_cache_size: Maximum size of the RAM cache [6.0 GB]
        :param execution_device: Torch device to load active model into [torch.device('cuda')]
        :param storage_device: Torch device to save inactive model in [torch.device('cpu')]
        :param precision: Precision for loaded models [torch.float16]
        :param lazy_offloading: Keep model in VRAM until another model needs to be loaded
        :param sequential_offload: Conserve VRAM by loading and unloading each stage of the pipeline sequentially
        :param sha_chunksize: Chunksize to use when calculating sha256 model hash
        :param log_memory_usage: If True, a memory snapshot will be captured before and after every model cache
            operation, and the result will be logged (at debug level). There is a time cost to capturing the memory
            snapshots, so it is recommended to disable this feature unless you are actively inspecting the model cache's
            behaviour.
        """
        self.model_infos: Dict[str, ModelBase] = {}
        # allow lazy offloading only when vram cache enabled
        self.lazy_offloading = lazy_offloading and max_vram_cache_size > 0
        self.precision: torch.dtype = precision
        self.max_cache_size: float = max_cache_size
        self.max_vram_cache_size: float = max_vram_cache_size
        self.execution_device: torch.device = execution_device
        self.storage_device: torch.device = storage_device
        self.sha_chunksize = sha_chunksize
        self.logger = logger
        self._log_memory_usage = log_memory_usage
        # used for stats collection
        self.stats = None
        self._cached_models = {}
        self._cache_stack = []
    def _capture_memory_snapshot(self) -> Optional[MemorySnapshot]:
        if self._log_memory_usage:
            return MemorySnapshot.capture()
        return None
    def get_key(
        self,
        model_path: str,
        base_model: BaseModelType,
        model_type: ModelType,
        submodel_type: Optional[SubModelType] = None,
    ):
        key = f"{model_path}:{base_model}:{model_type}"
        if submodel_type:
            key += f":{submodel_type}"
        return key
    def _get_model_info(
        self,
        model_path: str,
        model_class: Type[ModelBase],
        base_model: BaseModelType,
        model_type: ModelType,
    ):
        model_info_key = self.get_key(
            model_path=model_path,
            base_model=base_model,
            model_type=model_type,
            submodel_type=None,
        )
        if model_info_key not in self.model_infos:
            self.model_infos[model_info_key] = model_class(
                model_path,
                base_model,
                model_type,
            )
        return self.model_infos[model_info_key]
    # TODO: args
    def get_model(
        self,
        model_path: Union[str, Path],
        model_class: Type[ModelBase],
        base_model: BaseModelType,
        model_type: ModelType,
        submodel: Optional[SubModelType] = None,
        gpu_load: bool = True,
    ) -> Any:
        """
        Return a `ModelLocker` for the requested model, loading the model from disk on a cache miss.
        :param model_path: Location of the model on disk; must exist
        :param model_class: Class instantiated (once per path/base/type) to describe and load the model
        :param base_model: Base model type; part of the cache key
        :param model_type: Model type; part of the cache key
        :param submodel: Optional submodel to load; part of the cache key when given
        :param gpu_load: Handed to the locker; when True, entering the locker moves the model to the execution device
        :raises Exception: if `model_path` does not exist
        """
        if not isinstance(model_path, Path):
            model_path = Path(model_path)
        if not model_path.exists():
            raise Exception(f"Model not found: {model_path}")
        model_info = self._get_model_info(
            model_path=model_path,
            model_class=model_class,
            base_model=base_model,
            model_type=model_type,
        )
        key = self.get_key(
            model_path=model_path,
            base_model=base_model,
            model_type=model_type,
            submodel_type=submodel,
        )
        # TODO: lock for no copies on simultaneous calls?
        cache_entry = self._cached_models.get(key, None)
        if cache_entry is None:
            self.logger.info(
                f"Loading model {model_path}, type"
                f" {base_model.value}:{model_type.value}{':'+submodel.value if submodel else ''}"
            )
            if self.stats:
                self.stats.misses += 1
            self_reported_model_size_before_load = model_info.get_size(submodel)
            # Remove old models from the cache to make room for the new model.
            self._make_cache_room(self_reported_model_size_before_load)
            # Load the model from disk and capture a memory snapshot before/after.
            start_load_time = time.time()
            snapshot_before = self._capture_memory_snapshot()
            with skip_torch_weight_init():
                model = model_info.get_model(child_type=submodel, torch_dtype=self.precision)
            snapshot_after = self._capture_memory_snapshot()
            end_load_time = time.time()
            self_reported_model_size_after_load = model_info.get_size(submodel)
            self.logger.debug(
                f"Moved model '{key}' from disk to cpu in {(end_load_time-start_load_time):.2f}s.\n"
                f"Self-reported size before/after load: {(self_reported_model_size_before_load/GIG):.3f}GB /"
                f" {(self_reported_model_size_after_load/GIG):.3f}GB.\n"
                f"{get_pretty_snapshot_diff(snapshot_before, snapshot_after)}"
            )
            # The pre-load size drove the eviction above, so a large discrepancy is worth surfacing.
            if abs(self_reported_model_size_after_load - self_reported_model_size_before_load) > 10 * MB:
                self.logger.debug(
                    f"Model '{key}' mis-reported its size before load. Self-reported size before/after load:"
                    f" {(self_reported_model_size_before_load/GIG):.2f}GB /"
                    f" {(self_reported_model_size_after_load/GIG):.2f}GB."
                )
            cache_entry = _CacheRecord(self, model, self_reported_model_size_after_load)
            self._cached_models[key] = cache_entry
        else:
            if self.stats:
                self.stats.hits += 1
        if self.stats:
            self.stats.cache_size = self.max_cache_size * GIG
            self.stats.high_watermark = max(self.stats.high_watermark, self._cache_size())
            self.stats.in_cache = len(self._cached_models)
            self.stats.loaded_model_sizes[key] = max(
                self.stats.loaded_model_sizes.get(key, 0), model_info.get_size(submodel)
            )
        # Move the key to the end of the stack (most recently used). `list.remove` only raises ValueError
        # (key not yet tracked), so that is the only exception silenced here.
        with suppress(ValueError):
            self._cache_stack.remove(key)
        self._cache_stack.append(key)
        return self.ModelLocker(self, key, cache_entry.model, gpu_load, cache_entry.size)
    def _move_model_to_device(self, key: str, target_device: torch.device):
        """Move the cached model stored under `key` to `target_device` and log how long it took.
        Nothing happens when the model already sits on a device of the same type. When memory snapshots are
        available, a second debug message is logged if the VRAM change does not match the recorded model size.
        """
        cache_entry = self._cached_models[key]
        source_device = cache_entry.model.device
        # Note: Only device types are compared, so that 'cuda' == 'cuda:0'. This would need to be revised to
        # support multi-GPU.
        already_there = torch.device(source_device).type == torch.device(target_device).type
        if already_there:
            return
        start_model_to_time = time.time()
        snapshot_before = self._capture_memory_snapshot()
        cache_entry.model.to(target_device)
        snapshot_after = self._capture_memory_snapshot()
        end_model_to_time = time.time()
        self.logger.debug(
            f"Moved model '{key}' from {source_device} to"
            f" {target_device} in {(end_model_to_time-start_model_to_time):.2f}s.\n"
            f"Estimated model size: {(cache_entry.size/GIG):.3f} GB.\n"
            f"{get_pretty_snapshot_diff(snapshot_before, snapshot_after)}"
        )
        # The size sanity check needs VRAM readings from both snapshots.
        if snapshot_before is None or snapshot_after is None:
            return
        if snapshot_before.vram is None or snapshot_after.vram is None:
            return
        vram_change = abs(snapshot_before.vram - snapshot_after.vram)
        size_matches = math.isclose(
            vram_change,
            cache_entry.size,
            rel_tol=0.1,
            abs_tol=10 * MB,
        )
        if size_matches:
            return
        # The estimated model size does not match the change in VRAM: report it (at debug level).
        self.logger.debug(
            f"Moving model '{key}' from {source_device} to"
            f" {target_device} caused an unexpected change in VRAM usage. The model's"
            " estimated size may be incorrect. Estimated model size:"
            f" {(cache_entry.size/GIG):.3f} GB.\n"
            f"{get_pretty_snapshot_diff(snapshot_before, snapshot_after)}"
        )
    class ModelLocker(object):
        """Context manager that holds a cached model on the execution device for the duration of a `with` block."""
        def __init__(self, cache, key, model, gpu_load, size_needed):
            """
            :param cache: The model_cache object
            :param key: The key of the model to lock in GPU
            :param model: The model to lock
            :param gpu_load: True if load into gpu
            :param size_needed: Size of the model to load
            """
            self.gpu_load = gpu_load
            self.cache = cache
            self.key = key
            self.model = model
            self.size_needed = size_needed
            self.cache_entry = self.cache._cached_models[self.key]
            # Number of locks this locker currently holds on the cache entry. __exit__ releases only these, so
            # a locker entered with gpu_load=False (which never locks) cannot drive the entry's count negative.
            self._held_locks = 0
        def __enter__(self) -> Any:
            """Return the model, first moving it to the execution device (and locking it) when `gpu_load` is set."""
            if not hasattr(self.model, "to"):
                return self.model
            # NOTE that the model has to have the to() method in order for this
            # code to move it into GPU!
            if self.gpu_load:
                self.cache_entry.lock()
                try:
                    if self.cache.lazy_offloading:
                        self.cache._offload_unlocked_models(self.size_needed)
                    self.cache._move_model_to_device(self.key, self.cache.execution_device)
                    self.cache.logger.debug(f"Locking {self.key} in {self.cache.execution_device}")
                    self.cache._print_cuda_stats()
                except Exception:
                    # Loading failed: give the lock back before propagating the error.
                    self.cache_entry.unlock()
                    raise
                self._held_locks += 1
            # TODO: not fully understand
            # in the event that the caller wants the model in RAM, we
            # move it into CPU if it is in GPU and not locked
            elif self.cache_entry.loaded and not self.cache_entry.locked:
                self.cache._move_model_to_device(self.key, self.cache.storage_device)
            return self.model
        def __exit__(self, type, value, traceback):
            """Release the lock taken by `__enter__` (if any) and offload immediately unless lazy offloading is on."""
            if not hasattr(self.model, "to"):
                return
            if self._held_locks > 0:
                self._held_locks -= 1
                self.cache_entry.unlock()
            if not self.cache.lazy_offloading:
                self.cache._offload_unlocked_models()
                self.cache._print_cuda_stats()
    # TODO: should it be called untrack_model?
    def uncache_model(self, cache_id: str):
        with suppress(ValueError):
            self._cache_stack.remove(cache_id)
        self._cached_models.pop(cache_id, None)
    def model_hash(
        self,
        model_path: Union[str, Path],
    ) -> str:
        """
        Given the HF repo id or path to a model on disk, returns a unique
        hash. Works for legacy checkpoint files, HF models on disk, and HF repo IDs
        :param model_path: Path to model file/directory on disk.
        """
        return self._local_model_hash(model_path)
    def cache_size(self) -> float:
        """Report how much the cache currently holds, expressed in GB."""
        total_bytes = self._cache_size()
        return total_bytes / GIG
    def _has_cuda(self) -> bool:
        return self.execution_device.type == "cuda"
    def _print_cuda_stats(self):
        """Log (at debug level) current VRAM and cache usage plus counts of cached, loaded and locked models."""
        vram = "%4.2fG" % (torch.cuda.memory_allocated() / GIG)
        ram = "%4.2fG" % self.cache_size()
        records = list(self._cached_models.values())
        cached_models = len(records)
        loaded_models = sum(1 for record in records if record.loaded)
        locked_models = sum(1 for record in records if record.locked)
        self.logger.debug(
            f"Current VRAM/RAM usage: {vram}/{ram}; cached_models/loaded_models/locked_models/ ="
            f" {cached_models}/{loaded_models}/{locked_models}"
        )
    def _cache_size(self) -> int:
        return sum([m.size for m in self._cached_models.values()])
    def _make_cache_room(self, model_size):
        """Evict cached models until `model_size` more bytes fit under `max_cache_size`, or nothing else can go.

        Candidates are taken from the front of `_cache_stack` (keys are re-appended on every `get_model` call, so
        the front holds the least recently requested models). An entry is evicted only when it is not locked and
        its model's reference count is at the expected baseline; otherwise it is skipped. Afterwards the garbage
        collector runs if anything was evicted, and the torch CUDA (and, on mps, MPS) caches are emptied.

        :param model_size: Number of bytes the incoming model is expected to need
        """
        # calculate how much memory this model will require
        # multiplier = 2 if self.precision==torch.float32 else 1
        bytes_needed = model_size
        maximum_size = self.max_cache_size * GIG  # stored in GB, convert to bytes
        current_size = self._cache_size()
        if current_size + bytes_needed > maximum_size:
            self.logger.debug(
                f"Max cache size exceeded: {(current_size/GIG):.2f}/{self.max_cache_size:.2f} GB, need an additional"
                f" {(bytes_needed/GIG):.2f} GB"
            )
        self.logger.debug(f"Before unloading: cached_models={len(self._cached_models)}")
        # `pos` only advances past entries that could not be evicted; deleting an entry shifts the next one into
        # the same position.
        pos = 0
        models_cleared = 0
        while current_size + bytes_needed > maximum_size and pos < len(self._cache_stack):
            model_key = self._cache_stack[pos]
            cache_entry = self._cached_models[model_key]
            refs = sys.getrefcount(cache_entry.model)
            # HACK: This is a workaround for a memory-management issue that we haven't tracked down yet. We are directly
            # going against the advice in the Python docs by using `gc.get_referrers(...)` in this way:
            # https://docs.python.org/3/library/gc.html#gc.get_referrers
            # Manually clear local variable references held by frames of function calls that have just finished.
            # For some reason Python doesn't collect them immediately, even with gc.collect().
            if refs > 2:
                while True:
                    cleared = False
                    for referrer in gc.get_referrers(cache_entry.model):
                        if type(referrer).__name__ == "frame":
                            # RuntimeError: cannot clear an executing frame
                            with suppress(RuntimeError):
                                referrer.clear()
                                cleared = True
                                # break
                    # repeat if the referrers changed (due to a frame clear), else exit the loop
                    if cleared:
                        gc.collect()
                    else:
                        break
            device = cache_entry.model.device if hasattr(cache_entry.model, "device") else None
            # NOTE: `refs` was sampled before the frame-clearing pass above and is not re-read afterwards.
            self.logger.debug(
                f"Model: {model_key}, locks: {cache_entry._locks}, device: {device}, loaded: {cache_entry.loaded},"
                f" refs: {refs}"
            )
            # Expected refs:
            # 1 from cache_entry
            # 1 from getrefcount function
            # 1 from onnx runtime object
            if not cache_entry.locked and refs <= (3 if "onnx" in model_key else 2):
                self.logger.debug(
                    f"Unloading model {model_key} to free {(model_size/GIG):.2f} GB (-{(cache_entry.size/GIG):.2f} GB)"
                )
                current_size -= cache_entry.size
                models_cleared += 1
                if self.stats:
                    self.stats.cleared += 1
                del self._cache_stack[pos]
                del self._cached_models[model_key]
                del cache_entry
            else:
                pos += 1
        if models_cleared > 0:
            # There would likely be some 'garbage' to be collected regardless of whether a model was cleared or not, but
            # there is a significant time cost to calling `gc.collect()`, so we want to use it sparingly. (The time cost
            # is high even if no garbage gets collected.)
            #
            # Calling gc.collect(...) when a model is cleared seems like a good middle-ground:
            # - If models had to be cleared, it's a signal that we are close to our memory limit.
            # - If models were cleared, there's a good chance that there's a significant amount of garbage to be
            #   collected.
            #
            # Keep in mind that gc is only responsible for handling reference cycles. Most objects should be cleaned up
            # immediately when their reference count hits 0.
            gc.collect()
        torch.cuda.empty_cache()
        if choose_torch_device() == torch.device("mps"):
            mps.empty_cache()
        self.logger.debug(f"After unloading: cached_models={len(self._cached_models)}")
    def _offload_unlocked_models(self, size_needed: int = 0):
        """Move unlocked, loaded models to the storage device until VRAM use is within `max_vram_cache_size`.
        Entries are visited from smallest to largest recorded size. `size_needed` is accepted but not used.
        The torch CUDA cache (and the MPS cache on mps devices) is emptied at the end.
        """
        reserved = self.max_vram_cache_size * GIG
        vram_in_use = torch.cuda.memory_allocated()
        self.logger.debug(f"{(vram_in_use/GIG):.2f}GB VRAM used for models; max allowed={(reserved/GIG):.2f}GB")
        smallest_first = sorted(self._cached_models.items(), key=lambda item: item[1].size)
        for model_key, cache_entry in smallest_first:
            if vram_in_use <= reserved:
                break
            if cache_entry.locked or not cache_entry.loaded:
                continue
            self._move_model_to_device(model_key, self.storage_device)
            vram_in_use = torch.cuda.memory_allocated()
            self.logger.debug(f"{(vram_in_use/GIG):.2f}GB VRAM used for models; max allowed={(reserved/GIG):.2f}GB")
        torch.cuda.empty_cache()
        if choose_torch_device() == torch.device("mps"):
            mps.empty_cache()
    def _local_model_hash(self, model_path: Union[str, Path]) -> str:
        sha = hashlib.sha256()
        path = Path(model_path)
        hashpath = path / "checksum.sha256"
        if hashpath.exists() and path.stat().st_mtime <= hashpath.stat().st_mtime:
            with open(hashpath) as f:
                hash = f.read()
            return hash
        self.logger.debug(f"computing hash of model {path.name}")
        for file in list(path.rglob("*.ckpt")) + list(path.rglob("*.safetensors")) + list(path.rglob("*.pth")):
            with open(file, "rb") as f:
                while chunk := f.read(self.sha_chunksize):
                    sha.update(chunk)
        hash = sha.hexdigest()
        with open(hashpath, "w") as f:
            f.write(hash)
        return hash
--- a/invokeai/backend/model_management_OLD/model_load_optimizations.py
+++ b/invokeai/backend/model_management_OLD/model_load_optimizations.py
@ -1,30 +0,0 @@
 from contextlib import contextmanager
 import torch
 def _no_op(*args, **kwargs):
    """Accept any arguments and do nothing."""
    return None
@contextmanager
def skip_torch_weight_init():
    """Context manager that temporarily turns weight initialization into a no-op for common torch layers.
    `torch.nn.Linear` and `torch.nn.ConvNd` layers normally initialize their weights (according to a particular
    distribution) inside __init__. That step can take a significant amount of time and is wasted effort when the
    weights are about to be overwritten by a checkpoint loaded from disk. While the context is active,
    `reset_parameters` on the patched classes does nothing; the original functions are put back on exit, even if
    the body raises.
    """
    patched_classes = (torch.nn.Linear, torch.nn.modules.conv._ConvNd, torch.nn.Embedding)
    # Remember every original first, so restoration does not depend on how far patching got.
    originals = {layer_cls: layer_cls.reset_parameters for layer_cls in patched_classes}
    try:
        for layer_cls in patched_classes:
            layer_cls.reset_parameters = _no_op
        yield None
    finally:
        for layer_cls, original in originals.items():
            layer_cls.reset_parameters = original
--- a/invokeai/backend/model_management_OLD/model_manager.py
+++ b/invokeai/backend/model_management_OLD/model_manager.py
--- a/invokeai/backend/model_management_OLD/model_merge.py
+++ b/invokeai/backend/model_management_OLD/model_merge.py
@ -1,140 +0,0 @@
 """
 invokeai.backend.model_management.model_merge exports:
 merge_diffusion_models() -- combine multiple models by location and return a pipeline object
 merge_diffusion_models_and_save() -- combine multiple models by ModelManager ID and write to models.yaml
 Copyright (c) 2023 Lincoln Stein and the InvokeAI Development Team
 """
 import warnings
 from enum import Enum
 from pathlib import Path
 from typing import List, Optional, Union
 from diffusers import DiffusionPipeline
 from diffusers import logging as dlogging
 import invokeai.backend.util.logging as logger
 from ...backend.model_management import AddModelResult, BaseModelType, ModelManager, ModelType, ModelVariantType
 class MergeInterpolationMethod(str, Enum):
    """Interpolation methods selectable for a merge; each value is the string handed to the merge pipeline."""
    # Members are also `str` instances, so they compare equal to their plain string values.
    WeightedSum = "weighted_sum"
    Sigmoid = "sigmoid"
    InvSigmoid = "inv_sigmoid"
    AddDifference = "add_difference"
 class ModelMerger(object):
    """Merges diffusers models and, optionally, saves and registers the result with a `ModelManager`."""
    def __init__(self, manager: ModelManager):
        """
        :param manager: ModelManager used to look up the source models and to register the merged one
        """
        self.manager = manager
    def merge_diffusion_models(
        self,
        model_paths: List[Path],
        alpha: float = 0.5,
        interp: Optional[MergeInterpolationMethod] = None,
        force: bool = False,
        **kwargs,
    ) -> DiffusionPipeline:
        """
        Merge the given models and return the resulting pipeline. Warnings and diffusers log output are
        suppressed while merging; the previous diffusers verbosity is restored afterwards, even on error.
        :param model_paths:  up to three models, designated by their local paths or HuggingFace repo_ids
        :param alpha: The interpolation parameter. Ranges from 0 to 1.  It affects the ratio in which the checkpoints are merged. A 0.8 alpha
                   would mean that the first model checkpoints would affect the final result far less than an alpha of 0.2
        :param interp: The interpolation method to use for the merging. Supports "sigmoid", "inv_sigmoid", "add_difference" and None.
                   Passing None uses the default interpolation which is weighted sum interpolation. For merging three checkpoints, only "add_difference" is supported.
        :param force:  Whether to ignore mismatch in model_config.json for the current models. Defaults to False.
        **kwargs - the default DiffusionPipeline.get_config_dict kwargs:
             cache_dir, resume_download, force_download, proxies, local_files_only, use_auth_token, revision, torch_dtype, device_map
        """
        with warnings.catch_warnings():
            warnings.simplefilter("ignore")
            verbosity = dlogging.get_verbosity()
            dlogging.set_verbosity_error()
            try:
                pipe = DiffusionPipeline.from_pretrained(
                    model_paths[0],
                    custom_pipeline="checkpoint_merger",
                )
                merged_pipe = pipe.merge(
                    pretrained_model_name_or_path_list=model_paths,
                    alpha=alpha,
                    interp=interp.value if interp else None,  # diffusers API treats None as "weighted sum"
                    force=force,
                    **kwargs,
                )
            finally:
                # The verbosity is process-wide state: put it back even when loading or merging fails.
                dlogging.set_verbosity(verbosity)
        return merged_pipe
    def merge_diffusion_models_and_save(
        self,
        model_names: List[str],
        base_model: Union[BaseModelType, str],
        merged_model_name: str,
        alpha: float = 0.5,
        interp: Optional[MergeInterpolationMethod] = None,
        force: bool = False,
        merge_dest_directory: Optional[Path] = None,
        **kwargs,
    ) -> AddModelResult:
        """
        Merge the named models, save the merged pipeline to disk and register it with the model manager
        (replacing any existing model of the same name).
        :param model_names: up to three models, designated by their InvokeAI models.yaml model name
        :param base_model: base model (must be the same for all merged models!)
        :param merged_model_name: name for new model
        :param alpha: The interpolation parameter. Ranges from 0 to 1.  It affects the ratio in which the checkpoints are merged. A 0.8 alpha
                   would mean that the first model checkpoints would affect the final result far less than an alpha of 0.2
        :param interp: The interpolation method to use for the merging. Supports "weighted_sum", "sigmoid", "inv_sigmoid", "add_difference" and None.
                   Passing None uses the default interpolation which is weighted sum interpolation. For merging three checkpoints, only "add_difference" is supported. Add_difference is A+(B-C).
        :param force:  Whether to ignore mismatch in model_config.json for the current models. Defaults to False.
        :param merge_dest_directory: Save the merged model to the designated directory (with 'merged_model_name' appended)
        **kwargs - the default DiffusionPipeline.get_config_dict kwargs:
             cache_dir, resume_download, force_download, proxies, local_files_only, use_auth_token, revision, torch_dtype, device_map
        """
        model_paths = []
        config = self.manager.app_config
        base_model = BaseModelType(base_model)
        vae = None
        for mod in model_names:
            info = self.manager.list_model(mod, base_model=base_model, model_type=ModelType.Main)
            assert info, f"model {mod}, base_model {base_model}, is unknown"
            assert (
                info["model_format"] == "diffusers"
            ), f"{mod} is not a diffusers model. It must be optimized before merging"
            assert info["variant"] == "normal", f"{mod} is a {info['variant']} model, which cannot currently be merged"
            assert (
                len(model_names) <= 2 or interp == MergeInterpolationMethod.AddDifference
            ), "When merging three models, only the 'add_difference' merge method is supported"
            # pick up the first model's vae
            if mod == model_names[0]:
                vae = info.get("vae")
            model_paths.append((config.root_path / info["path"]).as_posix())
        # Both None (the default) and "weighted_sum" select the pipeline's default weighted-sum merge. None
        # must be handled here because MergeInterpolationMethod(None) raises ValueError.
        merge_method = None if interp is None or interp == "weighted_sum" else MergeInterpolationMethod(interp)
        logger.debug(f"interp = {interp}, merge_method={merge_method}")
        merged_pipe = self.merge_diffusion_models(model_paths, alpha, merge_method, force, **kwargs)
        dump_dir = (
            Path(merge_dest_directory)
            if merge_dest_directory
            else config.models_path / base_model.value / ModelType.Main.value
        )
        dump_dir.mkdir(parents=True, exist_ok=True)
        dump_path = (dump_dir / merged_model_name).as_posix()
        merged_pipe.save_pretrained(dump_path, safe_serialization=True)
        attributes = {
            "path": dump_path,
            "description": f"Merge of models {', '.join(model_names)}",
            "model_format": "diffusers",
            "variant": ModelVariantType.Normal.value,
            "vae": vae,
        }
        return self.manager.add_model(
            merged_model_name,
            base_model=base_model,
            model_type=ModelType.Main,
            model_attributes=attributes,
            clobber=True,
        )
--- a/invokeai/backend/model_management_OLD/model_probe.py
+++ b/invokeai/backend/model_management_OLD/model_probe.py
@ -1,664 +0,0 @@
 import json
 import re
 from dataclasses import dataclass
 from pathlib import Path
 from typing import Callable, Dict, Literal, Optional, Union
 import safetensors.torch
 import torch
 from diffusers import ConfigMixin, ModelMixin
 from picklescan.scanner import scan_file_path
 from invokeai.backend.model_management.models.ip_adapter import IPAdapterModelFormat
 from .models import (
    BaseModelType,
    InvalidModelException,
    ModelType,
    ModelVariantType,
    SchedulerPredictionType,
    SilenceWarnings,
 )
 from .models.base import read_checkpoint_meta
 from .util import lora_token_vector_length
@dataclass
 class ModelProbeInfo(object):
    """Result record built by ModelProbe.probe() describing a single probed model."""
    model_type: ModelType
    base_type: BaseModelType
    variant_type: ModelVariantType
    prediction_type: SchedulerPredictionType
    # probe() sets this to True only for SD-2 base models whose prediction type is v-prediction
    upcast_attention: bool
    format: Literal["diffusers", "checkpoint", "lycoris", "olive", "onnx"]
    # probe() fills in 1024 for SDXL / SDXL-refiner, 768 for SD-2 v-prediction, otherwise 512
    image_size: int
    # probe() derives both of these from the model path; they default to None
    name: Optional[str] = None
    description: Optional[str] = None
 class ProbeBase:
    """Forward declaration; the full ProbeBase class is defined later in this module."""
 class ModelProbe(object):
    # Registry of probe classes, keyed first by storage format and then by ModelType.
    # Entries are added through register_probe().
    PROBES = {
        "diffusers": {},
        "checkpoint": {},
        "onnx": {},
    }
    # Maps a class name (read from a folder's config file, or taken from an in-memory
    # model object) to the ModelType it represents; see get_model_type_from_folder().
    CLASS2TYPE = {
        "StableDiffusionPipeline": ModelType.Main,
        "StableDiffusionInpaintPipeline": ModelType.Main,
        "StableDiffusionXLPipeline": ModelType.Main,
        "StableDiffusionXLImg2ImgPipeline": ModelType.Main,
        "StableDiffusionXLInpaintPipeline": ModelType.Main,
        "LatentConsistencyModelPipeline": ModelType.Main,
        "AutoencoderKL": ModelType.Vae,
        "AutoencoderTiny": ModelType.Vae,
        "ControlNetModel": ModelType.ControlNet,
        "CLIPVisionModelWithProjection": ModelType.CLIPVision,
        "T2IAdapter": ModelType.T2IAdapter,
    }
    @classmethod
    def register_probe(
        cls, format: Literal["diffusers", "checkpoint", "onnx"], model_type: ModelType, probe_class: ProbeBase
    ):
        """
        Record the probe class to use for a given storage format and model type.
        :param format: Key of the PROBES sub-registry to update
        :param model_type: Model type the probe class handles
        :param probe_class: Probe class stored for later lookup by probe()
        """
        registry_for_format = cls.PROBES[format]
        registry_for_format[model_type] = probe_class
    @classmethod
    def heuristic_probe(
        cls,
        model: Union[Dict, ModelMixin, Path],
        prediction_type_helper: Callable[[Path], SchedulerPredictionType] = None,
    ) -> ModelProbeInfo:
        """
        Probe a model given either its location on disk or an already-loaded object.
        :param model: A Path to probe from disk, or a dict / ModelMixin / ConfigMixin
            object that is passed to probe() as the in-memory model
        :param prediction_type_helper: Optional callable forwarded unchanged to probe()
        :return: Whatever probe() returns for the model
        :raises InvalidModelException: if `model` is none of the accepted types
        """
        if isinstance(model, Path):
            return cls.probe(model_path=model, prediction_type_helper=prediction_type_helper)
        if isinstance(model, (dict, ModelMixin, ConfigMixin)):
            return cls.probe(model_path=None, model=model, prediction_type_helper=prediction_type_helper)
        # The message must be an f-string; a plain literal would print "{model}" verbatim.
        raise InvalidModelException(f"model parameter {model!r} is neither a Path, nor a model")
    @classmethod
    def probe(
        cls,
        model_path: Path,
        model: Optional[Union[Dict, ModelMixin]] = None,
        prediction_type_helper: Optional[Callable[[Path], SchedulerPredictionType]] = None,
    ) -> ModelProbeInfo:
        """
        Inspect a model and describe it well enough to file it in the models directory.
        :param model_path: Location of the model; a directory is treated as "diffusers"
            format and anything else as "checkpoint"
        :param model: Optional already-loaded model, passed on to the type detection and
            probe class so the file need not be opened again. When model_path is falsy
            the Python type of this object decides the format instead
        :param prediction_type_helper: Callable that receives the model path and returns
            a SchedulerPredictionType; handed to the probe class
        :return: A ModelProbeInfo, or None when no probe class is registered for the
            detected format and model type. Exceptions from the probe propagate unchanged
        """
        if model_path:
            format_type = "diffusers" if model_path.is_dir() else "checkpoint"
        elif isinstance(model, (ConfigMixin, ModelMixin)):
            format_type = "diffusers"
        else:
            format_type = "checkpoint"
        if format_type == "diffusers":
            model_type = cls.get_model_type_from_folder(model_path, model)
        else:
            model_type = cls.get_model_type_from_checkpoint(model_path, model)
        # ONNX models are detected as folders but have their own probe registry
        if model_type == ModelType.ONNX:
            format_type = "onnx"
        probe_class = cls.PROBES[format_type].get(model_type)
        if not probe_class:
            return None
        probe = probe_class(model_path, model, prediction_type_helper)
        base_type = probe.get_base_type()
        variant_type = probe.get_variant_type()
        prediction_type = probe.get_scheduler_prediction_type()
        name = cls.get_model_name(model_path)
        description = f"{base_type.value} {model_type.value} model {name}"
        model_format = probe.get_format()
        # SD-2 v-prediction models get both upcast attention and the 768 image size
        sd2_v_prediction = (
            base_type == BaseModelType.StableDiffusion2 and prediction_type == SchedulerPredictionType.VPrediction
        )
        if base_type in {BaseModelType.StableDiffusionXL, BaseModelType.StableDiffusionXLRefiner}:
            image_size = 1024
        elif sd2_v_prediction:
            image_size = 768
        else:
            image_size = 512
        return ModelProbeInfo(
            model_type=model_type,
            base_type=base_type,
            variant_type=variant_type,
            prediction_type=prediction_type,
            name=name,
            description=description,
            upcast_attention=sd2_v_prediction,
            format=model_format,
            image_size=image_size,
        )
    @classmethod
    def get_model_name(cls, model_path: Path) -> str:
        """
        Derive a display name from the model path.
        :param model_path: Path of the model file or folder
        :return: The file stem when the suffix is a known weights extension, otherwise
            the final path component unchanged
        """
        has_weights_suffix = model_path.suffix in {".safetensors", ".bin", ".pt", ".ckpt"}
        return model_path.stem if has_weights_suffix else model_path.name
    @classmethod
    def get_model_type_from_checkpoint(cls, model_path: Path, checkpoint: dict) -> ModelType:
        """
        Guess the model type of a single-file checkpoint from its tensor key names.
        :param model_path: Path of the checkpoint file
        :param checkpoint: Already-loaded checkpoint dict; when falsy the metadata is
            read from model_path via read_checkpoint_meta(..., scan=True)
        :return: The detected ModelType, or None when the file suffix is not a
            recognised weights extension
        :raises InvalidModelException: if no key pattern matches
        """
        if model_path.suffix not in (".bin", ".pt", ".ckpt", ".safetensors", ".pth"):
            return None
        if model_path.name == "learned_embeds.bin":
            return ModelType.TextualInversion
        state = checkpoint or read_checkpoint_meta(model_path, scan=True)
        state = state.get("state_dict", state)
        main_prefixes = ("cond_stage_model.", "first_stage_model.", "model.diffusion_model.")
        vae_prefixes = ("encoder.conv_in", "decoder.conv_in")
        lora_prefixes = ("lora_te_", "lora_unet_")
        lora_suffixes = ("to_k_lora.up.weight", "to_q_lora.down.weight")
        controlnet_prefixes = ("control_model", "input_blocks")
        # The first key that matches any pattern decides the type, so order matters here.
        for key in state.keys():
            if key.startswith(main_prefixes):
                return ModelType.Main
            if key.startswith(vae_prefixes):
                return ModelType.Vae
            if key.startswith(lora_prefixes) or key.endswith(lora_suffixes):
                return ModelType.Lora
            if key.startswith(controlnet_prefixes):
                return ModelType.ControlNet
            if key in {"emb_params", "string_to_param"}:
                return ModelType.TextualInversion
        # diffusers-ti: a handful of entries, every one of them a tensor
        if len(state) < 10 and all(isinstance(v, torch.Tensor) for v in state.values()):
            return ModelType.TextualInversion
        raise InvalidModelException(f"Unable to determine model type for {model_path}")
    @classmethod
    def get_model_type_from_folder(cls, folder_path: Path, model: ModelMixin) -> ModelType:
        """
        Get the model type of a hugging-face style folder.
        :param folder_path: Folder holding the model files
        :param model: Optional in-memory model; when truthy its class name is used and
            the folder is not inspected
        :return: The ModelType found from marker files or from the class name in
            model_index.json / config.json
        :raises InvalidModelException: if the type cannot be determined; the message
            says whether the config file was missing or named an unsupported class
        """
        class_name = None
        error_hint = None
        if model:
            class_name = model.__class__.__name__
        else:
            # Marker files identify these types without reading any config
            for suffix in ["bin", "safetensors"]:
                if (folder_path / f"learned_embeds.{suffix}").exists():
                    return ModelType.TextualInversion
                if (folder_path / f"pytorch_lora_weights.{suffix}").exists():
                    return ModelType.Lora
            if (folder_path / "unet/model.onnx").exists():
                return ModelType.ONNX
            if (folder_path / "image_encoder.txt").exists():
                return ModelType.IPAdapter
            i = folder_path / "model_index.json"
            c = folder_path / "config.json"
            config_path = i if i.exists() else c if c.exists() else None
            if config_path:
                with open(config_path, "r") as file:
                    conf = json.load(file)
                if "_class_name" in conf:
                    class_name = conf["_class_name"]
                elif "architectures" in conf:
                    class_name = conf["architectures"][0]
                else:
                    class_name = None
            else:
                error_hint = f"No model_index.json or config.json found in {folder_path}."
        if class_name and (model_type := cls.CLASS2TYPE.get(class_name)):
            return model_type
        # Keep the more specific "no config file" hint when one was recorded above;
        # unconditionally assigning here would discard it.
        if error_hint is None:
            error_hint = f"class {class_name} is not one of the supported classes [{', '.join(cls.CLASS2TYPE.keys())}]"
        # give up
        raise InvalidModelException(f"Unable to determine model type for {folder_path}; {error_hint}")
    @classmethod
    def _scan_and_load_checkpoint(cls, model_path: Path) -> dict:
        """
        Load a checkpoint file, scanning pickle-based formats first.
        :param model_path: Path of the file to load
        :return: The loaded contents; .ckpt/.pt/.bin files go through _scan_model() and
            torch.load on the CPU, everything else through safetensors
        """
        with SilenceWarnings():
            needs_scan = model_path.suffix.endswith((".ckpt", ".pt", ".bin"))
            if not needs_scan:
                return safetensors.torch.load_file(model_path)
            cls._scan_model(model_path, model_path)
            return torch.load(model_path, map_location="cpu")
    @classmethod
    def _scan_model(cls, model_name, checkpoint):
        """
        Apply picklescanner to the indicated checkpoint and abort if it flags anything.
        :param model_name: Name used to identify the model in the error message
        :param checkpoint: Path of the file handed to scan_file_path()
        :raises Exception: if the scan reports a non-zero number of infected files
        """
        # scan model
        scan_result = scan_file_path(checkpoint)
        if scan_result.infected_files != 0:
            # Must be an f-string so the message names the offending model.
            raise Exception(f"The model {model_name} is potentially infected by malware. Aborting import.")
 # ###################################################
 # Probe base class and checkpoint probing
 # ###################################################
 class ProbeBase(object):
    """Interface shared by all probe classes; every default implementation returns None."""
    def get_base_type(self) -> BaseModelType:
        """Report the base model type. Default: None."""
        return None
    def get_variant_type(self) -> ModelVariantType:
        """Report the model variant. Default: None."""
        return None
    def get_scheduler_prediction_type(self) -> SchedulerPredictionType:
        """Report the scheduler prediction type. Default: None."""
        return None
    def get_format(self) -> str:
        """Report the storage format name. Default: None."""
        return None
 class CheckpointProbeBase(ProbeBase):
    """Base class for probes that inspect a single-file checkpoint."""
    def __init__(
        self,
        checkpoint_path: Path,
        checkpoint: dict,
        helper: Optional[Callable[[Path], SchedulerPredictionType]] = None,
    ) -> None:
        """
        :param checkpoint_path: Path of the checkpoint file
        :param checkpoint: Already-loaded checkpoint; when falsy the file is scanned
            and loaded from checkpoint_path
        :param helper: Optional callable that subclasses may consult with the path
        """
        # __init__ returns nothing, so it is annotated "-> None" (was "-> BaseModelType").
        self.checkpoint = checkpoint or ModelProbe._scan_and_load_checkpoint(checkpoint_path)
        self.checkpoint_path = checkpoint_path
        self.helper = helper
    def get_base_type(self) -> BaseModelType:
        """No base type is determined at this level; returns None."""
        pass
    def get_format(self) -> str:
        """Return the format name for single-file models."""
        return "checkpoint"
    def get_variant_type(self) -> ModelVariantType:
        """
        Determine the variant from the input-channel count of the first UNet block.
        Anything that is not a Main model is reported as Normal without inspection.
        :raises InvalidModelException: if the channel count is not 4, 5 or 9
        """
        model_type = ModelProbe.get_model_type_from_checkpoint(self.checkpoint_path, self.checkpoint)
        if model_type != ModelType.Main:
            return ModelVariantType.Normal
        state_dict = self.checkpoint.get("state_dict") or self.checkpoint
        in_channels = state_dict["model.diffusion_model.input_blocks.0.0.weight"].shape[1]
        if in_channels == 9:
            return ModelVariantType.Inpaint
        elif in_channels == 5:
            return ModelVariantType.Depth
        elif in_channels == 4:
            return ModelVariantType.Normal
        else:
            raise InvalidModelException(
                f"Cannot determine variant type (in_channels={in_channels}) at {self.checkpoint_path}"
            )
 class PipelineCheckpointProbe(CheckpointProbeBase):
    """Probe for single-file main (pipeline) checkpoints."""
    def get_base_type(self) -> BaseModelType:
        """
        Identify the base model from the last dimension of a cross-attention weight.
        :raises InvalidModelException: if neither probed key gives a known width
        """
        state_dict = self.checkpoint.get("state_dict") or self.checkpoint
        sd_key = "model.diffusion_model.input_blocks.2.1.transformer_blocks.0.attn2.to_k.weight"
        if sd_key in state_dict:
            width = state_dict[sd_key].shape[-1]
            if width == 768:
                return BaseModelType.StableDiffusion1
            if width == 1024:
                return BaseModelType.StableDiffusion2
        xl_key = "model.diffusion_model.input_blocks.4.1.transformer_blocks.0.attn2.to_k.weight"
        if xl_key in state_dict:
            width = state_dict[xl_key].shape[-1]
            if width == 2048:
                return BaseModelType.StableDiffusionXL
            if width == 1280:
                return BaseModelType.StableDiffusionXLRefiner
        raise InvalidModelException("Cannot determine base type")
    def get_scheduler_prediction_type(self) -> Optional[SchedulerPredictionType]:
        """
        Return model prediction type.
        Returns None when a sibling .yaml file exists or the base type is neither SD-1
        nor SD-2. Otherwise tries, in order: the checkpoint's global_step (SD-2 only),
        the helper callable, and finally a per-base-type default.
        """
        # if there is a .yaml associated with this checkpoint, then we do not need
        # to probe for the prediction type as it will be ignored.
        if self.checkpoint_path and self.checkpoint_path.with_suffix(".yaml").exists():
            return None
        base = self.get_base_type()
        if base == BaseModelType.StableDiffusion2:
            fallback = SchedulerPredictionType.VPrediction  # a guess for sd2 ckpts
            checkpoint = self.checkpoint
            state_dict = checkpoint.get("state_dict") or checkpoint
            key_name = "model.diffusion_model.input_blocks.2.1.transformer_blocks.0.attn2.to_k.weight"
            width_matches = key_name in state_dict and state_dict[key_name].shape[-1] == 1024
            if width_matches and "global_step" in checkpoint:
                if checkpoint["global_step"] == 220000:
                    return SchedulerPredictionType.Epsilon
                if checkpoint["global_step"] == 110000:
                    return SchedulerPredictionType.VPrediction
        elif base == BaseModelType.StableDiffusion1:
            fallback = SchedulerPredictionType.Epsilon  # a reasonable guess for sd1 ckpts
        else:
            return None
        if self.helper and self.checkpoint_path:
            if helper_guess := self.helper(self.checkpoint_path):
                return helper_guess
        return fallback
 class VaeCheckpointProbe(CheckpointProbeBase):
    """Probe for single-file VAE checkpoints."""
    def get_base_type(self) -> BaseModelType:
        """Always report SD-1; the checkpoint contents are not consulted."""
        # I can't find any standalone 2.X VAEs to test with!
        sd1 = BaseModelType.StableDiffusion1
        return sd1
 class LoRACheckpointProbe(CheckpointProbeBase):
    """Probe for single-file LoRA checkpoints."""
    def get_format(self) -> str:
        """Return the format name used for LoRA checkpoints."""
        return "lycoris"
    def get_base_type(self) -> BaseModelType:
        """
        Map the token vector length reported by lora_token_vector_length() to a base type.
        :raises InvalidModelException: if the length is not one of the known values
        """
        token_vector_length = lora_token_vector_length(self.checkpoint)
        known_lengths = (
            (768, BaseModelType.StableDiffusion1),
            (1024, BaseModelType.StableDiffusion2),
            (1280, BaseModelType.StableDiffusionXL),  # recognizes format at https://civitai.com/models/224641
            (2048, BaseModelType.StableDiffusionXL),
        )
        for length, base in known_lengths:
            if token_vector_length == length:
                return base
        raise InvalidModelException(f"Unknown LoRA type: {self.checkpoint_path}")
 class TextualInversionCheckpointProbe(CheckpointProbeBase):
    """Probe for single-file textual inversion embeddings."""
    def get_format(self) -> str:
        """Textual inversions report no format."""
        return None
    def get_base_type(self) -> BaseModelType:
        """
        Infer the base type from the last dimension of the embedding tensor.
        :return: The matching base type, or None when the dimension is not recognised
        """
        checkpoint = self.checkpoint
        # NOTE(review): the presence test uses "string_to_token" but the tensor is read
        # from "string_to_param"; presumably both keys always appear together - confirm.
        if "string_to_token" in checkpoint:
            embedding = list(checkpoint["string_to_param"].values())[0]
        elif "emb_params" in checkpoint:
            embedding = checkpoint["emb_params"]
        elif "clip_g" in checkpoint:
            embedding = checkpoint["clip_g"]
        else:
            embedding = list(checkpoint.values())[0]
        token_dim = embedding.shape[-1]
        known_dims = (
            (768, BaseModelType.StableDiffusion1),
            (1024, BaseModelType.StableDiffusion2),
            (1280, BaseModelType.StableDiffusionXL),
        )
        for dim, base in known_dims:
            if token_dim == dim:
                return base
        return None
 class ControlNetCheckpointProbe(CheckpointProbeBase):
    """Probe for single-file ControlNet checkpoints."""
    def get_base_type(self) -> BaseModelType:
        """
        Identify the base type from the last dimension of a cross-attention weight.
        Two key spellings are tried in turn. When a key is present but its width is
        unrecognised, the helper callable (if any) is asked instead.
        :raises InvalidModelException: if no key yields an answer
        """
        checkpoint = self.checkpoint
        for key_name in (
            "control_model.input_blocks.2.1.transformer_blocks.0.attn2.to_k.weight",
            "input_blocks.2.1.transformer_blocks.0.attn2.to_k.weight",
        ):
            if key_name not in checkpoint:
                continue
            width = checkpoint[key_name].shape[-1]
            if width == 768:
                return BaseModelType.StableDiffusion1
            elif width == 1024:
                return BaseModelType.StableDiffusion2
            elif self.checkpoint_path and self.helper:
                return self.helper(self.checkpoint_path)
        # Must be an f-string so the message names the checkpoint path.
        raise InvalidModelException(f"Unable to determine base type for {self.checkpoint_path}")
 class IPAdapterCheckpointProbe(CheckpointProbeBase):
    """Placeholder probe for IP-Adapter checkpoints."""
    def get_base_type(self) -> BaseModelType:
        """Not implemented for this checkpoint type."""
        raise NotImplementedError()
 class CLIPVisionCheckpointProbe(CheckpointProbeBase):
    """Placeholder probe for CLIP Vision checkpoints."""
    def get_base_type(self) -> BaseModelType:
        """Not implemented for this checkpoint type."""
        raise NotImplementedError()
 class T2IAdapterCheckpointProbe(CheckpointProbeBase):
    """Placeholder probe for T2I-Adapter checkpoints."""
    def get_base_type(self) -> BaseModelType:
        """Not implemented for this checkpoint type."""
        raise NotImplementedError()
 ########################################################
 # classes for probing folders
 #######################################################
 class FolderProbeBase(ProbeBase):
    """Base class for probes that inspect a model stored as a folder."""
    def __init__(self, folder_path: Path, model: ModelMixin = None, helper: Callable = None):  # not used
        """
        :param folder_path: Folder that holds the model files
        :param model: Optional in-memory model that subclasses may read instead
        :param helper: Accepted for signature parity with other probes; not stored
        """
        self.folder_path = folder_path
        self.model = model
    def get_variant_type(self) -> ModelVariantType:
        """Folder models are reported as the Normal variant by default."""
        return ModelVariantType.Normal
    def get_format(self) -> str:
        """Return the format name for folder models."""
        return "diffusers"
 class PipelineFolderProbe(FolderProbeBase):
    """Probe for main (pipeline) models stored as a folder."""
    def _unet_config(self):
        """Return the UNet config from the in-memory model, or from unet/config.json."""
        if self.model:
            return self.model.unet.config
        with open(self.folder_path / "unet" / "config.json", "r") as file:
            return json.load(file)
    def get_base_type(self) -> BaseModelType:
        """
        Map the UNet's cross_attention_dim to a base model type.
        :raises InvalidModelException: if the dimension is not a known value
        """
        cross_attention_dim = self._unet_config()["cross_attention_dim"]
        if cross_attention_dim == 768:
            return BaseModelType.StableDiffusion1
        if cross_attention_dim == 1024:
            return BaseModelType.StableDiffusion2
        if cross_attention_dim == 1280:
            return BaseModelType.StableDiffusionXLRefiner
        if cross_attention_dim == 2048:
            return BaseModelType.StableDiffusionXL
        raise InvalidModelException(f"Unknown base model for {self.folder_path}")
    def get_scheduler_prediction_type(self) -> SchedulerPredictionType:
        """
        Read prediction_type from the scheduler config.
        :return: VPrediction or Epsilon, or None for any other value
        """
        if self.model:
            scheduler_conf = self.model.scheduler.config
        else:
            with open(self.folder_path / "scheduler" / "scheduler_config.json", "r") as file:
                scheduler_conf = json.load(file)
        prediction_type = scheduler_conf["prediction_type"]
        if prediction_type == "v_prediction":
            return SchedulerPredictionType.VPrediction
        if prediction_type == "epsilon":
            return SchedulerPredictionType.Epsilon
        return None
    def get_variant_type(self) -> ModelVariantType:
        """
        Determine the variant from the UNet's in_channels.
        This only works for pipelines! Any kind of exception, or an unrecognised
        channel count, results in the Normal variant being returned.
        """
        try:
            in_channels = self._unet_config()["in_channels"]
            if in_channels == 9:
                return ModelVariantType.Inpaint
            if in_channels == 5:
                return ModelVariantType.Depth
        except Exception:
            pass
        return ModelVariantType.Normal
 class VaeFolderProbe(FolderProbeBase):
    """Probe for VAE models stored as a folder."""
    def get_base_type(self) -> BaseModelType:
        """Report SDXL when either the config or the folder name suggests it, else SD-1."""
        # The name check is a fallback: SD and SDXL VAE are the same shape (3-channel RGB to
        # 4-channel float scaled down by a factor of 8), so we can't necessarily tell them
        # apart by config hyperparameters.
        looks_like_sdxl = self._config_looks_like_sdxl() or self._name_looks_like_sdxl()
        return BaseModelType.StableDiffusionXL if looks_like_sdxl else BaseModelType.StableDiffusion1
    def _config_looks_like_sdxl(self) -> bool:
        """
        Check config.json for the values that mark Stability's SDXL VAE.
        :raises InvalidModelException: if config.json is missing from the folder
        """
        # config values that distinguish Stability's SD 1.x VAE from their SDXL VAE.
        config_file = self.folder_path / "config.json"
        if not config_file.exists():
            raise InvalidModelException(f"Cannot determine base type for {self.folder_path}")
        with open(config_file, "r") as file:
            config = json.load(file)
        if config.get("scaling_factor", 0) != 0.13025:
            return False
        return config.get("sample_size") in [512, 1024]
    def _name_looks_like_sdxl(self) -> bool:
        """Return True when the guessed name contains "xl" at a word boundary (case-insensitive)."""
        match = re.search(r"xl\b", self._guess_name(), re.IGNORECASE)
        return bool(match)
    def _guess_name(self) -> str:
        """Return the folder name, or the parent folder's name when the folder is called "vae"."""
        folder = self.folder_path
        return folder.parent.name if folder.name == "vae" else folder.name
 class TextualInversionFolderProbe(FolderProbeBase):
    """Probe for textual inversion embeddings stored as a folder."""
    def get_format(self) -> str:
        """Textual inversions report no format."""
        return None
    def get_base_type(self) -> BaseModelType:
        """
        Load the folder's learned_embeds file and delegate to the checkpoint probe.
        :return: The base type found by TextualInversionCheckpointProbe, or None when
            the folder contains no learned_embeds file
        """
        # ModelProbe.get_model_type_from_folder() recognises both the .bin and the
        # .safetensors spelling, so both must be accepted here; looking only for .bin
        # left safetensors folders without a base type.
        for suffix in ("bin", "safetensors"):
            path = self.folder_path / f"learned_embeds.{suffix}"
            if path.exists():
                checkpoint = ModelProbe._scan_and_load_checkpoint(path)
                return TextualInversionCheckpointProbe(None, checkpoint=checkpoint).get_base_type()
        return None
 class ONNXFolderProbe(FolderProbeBase):
    """Probe for ONNX models; every answer is a fixed value."""
    def get_format(self) -> str:
        """Return the format name for ONNX models."""
        return "onnx"
    def get_base_type(self) -> BaseModelType:
        """Always report SD-1; the folder is not inspected."""
        sd1 = BaseModelType.StableDiffusion1
        return sd1
    def get_variant_type(self) -> ModelVariantType:
        """Always report the Normal variant."""
        normal = ModelVariantType.Normal
        return normal
 class ControlNetFolderProbe(FolderProbeBase):
    """Probe for ControlNet models stored as a folder."""
    def get_base_type(self) -> BaseModelType:
        """
        Map cross_attention_dim from config.json to a base model type.
        :raises InvalidModelException: if config.json is missing or the dimension
            is not a known value
        """
        config_file = self.folder_path / "config.json"
        if not config_file.exists():
            raise InvalidModelException(f"Cannot determine base type for {self.folder_path}")
        with open(config_file, "r") as file:
            config = json.load(file)
        # no obvious way to distinguish between sd2-base and sd2-768
        dimension = config["cross_attention_dim"]
        if dimension == 768:
            base_model = BaseModelType.StableDiffusion1
        elif dimension == 1024:
            base_model = BaseModelType.StableDiffusion2
        elif dimension == 2048:
            base_model = BaseModelType.StableDiffusionXL
        else:
            base_model = None
        if not base_model:
            raise InvalidModelException(f"Unable to determine model base for {self.folder_path}")
        return base_model
 class LoRAFolderProbe(FolderProbeBase):
    """Probe for LoRA models stored as a folder."""
    def get_base_type(self) -> BaseModelType:
        """
        Find the folder's pytorch_lora_weights file and delegate to the checkpoint probe.
        The .safetensors file is preferred over .bin when both exist.
        :raises InvalidModelException: if neither weights file is present
        """
        candidates = (self.folder_path / f"pytorch_lora_weights.{suffix}" for suffix in ["safetensors", "bin"])
        model_file = next((candidate for candidate in candidates if candidate.exists()), None)
        if not model_file:
            raise InvalidModelException("Unknown LoRA format encountered")
        return LoRACheckpointProbe(model_file, None).get_base_type()
 class IPAdapterFolderProbe(FolderProbeBase):
    """Probe for IP-Adapter models stored as a folder."""
    def get_format(self) -> str:
        """Return the value of the InvokeAI IP-Adapter format."""
        return IPAdapterModelFormat.InvokeAI.value
    def get_base_type(self) -> BaseModelType:
        """
        Read ip_adapter.bin and map its cross-attention dimension to a base type.
        :raises InvalidModelException: if the file is missing or the dimension is unknown
        """
        model_file = self.folder_path / "ip_adapter.bin"
        if not model_file.exists():
            raise InvalidModelException("Unknown IP-Adapter model format.")
        # NOTE(review): this file is loaded with torch.load directly, without the
        # _scan_model() step that _scan_and_load_checkpoint() applies - confirm intended.
        state_dict = torch.load(model_file, map_location="cpu")
        cross_attention_dim = state_dict["ip_adapter"]["1.to_k_ip.weight"].shape[-1]
        known_dims = (
            (768, BaseModelType.StableDiffusion1),
            (1024, BaseModelType.StableDiffusion2),
            (2048, BaseModelType.StableDiffusionXL),
        )
        for dim, base in known_dims:
            if cross_attention_dim == dim:
                return base
        raise InvalidModelException(f"IP-Adapter had unexpected cross-attention dimension: {cross_attention_dim}.")
 class CLIPVisionFolderProbe(FolderProbeBase):
    """Probe for CLIP Vision models stored as a folder."""
    def get_base_type(self) -> BaseModelType:
        """Always report BaseModelType.Any; the folder is not inspected."""
        any_base = BaseModelType.Any
        return any_base
 class T2IAdapterFolderProbe(FolderProbeBase):
    """Probe for T2I-Adapter models stored as a folder."""
    def get_base_type(self) -> BaseModelType:
        """
        Map the adapter_type from config.json to a base model type.
        :raises InvalidModelException: if config.json is missing, or adapter_type is
            absent or not one of the recognised values
        """
        config_file = self.folder_path / "config.json"
        if not config_file.exists():
            raise InvalidModelException(f"Cannot determine base type for {self.folder_path}")
        with open(config_file, "r") as file:
            config = json.load(file)
        adapter_type = config.get("adapter_type", None)
        if adapter_type == "full_adapter_xl":
            return BaseModelType.StableDiffusionXL
        # Membership test instead of `== "full_adapter" or "light_adapter"`: the bare
        # string is always truthy, so every unknown adapter_type used to be reported as
        # SD-1 and the error below could never be raised.
        if adapter_type in ("full_adapter", "light_adapter"):
            # I haven't seen any T2I adapter models for SD2, so assume that this is an SD1 adapter.
            return BaseModelType.StableDiffusion1
        raise InvalidModelException(
            f"Unable to determine base model for '{self.folder_path}' (adapter_type = {adapter_type})."
        )
 ############## register probe classes ######
 # Each call stores a probe class in ModelProbe.PROBES under its format and model type.
 # Folder ("diffusers") probes are listed first, then single-file checkpoint probes, then ONNX.
 ModelProbe.register_probe("diffusers", ModelType.Main, PipelineFolderProbe)
 ModelProbe.register_probe("diffusers", ModelType.Vae, VaeFolderProbe)
 ModelProbe.register_probe("diffusers", ModelType.Lora, LoRAFolderProbe)
 ModelProbe.register_probe("diffusers", ModelType.TextualInversion, TextualInversionFolderProbe)
 ModelProbe.register_probe("diffusers", ModelType.ControlNet, ControlNetFolderProbe)
 ModelProbe.register_probe("diffusers", ModelType.IPAdapter, IPAdapterFolderProbe)
 ModelProbe.register_probe("diffusers", ModelType.CLIPVision, CLIPVisionFolderProbe)
 ModelProbe.register_probe("diffusers", ModelType.T2IAdapter, T2IAdapterFolderProbe)
 ModelProbe.register_probe("checkpoint", ModelType.Main, PipelineCheckpointProbe)
 ModelProbe.register_probe("checkpoint", ModelType.Vae, VaeCheckpointProbe)
 ModelProbe.register_probe("checkpoint", ModelType.Lora, LoRACheckpointProbe)
 ModelProbe.register_probe("checkpoint", ModelType.TextualInversion, TextualInversionCheckpointProbe)
 ModelProbe.register_probe("checkpoint", ModelType.ControlNet, ControlNetCheckpointProbe)
 ModelProbe.register_probe("checkpoint", ModelType.IPAdapter, IPAdapterCheckpointProbe)
 ModelProbe.register_probe("checkpoint", ModelType.CLIPVision, CLIPVisionCheckpointProbe)
 ModelProbe.register_probe("checkpoint", ModelType.T2IAdapter, T2IAdapterCheckpointProbe)
 ModelProbe.register_probe("onnx", ModelType.ONNX, ONNXFolderProbe)
--- a/invokeai/backend/model_management_OLD/model_search.py
+++ b/invokeai/backend/model_management_OLD/model_search.py
@ -1,112 +0,0 @@
 # Copyright 2023, Lincoln D. Stein and the InvokeAI Team
 """
 Abstract base class for recursive directory search for models.
 """
 import os
 from abc import ABC, abstractmethod
 from pathlib import Path
 from typing import List, Set, types
 import invokeai.backend.util.logging as logger
 class ModelSearch(ABC):
    """Template for walking directory trees and reporting everything that looks like a model."""
    def __init__(self, directories: List[Path], logger: types.ModuleType = logger):
        """
        Initialize a recursive model directory search.
        :param directories: List of directory Paths to recurse through
        :param logger: Logger to use
        """
        self.logger = logger
        self.directories = directories
        self._items_scanned = 0
        self._models_found = 0
        self._scanned_dirs = set()
        self._scanned_paths = set()
        self._pruned_paths = set()
    @abstractmethod
    def on_search_started(self):
        """
        Hook invoked by search() before any directory is walked.
        """
        pass
    @abstractmethod
    def on_model_found(self, model: Path):
        """
        Handle one discovered model. Raise an exception if something goes wrong.
        :param model: Model to process - could be a directory or checkpoint.
        """
        pass
    @abstractmethod
    def on_search_completed(self):
        """
        Hook invoked by search() after every directory has been walked. May use
        instance variables, items_scanned and models_found
        """
        pass
    def search(self):
        """Run the started hook, walk each configured directory, then run the completed hook."""
        self.on_search_started()
        for top in self.directories:
            self.walk_directory(top)
        self.on_search_completed()
    def _report_model(self, candidate: Path) -> bool:
        """Pass candidate to on_model_found(); log a warning and return False if it raises."""
        try:
            self.on_model_found(candidate)
            self._models_found += 1
        except Exception as e:
            self.logger.warning(f"Failed to process '{candidate}': {e}")
            return False
        return True
    def walk_directory(self, path: Path):
        """
        Walk one directory tree (following symlinks) and report each model found.
        Directories whose name starts with "." are pruned together with everything
        below them. A sub-directory containing a marker file is reported as a model,
        and files directly inside a reported directory are not reported separately.
        :param path: Root of the tree to walk
        """
        marker_files = (
            "config.json",
            "model_index.json",
            "learned_embeds.bin",
            "pytorch_lora_weights.bin",
            "image_encoder.txt",
        )
        weight_suffixes = {".ckpt", ".bin", ".pth", ".safetensors", ".pt"}
        for root, dirs, files in os.walk(path, followlinks=True):
            here = Path(root)
            if str(here.name).startswith("."):
                self._pruned_paths.add(root)
            if any(here.is_relative_to(pruned) for pruned in self._pruned_paths):
                continue
            self._items_scanned += len(dirs) + len(files)
            for dirname in dirs:
                candidate = here / dirname
                if candidate in self._scanned_paths or candidate.parent in self._scanned_dirs:
                    # anything nested inside an already-reported directory is marked too
                    self._scanned_dirs.add(candidate)
                    continue
                if not any((candidate / marker).exists() for marker in marker_files):
                    continue
                if self._report_model(candidate):
                    self._scanned_dirs.add(candidate)
            for filename in files:
                candidate = here / filename
                if candidate.parent in self._scanned_dirs:
                    continue
                if candidate.suffix in weight_suffixes:
                    self._report_model(candidate)
 class FindModels(ModelSearch):
    """Concrete search that collects every model path it is shown."""
    def on_search_started(self):
        """Start each search with an empty result set."""
        self.models_found: Set[Path] = set()
    def on_model_found(self, model: Path):
        """Remember the discovered model path."""
        self.models_found.add(model)
    def on_search_completed(self):
        """Nothing to do once the search has finished."""
        pass
    def list_models(self) -> List[Path]:
        """Run the search and return the discovered paths as a list."""
        self.search()
        return [*self.models_found]
--- a/invokeai/backend/model_management_OLD/models/init.py
+++ b/invokeai/backend/model_management_OLD/models/init.py
@ -1,167 +0,0 @@
 import inspect
 from enum import Enum
 from typing import Literal, get_origin
 from pydantic import BaseModel, ConfigDict, create_model
 from .base import (  # noqa: F401
    BaseModelType,
    DuplicateModelException,
    InvalidModelException,
    ModelBase,
    ModelConfigBase,
    ModelError,
    ModelNotFoundException,
    ModelType,
    ModelVariantType,
    SchedulerPredictionType,
    SilenceWarnings,
    SubModelType,
 )
 from .clip_vision import CLIPVisionModel
 from .controlnet import ControlNetModel  # TODO:
 from .ip_adapter import IPAdapterModel
 from .lora import LoRAModel
 from .sdxl import StableDiffusionXLModel
 from .stable_diffusion import StableDiffusion1Model, StableDiffusion2Model
 from .stable_diffusion_onnx import ONNXStableDiffusion1Model, ONNXStableDiffusion2Model
 from .t2i_adapter import T2IAdapterModel
 from .textual_inversion import TextualInversionModel
 from .vae import VaeModel
 # Two-level lookup table: BaseModelType -> {ModelType -> implementing model class}.
 MODEL_CLASSES = {
    BaseModelType.StableDiffusion1: {
        ModelType.ONNX: ONNXStableDiffusion1Model,
        ModelType.Main: StableDiffusion1Model,
        ModelType.Vae: VaeModel,
        ModelType.Lora: LoRAModel,
        ModelType.ControlNet: ControlNetModel,
        ModelType.TextualInversion: TextualInversionModel,
        ModelType.IPAdapter: IPAdapterModel,
        ModelType.CLIPVision: CLIPVisionModel,
        ModelType.T2IAdapter: T2IAdapterModel,
    },
    BaseModelType.StableDiffusion2: {
        ModelType.ONNX: ONNXStableDiffusion2Model,
        ModelType.Main: StableDiffusion2Model,
        ModelType.Vae: VaeModel,
        ModelType.Lora: LoRAModel,
        ModelType.ControlNet: ControlNetModel,
        ModelType.TextualInversion: TextualInversionModel,
        ModelType.IPAdapter: IPAdapterModel,
        ModelType.CLIPVision: CLIPVisionModel,
        ModelType.T2IAdapter: T2IAdapterModel,
    },
    BaseModelType.StableDiffusionXL: {
        ModelType.Main: StableDiffusionXLModel,
        ModelType.Vae: VaeModel,
        # will not work until support written
        ModelType.Lora: LoRAModel,
        ModelType.ControlNet: ControlNetModel,
        ModelType.TextualInversion: TextualInversionModel,
        ModelType.ONNX: ONNXStableDiffusion2Model,
        ModelType.IPAdapter: IPAdapterModel,
        ModelType.CLIPVision: CLIPVisionModel,
        ModelType.T2IAdapter: T2IAdapterModel,
    },
    BaseModelType.StableDiffusionXLRefiner: {
        ModelType.Main: StableDiffusionXLModel,
        ModelType.Vae: VaeModel,
        # will not work until support written
        ModelType.Lora: LoRAModel,
        ModelType.ControlNet: ControlNetModel,
        ModelType.TextualInversion: TextualInversionModel,
        ModelType.ONNX: ONNXStableDiffusion2Model,
        ModelType.IPAdapter: IPAdapterModel,
        ModelType.CLIPVision: CLIPVisionModel,
        ModelType.T2IAdapter: T2IAdapterModel,
    },
    BaseModelType.Any: {
        ModelType.CLIPVision: CLIPVisionModel,
        # The following model types are not expected to be used with BaseModelType.Any.
        ModelType.ONNX: ONNXStableDiffusion2Model,
        ModelType.Main: StableDiffusion2Model,
        ModelType.Vae: VaeModel,
        ModelType.Lora: LoRAModel,
        ModelType.ControlNet: ControlNetModel,
        ModelType.TextualInversion: TextualInversionModel,
        ModelType.IPAdapter: IPAdapterModel,
        ModelType.T2IAdapter: T2IAdapterModel,
    },
    # BaseModelType.Kandinsky2_1: {
    #    ModelType.Main: Kandinsky2_1Model,
    #    ModelType.MoVQ: MoVQModel,
    #    ModelType.Lora: LoRAModel,
    #    ModelType.ControlNet: ControlNetModel,
    #    ModelType.TextualInversion: TextualInversionModel,
    # },
 }
 # Config classes gathered from every entry of MODEL_CLASSES by the module-level loop
 # that follows; it extends this list once per (base, type) pair without de-duplicating.
 MODEL_CONFIGS = []
 # Generated pydantic wrapper models, one per distinct "<Model><Config>" name,
 # appended by the same loop.
 OPENAPI_MODEL_CONFIGS = []
 class OpenAPIModelInfoBase(BaseModel):
    """Identifying fields (name, base model, model type) used as a second base for the generated OpenAPI config models."""
    model_name: str
    base_model: BaseModelType
    model_type: ModelType
    # NOTE(review): presumably protected_namespaces is emptied so the `model_`-prefixed
    # field names do not collide with pydantic's protected namespace — confirm.
    model_config = ConfigDict(protected_namespaces=())
 # Import-time registration: collect every model class's config classes into MODEL_CONFIGS and
 # build one OpenAPI wrapper model per distinct config, published as a module global.
 # The loop variables (e.g. `model_configs`) remain defined at module level after the loop ends.
 for _base_model, models in MODEL_CLASSES.items():
    for model_type, model_class in models.items():
        # Distinct config classes declared on this model class; a None entry is dropped if present.
        model_configs = set(model_class._get_configs().values())
        model_configs.discard(None)
        MODEL_CONFIGS.extend(model_configs)
        # LS: sort to get the checkpoint configs first, which makes
        # for a better template in the Swagger docs
        for cfg in sorted(model_configs, key=lambda x: str(x)):
            # The last two qualname components are "<ModelClass>.<ConfigClass>".
            model_name, cfg_name = cfg.__qualname__.split(".")[-2:]
            openapi_cfg_name = model_name + cfg_name
            # vars() at module scope is the module namespace: skip names that already exist there
            # (a model class shared by several base types is visited more than once).
            if openapi_cfg_name in vars():
                continue
            # Wrapper inherits from both the config and OpenAPIModelInfoBase, with model_type
            # narrowed to a Literal of this model type and defaulting to it.
            api_wrapper = create_model(
                openapi_cfg_name,
                __base__=(cfg, OpenAPIModelInfoBase),
                model_type=(Literal[model_type], model_type),  # type: ignore
            )
            # Publish the generated class as a module-level name.
            vars()[openapi_cfg_name] = api_wrapper
            OPENAPI_MODEL_CONFIGS.append(api_wrapper)
 def get_model_config_enums():
    """Collect the enum classes used to annotate ``model_format`` on the registered configs.

    Walks ``MODEL_CONFIGS`` and inspects each config class's ``model_format``
    annotation, which may take one of these forms:

    * ``None`` - contributes nothing;
    * a ``str``-based ``Enum`` subclass - that class is collected;
    * ``Literal[...]`` of ``str``-based enum members - the class of the first
      member is collected.

    Returns:
        A list of enum classes in ``MODEL_CONFIGS`` order. Duplicates are not removed.

    Raises:
        Exception: if a config has no ``model_format`` annotation, or annotates
            it with an unsupported form.
    """
    enums = []
    for model_config in MODEL_CONFIGS:
        # inspect.get_annotations only exists on newer Python versions.
        if hasattr(inspect, "get_annotations"):
            fields = inspect.get_annotations(model_config)
        else:
            fields = model_config.__annotations__
        try:
            field = fields["model_format"]
        except KeyError as err:
            raise Exception("format field not found") from err
        # model_format: None
        # model_format: SomeModelFormat
        # model_format: Literal[SomeModelFormat.Diffusers]
        # model_format: Literal[SomeModelFormat.Diffusers, SomeModelFormat.Checkpoint]
        if isinstance(field, type) and issubclass(field, str) and issubclass(field, Enum):
            enums.append(field)
        elif get_origin(field) is Literal and all(
            isinstance(arg, str) and isinstance(arg, Enum) for arg in field.__args__
        ):
            enums.append(type(field.__args__[0]))
        elif field is None:
            pass
        else:
            # Name the offending config class. The previous code formatted the unrelated
            # module-level `model_configs` set here, which has no __qualname__.
            raise Exception(f"Unsupported format definition in {model_config.__qualname__}")
    return enums
--- a/invokeai/backend/model_management_OLD/models/base.py
+++ b/invokeai/backend/model_management_OLD/models/base.py
@ -1,681 +0,0 @@
 import inspect
 import json
 import os
 import sys
 import typing
 import warnings
 from abc import ABCMeta, abstractmethod
 from contextlib import suppress
 from enum import Enum
 from pathlib import Path
 from typing import Any, Callable, Dict, Generic, List, Literal, Optional, Type, TypeVar, Union
 import numpy as np
 import onnx
 import safetensors.torch
 import torch
 from diffusers import ConfigMixin, DiffusionPipeline
 from diffusers import logging as diffusers_logging
 from onnx import numpy_helper
 from onnxruntime import InferenceSession, SessionOptions, get_available_providers
 from picklescan.scanner import scan_file_path
 from pydantic import BaseModel, ConfigDict, Field
 from transformers import logging as transformers_logging
 class DuplicateModelException(Exception):
    """Exception type for duplicate-model errors; adds nothing to ``Exception``."""
 class InvalidModelException(Exception):
    """Exception type for invalid-model errors; adds nothing to ``Exception``."""
 class ModelNotFoundException(Exception):
    """Exception type for model-not-found errors; adds nothing to ``Exception``."""
 class BaseModelType(str, Enum):
    """String-valued enum identifying a model's base model (e.g. ``sd-1``, ``sdxl``)."""
    Any = "any"  # For models that are not associated with any particular base model.
    StableDiffusion1 = "sd-1"
    StableDiffusion2 = "sd-2"
    StableDiffusionXL = "sdxl"
    StableDiffusionXLRefiner = "sdxl-refiner"
    # Kandinsky2_1 = "kandinsky-2.1"
 class ModelType(str, Enum):
    """String-valued enum of model kinds."""
    ONNX = "onnx"
    Main = "main"
    Vae = "vae"
    Lora = "lora"
    ControlNet = "controlnet"  # used by model_probe
    # Note: the member is named TextualInversion but its string value is "embedding".
    TextualInversion = "embedding"
    IPAdapter = "ip_adapter"
    CLIPVision = "clip_vision"
    T2IAdapter = "t2i_adapter"
 class SubModelType(str, Enum):
    """String-valued enum naming the sub-models (child components) of a model.

    ``DiffusersModel.get_model`` passes the member's value as the ``subfolder`` to load from.
    """
    UNet = "unet"
    TextEncoder = "text_encoder"
    TextEncoder2 = "text_encoder_2"
    Tokenizer = "tokenizer"
    Tokenizer2 = "tokenizer_2"
    Vae = "vae"
    VaeDecoder = "vae_decoder"
    VaeEncoder = "vae_encoder"
    Scheduler = "scheduler"
    SafetyChecker = "safety_checker"
    # MoVQ = "movq"
 class ModelVariantType(str, Enum):
    """String-valued enum of model variants (normal, inpaint, depth)."""
    Normal = "normal"
    Inpaint = "inpaint"
    Depth = "depth"
 class SchedulerPredictionType(str, Enum):
    """String-valued enum of scheduler prediction types."""
    Epsilon = "epsilon"
    VPrediction = "v_prediction"
    Sample = "sample"
 class ModelError(str, Enum):
    """String-valued error codes; used as the type of ``ModelConfigBase.error``."""
    NotFound = "not_found"
 def model_config_json_schema_extra(schema: dict[str, Any]) -> None:
    """Append ``"model_type"`` to the schema's ``"required"`` list, creating the list if absent.

    The schema dict is modified in place.
    """
    required = schema.setdefault("required", [])
    required.append("model_type")
 class ModelConfigBase(BaseModel):
    """Pydantic base for per-format model configs: a path plus optional description, format and error code."""
    path: str  # or Path
    description: Optional[str] = Field(None)
    model_format: Optional[str] = Field(None)
    error: Optional[ModelError] = Field(None)
    # json_schema_extra hook adds "model_type" to the generated schema's "required" list.
    model_config = ConfigDict(
        use_enum_values=True, protected_namespaces=(), json_schema_extra=model_config_json_schema_extra
    )
 class EmptyConfigLoader(ConfigMixin):
    """``ConfigMixin`` subclass whose config file name is supplied on each ``load_config`` call."""

    @classmethod
    def load_config(cls, *args, **kwargs):
        """Store the required ``config_name`` keyword on the class, then defer to the parent ``load_config``.

        Raises:
            KeyError: if ``config_name`` is not passed as a keyword argument.
        """
        name = kwargs.pop("config_name")
        cls.config_name = name
        return super().load_config(*args, **kwargs)
 T_co = TypeVar("T_co", covariant=True)


 class classproperty(Generic[T_co]):
    """Descriptor that computes its value by calling the wrapped getter with the owner class.

    Works for access through the class or through an instance; assignment
    through an instance raises ``AttributeError``.
    """

    def __init__(self, fget: Callable[[Any], T_co]) -> None:
        self.fget = fget

    def __get__(self, instance: Optional[Any], owner: Type[Any]) -> T_co:
        # The instance is ignored: the getter always receives the class.
        getter = self.fget
        return getter(owner)

    def __set__(self, instance: Optional[Any], value: Any) -> None:
        raise AttributeError("cannot set attribute")
 class ModelBase(metaclass=ABCMeta):
    """Abstract base for a model located at ``model_path``.

    Subclasses declare nested ``ModelConfigBase`` subclasses (discovered by
    ``_get_configs`` through their ``model_format`` annotation) and implement
    ``detect_format``, ``save_to_config``, ``get_size`` and ``get_model``.
    """

    # model_path: str
    # base_model: BaseModelType
    # model_type: ModelType

    def __init__(
        self,
        model_path: str,
        base_model: BaseModelType,
        model_type: ModelType,
    ):
        self.model_path = model_path
        self.base_model = base_model
        self.model_type = model_type

    def _hf_definition_to_type(self, subtypes: List[str]) -> Optional[Type]:
        """Resolve a ``[module, name, ...]`` definition to the attribute it names.

        If the first entry is ``"diffusers"`` or ``"transformers"``, the remaining
        entries are resolved as attributes of that already-imported module.
        Otherwise all entries are resolved starting from ``diffusers.pipelines``.

        Returns:
            The resolved object, or ``None`` when every entry is ``None``.

        Raises:
            Exception: if fewer than two entries are given, or only some are ``None``.
            KeyError: if the named module is not present in ``sys.modules``.
            AttributeError: if an attribute along the path does not exist.
        """
        if len(subtypes) < 2:
            raise Exception("Invalid subfolder definition!")
        if all(t is None for t in subtypes):
            return None
        elif any(t is None for t in subtypes):
            raise Exception(f"Unsupported definition: {subtypes}")
        if subtypes[0] in ["diffusers", "transformers"]:
            res_type = sys.modules[subtypes[0]]
            subtypes = subtypes[1:]
        else:
            res_type = sys.modules["diffusers"]
            res_type = res_type.pipelines
        for subtype in subtypes:
            res_type = getattr(res_type, subtype)
        return res_type

    @classmethod
    def _get_configs(cls):
        """Return (and cache per class) the mapping ``model_format value -> config class``.

        Every public-ish attribute of ``cls`` that is a ``ModelConfigBase`` subclass
        is inspected; its ``model_format`` annotation must be ``None``, a ``str``-based
        ``Enum`` class, or a ``Literal`` of ``str``-based enum members.

        Raises:
            Exception: if a config class lacks a ``model_format`` annotation or
                uses an unsupported annotation form.
        """
        # `cls.__configs` is name-mangled to `_ModelBase__configs`. Look only in this class's
        # own namespace: a plain attribute read walks the MRO, so a subclass of an
        # already-cached model class would be handed its parent's mapping.
        cached = vars(cls).get("_ModelBase__configs")
        if cached is not None:
            return cached
        configs = {}
        for name in dir(cls):
            if name.startswith("__"):
                continue
            value = getattr(cls, name)
            if not isinstance(value, type) or not issubclass(value, ModelConfigBase):
                continue
            # inspect.get_annotations only exists on newer Python versions.
            if hasattr(inspect, "get_annotations"):
                fields = inspect.get_annotations(value)
            else:
                fields = value.__annotations__
            try:
                field = fields["model_format"]
            except KeyError as err:
                raise Exception(
                    f"Invalid config definition - format field not found({cls.__qualname__})"
                ) from err
            if isinstance(field, type) and issubclass(field, str) and issubclass(field, Enum):
                # Whole enum: the config handles every format in it.
                for model_format in field:
                    configs[model_format.value] = value
            elif typing.get_origin(field) is Literal and all(
                isinstance(arg, str) and isinstance(arg, Enum) for arg in field.__args__
            ):
                # Literal[...]: the config handles only the listed formats.
                for model_format in field.__args__:
                    configs[model_format.value] = value
            elif field is None:
                configs[None] = value
            else:
                raise Exception(f"Unsupported format definition in {cls.__qualname__}")
        cls.__configs = configs  # stored on `cls` itself as `_ModelBase__configs`
        return configs

    @classmethod
    def create_config(cls, **kwargs) -> ModelConfigBase:
        """Instantiate the config class registered for ``kwargs["model_format"]``.

        Raises:
            Exception: if ``model_format`` is not supplied.
            KeyError: if no config class is registered for that format.
        """
        if "model_format" not in kwargs:
            raise Exception("Field 'model_format' not found in model config")
        configs = cls._get_configs()
        return configs[kwargs["model_format"]](**kwargs)

    @classmethod
    def probe_config(cls, path: str, **kwargs) -> ModelConfigBase:
        """Build a config for ``path`` using the format reported by ``detect_format``.

        Extra keyword arguments are accepted but not used here.
        """
        return cls.create_config(
            path=path,
            model_format=cls.detect_format(path),
        )

    @classmethod
    @abstractmethod
    def detect_format(cls, path: str) -> str:
        """Return the model format found at ``path`` (implemented by subclasses)."""
        raise NotImplementedError()

    @classproperty
    @abstractmethod
    def save_to_config(cls) -> bool:
        """Class-level boolean flag (implemented by subclasses)."""
        raise NotImplementedError()

    @abstractmethod
    def get_size(self, child_type: Optional[SubModelType] = None) -> int:
        """Return the size of the model, or of one sub-model when ``child_type`` is given."""
        raise NotImplementedError()

    @abstractmethod
    def get_model(
        self,
        torch_dtype: Optional[torch.dtype],
        child_type: Optional[SubModelType] = None,
    ) -> Any:
        """Load and return the model, or the sub-model selected by ``child_type``."""
        raise NotImplementedError()
 class DiffusersModel(ModelBase):
    """Model stored in a diffusers folder layout, exposing its list-valued config entries as child models."""

    # child_types: Dict[str, Type]
    # child_sizes: Dict[str, int]

    def __init__(self, model_path: str, base_model: BaseModelType, model_type: ModelType):
        """Read the pipeline config and record a type and an on-disk size for each child component.

        Raises:
            Exception: if the pipeline config cannot be loaded.
        """
        super().__init__(model_path, base_model, model_type)
        self.child_types: Dict[str, Type] = {}
        self.child_sizes: Dict[str, int] = {}
        try:
            config_data = DiffusionPipeline.load_config(self.model_path)
            # config_data = json.loads(os.path.join(self.model_path, "model_index.json"))
        except Exception:
            raise Exception("Invalid diffusers model! (model_index.json not found or invalid)")
        config_data.pop("_ignore_files", None)
        # retrieve all folder_names that contain relevant files
        for child_name, definition in config_data.items():
            if not isinstance(definition, list):
                continue
            self.child_types[child_name] = self._hf_definition_to_type(definition)
            self.child_sizes[child_name] = calc_model_size_by_fs(self.model_path, subfolder=child_name)

    def get_size(self, child_type: Optional[SubModelType] = None):
        """Return one child's recorded size, or the sum over all children when ``child_type`` is None."""
        if child_type is not None:
            return self.child_sizes[child_type]
        return sum(self.child_sizes.values())

    def get_model(
        self,
        torch_dtype: Optional[torch.dtype],
        child_type: Optional[SubModelType] = None,
    ):
        """Load the requested child model from its subfolder, trying both weight variants.

        The ``fp16`` variant is tried first when ``torch_dtype`` is ``torch.float16``,
        otherwise the default variant is tried first. On success the child's recorded
        size is replaced by one computed from the loaded model.

        Returns:
            The loaded model, or ``None`` if ``child_type`` is not a known child.

        Raises:
            Exception: if ``child_type`` is None or neither variant could be loaded.
        """
        # return pipeline in different function to pass more arguments
        if child_type is None:
            raise Exception("Child model type can't be null on diffusers model")
        if child_type not in self.child_types:
            return None  # TODO: or raise
        prefer_fp16 = torch_dtype == torch.float16
        variants = ["fp16", None] if prefer_fp16 else [None, "fp16"]
        # TODO: better error handling(differentiate not found from others)
        model = None
        loaded = False
        for variant in variants:
            try:
                # TODO: set cache_dir to /dev/null to be sure that cache not used?
                model = self.child_types[child_type].from_pretrained(
                    self.model_path,
                    subfolder=child_type.value,
                    torch_dtype=torch_dtype,
                    variant=variant,
                    local_files_only=True,
                )
            except Exception as err:
                # Errors whose text starts with "Error no file" are skipped silently;
                # anything else is printed before the next variant is tried.
                if not str(err).startswith("Error no file"):
                    print("====ERR LOAD====")
                    print(f"{variant}: {err}")
                continue
            loaded = True
            break
        if not loaded:
            raise Exception(f"Failed to load {self.base_model}:{self.model_type}:{child_type} model")
        # calc more accurate size
        self.child_sizes[child_type] = calc_model_size_by_data(model)
        return model
    # def convert_if_required(model_path: str, cache_path: str, config: Optional[dict]) -> str:
 def calc_model_size_by_fs(model_path: str, subfolder: Optional[str] = None, variant: Optional[str] = None):
    """Estimate a model's size in bytes from the files in its directory.

    Args:
        model_path: Directory holding the model files.
        subfolder: Optional sub-directory of ``model_path`` to inspect instead.
        variant: ``None`` for files without a variant marker, or ``"fp16"`` / ``"8bit"``
            for files whose names contain ``.fp16.``/``.fp16-`` or ``.8bit.``/``.8bit-``.

    Returns:
        ``metadata.total_size`` from a readable index file if one is present; otherwise
        the summed size of the files of the first weight format found; ``0`` if the
        directory does not exist or holds no weight files.

    Raises:
        NotImplementedError: for an unknown ``variant`` (only when the directory exists).
    """
    root = model_path if subfolder is None else os.path.join(model_path, subfolder)
    # this can happen when, for example, the safety checker
    # is not downloaded.
    if not os.path.exists(root):
        return 0

    plain_files, fp16_files, bit8_files = set(), set(), set()
    for entry in os.listdir(root):
        if not os.path.isfile(os.path.join(root, entry)):
            continue
        is_fp16 = ".fp16." in entry or ".fp16-" in entry
        is_8bit = ".8bit." in entry or ".8bit-" in entry
        if is_fp16:
            fp16_files.add(entry)
        if is_8bit:
            bit8_files.add(entry)
        if not (is_fp16 or is_8bit):
            plain_files.add(entry)

    if variant is None:
        candidates = plain_files
    elif variant == "fp16":
        candidates = fp16_files
    elif variant == "8bit":
        candidates = bit8_files
    else:
        raise NotImplementedError(f"Unknown variant: {variant}")

    # try read from index if exists
    index_suffix = ".index.json" if variant is None else f".index.{variant}.json"
    for name in candidates:
        if name.endswith(index_suffix):
            try:
                with open(os.path.join(root, name), "r") as fh:
                    index = json.load(fh)
                return int(index["metadata"]["total_size"])
            except Exception:
                # Best effort: an unreadable index just means we fall through to file sizes.
                pass

    # calculate files size if there is no index file
    weight_suffixes = (
        (".safetensors",),  # safetensors
        (".bin",),  # torch
        (".onnx", ".pb"),  # onnx
        (".msgpack",),  # flax
        (".ckpt",),  # tf
        (".h5",),  # tf2
    )
    for suffixes in weight_suffixes:
        matches = [name for name in candidates if name.endswith(suffixes)]
        if matches:
            # Only the first format that has any files is counted.
            return sum(os.stat(os.path.join(root, name)).st_size for name in matches)

    # raise NotImplementedError(f"Unknown model structure! Files: {all_files}")
    return 0  # scheduler/feature_extractor/tokenizer - models without loading to gpu
 def calc_model_size_by_data(model) -> int:
    """Return the in-memory size of a loaded model, dispatching on its type.

    Checks, in order, for a ``DiffusionPipeline``, a ``torch.nn.Module`` and an
    ``IAIOnnxRuntimeModel``; any other object yields ``0``.
    """
    if isinstance(model, DiffusionPipeline):
        return _calc_pipeline_by_data(model)
    if isinstance(model, torch.nn.Module):
        return _calc_model_by_data(model)
    if isinstance(model, IAIOnnxRuntimeModel):
        return _calc_onnx_model_by_data(model)
    return 0
 def _calc_pipeline_by_data(pipeline) -> int:
    """Sum the sizes of every pipeline component that is a ``torch.nn.Module``.

    Components are looked up as attributes of ``pipeline`` named by the keys of
    ``pipeline.components``; non-module components (including ``None``) are ignored.
    """
    parts = (getattr(pipeline, key) for key in pipeline.components.keys())
    return sum(_calc_model_by_data(part) for part in parts if isinstance(part, torch.nn.Module))
 def _calc_model_by_data(model) -> int:
    """Return the number of bytes occupied by the model's parameters and buffers."""
    param_bytes = sum(p.nelement() * p.element_size() for p in model.parameters())
    buffer_bytes = sum(b.nelement() * b.element_size() for b in model.buffers())
    return param_bytes + buffer_bytes  # in bytes
 def _calc_onnx_model_by_data(model) -> int:
    """Return twice ``model.tensors.size()`` as the model's size in bytes."""
    # The session doubles this
    return model.tensors.size() * 2  # in bytes
 def _fast_safetensors_reader(path: str):
    """Read only the header of a safetensors file and return shape/dtype placeholders.

    The file starts with an 8-byte little-endian header length followed by a JSON
    header that maps tensor names to ``{"dtype": ..., "shape": ...}`` entries.
    No tensor data is read: each entry becomes an empty tensor on the ``meta`` device.

    Args:
        path: Path to the ``.safetensors`` file.

    Returns:
        dict mapping tensor name to a ``meta``-device tensor of the declared shape and dtype.

    Raises:
        Exception: if the header metadata declares a non-PyTorch ``format``.
        KeyError: if a tensor uses a dtype tag that is not in the table below.
    """
    # Built once rather than per tensor. BF16, U8 and BOOL are included so such
    # checkpoints are handled here instead of failing with KeyError.
    dtype_by_tag = {
        "BOOL": torch.bool,
        "U8": torch.uint8,
        "I8": torch.int8,
        "I16": torch.int16,
        "I32": torch.int32,
        "I64": torch.int64,
        "F16": torch.float16,
        "BF16": torch.bfloat16,
        "F32": torch.float32,
        "F64": torch.float64,
    }
    checkpoint = {}
    device = torch.device("meta")
    with open(path, "rb") as f:
        definition_len = int.from_bytes(f.read(8), "little")
        definition_json = f.read(definition_len)
    definition = json.loads(definition_json)
    if "__metadata__" in definition and definition["__metadata__"].get("format", "pt") not in {
        "pt",
        "torch",
        "pytorch",
    }:
        raise Exception("Supported only pytorch safetensors files")
    # The metadata entry is not a tensor; drop it before iterating.
    definition.pop("__metadata__", None)
    for key, info in definition.items():
        dtype = dtype_by_tag[info["dtype"]]
        checkpoint[key] = torch.empty(info["shape"], dtype=dtype, device=device)
    return checkpoint
 def read_checkpoint_meta(path: Union[str, Path], scan: bool = False):
    """Load a checkpoint's tensor metadata without materializing its weights where possible.

    ``.safetensors`` files go through the header-only reader, falling back to a full
    CPU load if that fails. Other files are loaded with ``torch.load`` onto the
    ``meta`` device, optionally after a picklescan check.

    Args:
        path: Checkpoint file path.
        scan: When true, scan non-safetensors files before loading them.

    Raises:
        Exception: if the scan reports any infected files.
    """
    if str(path).endswith(".safetensors"):
        try:
            return _fast_safetensors_reader(path)
        except Exception:
            # TODO: create issue for support "meta"?
            return safetensors.torch.load_file(path, device="cpu")

    if scan:
        report = scan_file_path(path)
        if report.infected_files != 0:
            raise Exception(f'The model file "{path}" is potentially infected by malware. Aborting import.')
    # NOTE(review): torch.load unpickles the file; with scan=False (the default) nothing
    # is checked first — confirm callers only pass trusted files.
    return torch.load(path, map_location=torch.device("meta"))
 class SilenceWarnings(object):
    """Context manager that mutes transformers/diffusers logging and Python warnings.

    On entry both libraries are set to error-only verbosity and all warnings are
    ignored. On exit the verbosities captured at construction time are restored and
    the warning filters are put back to what they were on entry (previously they
    were forced to ``"default"``, discarding any filters the application had set).
    """

    def __init__(self):
        # Verbosity levels are captured when the object is created, not on entry.
        self.transformers_verbosity = transformers_logging.get_verbosity()
        self.diffusers_verbosity = diffusers_logging.get_verbosity()
        # Stack of active warnings.catch_warnings() scopes, so nested use of one instance unwinds correctly.
        self._warning_scopes = []

    def __enter__(self):
        transformers_logging.set_verbosity_error()
        diffusers_logging.set_verbosity_error()
        # catch_warnings snapshots the current filter list so __exit__ can restore it exactly.
        scope = warnings.catch_warnings()
        scope.__enter__()
        self._warning_scopes.append(scope)
        warnings.simplefilter("ignore")

    def __exit__(self, type, value, traceback):
        transformers_logging.set_verbosity(self.transformers_verbosity)
        diffusers_logging.set_verbosity(self.diffusers_verbosity)
        if self._warning_scopes:
            self._warning_scopes.pop().__exit__(type, value, traceback)
 ONNX_WEIGHTS_NAME = "model.onnx"


 class IAIOnnxRuntimeModel:
    """ONNX model held as a protobuf, with an onnxruntime session created on demand.

    ``nodes`` and ``tensors`` give name-keyed access to the graph's nodes and
    initializers. ``create_session`` must be called before the instance is invoked.
    """

    class _tensor_access:
        """Name-keyed access to ``model.proto.graph.initializer`` as numpy arrays."""

        def __init__(self, model):
            self.model = model
            # initializer name -> position in the initializer list
            self.indexes = {}
            for idx, obj in enumerate(self.model.proto.graph.initializer):
                self.indexes[obj.name] = idx

        def __getitem__(self, key: str):
            value = self.model.proto.graph.initializer[self.indexes[key]]
            return numpy_helper.to_array(value)

        def __setitem__(self, key: str, value: np.ndarray):
            new_node = numpy_helper.from_array(value)
            new_node.name = key
            # Delete then re-insert at the same position so `indexes` stays valid.
            del self.model.proto.graph.initializer[self.indexes[key]]
            self.model.proto.graph.initializer.insert(self.indexes[key], new_node)

        # __delitem__

        def __contains__(self, key: str):
            # Membership is by initializer name. The previous implementation indexed
            # `indexes[key]` (KeyError for unknown names) and then tested that integer
            # against the list of protos, so it never reported a match.
            return key in self.indexes

        def items(self):
            raise NotImplementedError("tensor.items")

        def keys(self):
            return self.indexes.keys()

        def values(self):
            raise NotImplementedError("tensor.values")

        def size(self):
            """Return the summed ``sys.getsizeof`` of every initializer's ``raw_data``."""
            return sum(sys.getsizeof(node.raw_data) for node in self.model.proto.graph.initializer)

    class _access_helper:
        """Name-keyed access to a repeated protobuf field whose items have a ``name``."""

        def __init__(self, raw_proto):
            self.indexes = {}
            self.raw_proto = raw_proto
            for idx, obj in enumerate(raw_proto):
                self.indexes[obj.name] = idx

        def __getitem__(self, key: str):
            return self.raw_proto[self.indexes[key]]

        def __setitem__(self, key: str, value):
            # Replace in place, keeping the item's position.
            index = self.indexes[key]
            del self.raw_proto[index]
            self.raw_proto.insert(index, value)

        # __delitem__

        def __contains__(self, key: str):
            return key in self.indexes

        def items(self):
            return [(obj.name, obj) for obj in self.raw_proto]

        def keys(self):
            return self.indexes.keys()

        def values(self):
            return list(self.raw_proto)

    def __init__(self, model_path: str, provider: Optional[str]):
        """Load the ONNX protobuf (including external data) from ``model_path``.

        Args:
            model_path: Path to the ``.onnx`` file.
            provider: Execution provider name to use for sessions, or ``None`` to
                use every available provider.
        """
        self.path = model_path
        self.session = None
        # Dimensions the current session was built for; set by create_session.
        self.session_height = None
        self.session_width = None
        self.provider = provider
        self.proto = onnx.load(model_path, load_external_data=True)
        self.nodes = self._access_helper(self.proto.graph.node)
        self.tensors = self._tensor_access(self)

    # TODO: integrate with model manager/cache
    def create_session(self, height=None, width=None):
        """Create the inference session unless one already exists for the same height/width.

        When both ``height`` and ``width`` are truthy, the UNet's named free
        dimensions are pinned to fixed values before the session is built.
        ``TensorrtExecutionProvider`` is always removed from the provider list.
        """
        if self.session is None or self.session_width != width or self.session_height != height:
            # TODO: something to be able to get weight when they already moved outside of model proto
            sess = SessionOptions()
            self.session_height = height
            self.session_width = width
            if height and width:
                sess.add_free_dimension_override_by_name("unet_sample_batch", 2)
                sess.add_free_dimension_override_by_name("unet_sample_channels", 4)
                sess.add_free_dimension_override_by_name("unet_hidden_batch", 2)
                sess.add_free_dimension_override_by_name("unet_hidden_sequence", 77)
                sess.add_free_dimension_override_by_name("unet_sample_height", self.session_height)
                sess.add_free_dimension_override_by_name("unet_sample_width", self.session_width)
                sess.add_free_dimension_override_by_name("unet_time_batch", 1)
            providers = []
            if self.provider:
                providers.append(self.provider)
            else:
                providers = get_available_providers()
            if "TensorrtExecutionProvider" in providers:
                providers.remove("TensorrtExecutionProvider")
            # The session is built from the in-memory proto, so tensor edits made through
            # `self.tensors` before this call are included.
            self.session = InferenceSession(self.proto.SerializeToString(), providers=providers, sess_options=sess)

    def release_session(self):
        """Drop the session reference and run a garbage collection pass."""
        self.session = None
        import gc

        gc.collect()

    def __call__(self, **kwargs):
        """Run the session with each keyword argument converted to a numpy array.

        Raises:
            Exception: if ``create_session`` has not been called.
        """
        if self.session is None:
            raise Exception("You should call create_session before running model")
        inputs = {k: np.array(v) for k, v in kwargs.items()}
        return self.session.run(None, inputs)

    # compatibility with diffusers load code
    @classmethod
    def from_pretrained(
        cls,
        model_id: Union[str, Path],
        subfolder: Optional[Union[str, Path]] = None,
        file_name: Optional[str] = None,
        provider: Optional[str] = None,
        sess_options: Optional["SessionOptions"] = None,
        **kwargs,
    ):
        """Build an instance from a model directory or a direct file path.

        If ``model_id`` is a directory, the file ``[subfolder/]file_name`` inside it
        is used (``file_name`` defaults to ``ONNX_WEIGHTS_NAME``); otherwise
        ``model_id`` itself is taken as the file path. ``sess_options`` and extra
        keyword arguments are accepted but not used.

        Raises:
            Exception: if the resolved path is not an existing file.
        """
        file_name = file_name or ONNX_WEIGHTS_NAME
        if os.path.isdir(model_id):
            model_path = model_id
            if subfolder is not None:
                model_path = os.path.join(model_path, subfolder)
            model_path = os.path.join(model_path, file_name)
        else:
            model_path = model_id
        # load model from local directory
        if not os.path.isfile(model_path):
            raise Exception(f"Model not found: {model_path}")
        # TODO: session options
        return cls(model_path, provider=provider)
--- a/invokeai/backend/model_management_OLD/models/clip_vision.py
+++ b/invokeai/backend/model_management_OLD/models/clip_vision.py
@ -1,82 +0,0 @@
 import os
 from enum import Enum
 from typing import Literal, Optional
 import torch
 from transformers import CLIPVisionModelWithProjection
 from invokeai.backend.model_management.models.base import (
    BaseModelType,
    InvalidModelException,
    ModelBase,
    ModelConfigBase,
    ModelType,
    SubModelType,
    calc_model_size_by_data,
    calc_model_size_by_fs,
    classproperty,
 )
 class CLIPVisionModelFormat(str, Enum):
    """String-valued enum of the storage formats accepted for CLIP Vision models (diffusers only)."""
    Diffusers = "diffusers"
 class CLIPVisionModel(ModelBase):
    """CLIP Vision model stored as a directory containing ``config.json``; it has no child models."""

    class DiffusersConfig(ModelConfigBase):
        model_format: Literal[CLIPVisionModelFormat.Diffusers]

    def __init__(self, model_path: str, base_model: BaseModelType, model_type: ModelType):
        assert model_type == ModelType.CLIPVision
        super().__init__(model_path, base_model, model_type)
        # Initial estimate from the files on disk; refined once the model is loaded.
        self.model_size = calc_model_size_by_fs(self.model_path)

    @classmethod
    def detect_format(cls, path: str) -> str:
        """Return ``CLIPVisionModelFormat.Diffusers`` for a directory that contains ``config.json``.

        Raises:
            ModuleNotFoundError: if ``path`` does not exist.
            InvalidModelException: if ``path`` exists but is not such a directory.
        """
        # NOTE(review): ModuleNotFoundError is an import error type; a model-not-found
        # exception may have been intended here — confirm before changing what callers catch.
        if not os.path.exists(path):
            raise ModuleNotFoundError(f"No CLIP Vision model at path '{path}'.")
        has_config = os.path.isdir(path) and os.path.exists(os.path.join(path, "config.json"))
        if not has_config:
            raise InvalidModelException(f"Unexpected CLIP Vision model format: {path}")
        return CLIPVisionModelFormat.Diffusers

    @classproperty
    def save_to_config(cls) -> bool:
        return True

    def get_size(self, child_type: Optional[SubModelType] = None) -> int:
        """Return the recorded model size; ``child_type`` must be None."""
        if child_type is None:
            return self.model_size
        raise ValueError("There are no child models in a CLIP Vision model.")

    def get_model(
        self,
        torch_dtype: Optional[torch.dtype],
        child_type: Optional[SubModelType] = None,
    ) -> CLIPVisionModelWithProjection:
        """Load the model from ``model_path`` and update ``model_size`` from the loaded weights.

        Raises:
            ValueError: if ``child_type`` is given.
        """
        if child_type is not None:
            raise ValueError("There are no child models in a CLIP Vision model.")
        loaded = CLIPVisionModelWithProjection.from_pretrained(self.model_path, torch_dtype=torch_dtype)
        # Calculate a more accurate model size.
        self.model_size = calc_model_size_by_data(loaded)
        return loaded

    @classmethod
    def convert_if_required(
        cls,
        model_path: str,
        output_path: str,
        config: ModelConfigBase,
        base_model: BaseModelType,
    ) -> str:
        """Return ``model_path`` unchanged when it is in diffusers format; no conversion is performed.

        Raises:
            ValueError: if the detected format is anything else.
        """
        detected = cls.detect_format(model_path)
        if detected != CLIPVisionModelFormat.Diffusers:
            raise ValueError(f"Unsupported format: '{detected}'.")
        return model_path
--- a/invokeai/backend/model_management_OLD/models/controlnet.py
+++ b/invokeai/backend/model_management_OLD/models/controlnet.py
@ -1,162 +0,0 @@
 import os
 from enum import Enum
 from pathlib import Path
 from typing import Literal, Optional
 import torch
 import invokeai.backend.util.logging as logger
 from invokeai.app.services.config import InvokeAIAppConfig
 from .base import (
    BaseModelType,
    EmptyConfigLoader,
    InvalidModelException,
    ModelBase,
    ModelConfigBase,
    ModelNotFoundException,
    ModelType,
    SubModelType,
    calc_model_size_by_data,
    calc_model_size_by_fs,
    classproperty,
 )
 class ControlNetModelFormat(str, Enum):
    # Formats reported by `ControlNetModel.detect_format`. Members are also `str` instances.
    # A single file ending in .safetensors / .ckpt / .pt / .pth.
    Checkpoint = "checkpoint"
    # A directory that contains a `config.json`.
    Diffusers = "diffusers"
 class ControlNetModel(ModelBase):
    """Legacy model-manager wrapper around a ControlNet stored in diffusers layout.

    Construction reads `config.json` from the model path, checks that its `_class_name` is
    `ControlNetModel`, and resolves the diffusers class used later by `get_model()`.
    """

    # model_class: Type
    # model_size: int

    # Config schema for a model stored as a diffusers directory.
    class DiffusersConfig(ModelConfigBase):
        model_format: Literal[ControlNetModelFormat.Diffusers]

    # Config schema for a single-file checkpoint. `config` is later joined onto the application
    # root path and handed to the converter as its `original_config_file`.
    class CheckpointConfig(ModelConfigBase):
        model_format: Literal[ControlNetModelFormat.Checkpoint]
        config: str

    def __init__(self, model_path: str, base_model: BaseModelType, model_type: ModelType):
        """Validate the model at `model_path` and record its class and initial size.

        Raises:
            Exception: If `config.json` cannot be loaded, names an unexpected `_class_name`, or the
                model class / size cannot be determined. The underlying error is attached as the
                cause.
        """
        assert model_type == ModelType.ControlNet
        super().__init__(model_path, base_model, model_type)

        try:
            config = EmptyConfigLoader.load_config(self.model_path, config_name="config.json")
        except Exception as err:
            # Chain explicitly so the real reason (missing file, bad JSON, ...) stays visible.
            raise Exception("Invalid controlnet model! (config.json not found or invalid)") from err

        model_class_name = config.get("_class_name", None)
        if model_class_name not in {"ControlNetModel"}:
            raise Exception(f"Invalid ControlNet model! Unknown _class_name: {model_class_name}")

        try:
            self.model_class = self._hf_definition_to_type(["diffusers", model_class_name])
            self.model_size = calc_model_size_by_fs(self.model_path)
        except Exception as err:
            raise Exception("Invalid ControlNet model!") from err

    def get_size(self, child_type: Optional[SubModelType] = None):
        """Return the currently recorded model size.

        Raises:
            Exception: If a `child_type` is given; a ControlNet has no submodels.
        """
        if child_type is not None:
            raise Exception("There is no child models in controlnet model")
        return self.model_size

    def get_model(
        self,
        torch_dtype: Optional[torch.dtype],
        child_type: Optional[SubModelType] = None,
    ):
        """Load and return the ControlNet, trying the "fp16" variant before the default one.

        As a side effect, `self.model_size` is replaced with a size computed from the loaded model.

        Raises:
            Exception: If `child_type` is not None.
            ModelNotFoundException: If neither variant could be loaded; the error from the last
                attempt is attached as the cause.
        """
        if child_type is not None:
            raise Exception("There are no child models in controlnet model")

        model = None
        last_error: Optional[Exception] = None
        for variant in ["fp16", None]:
            try:
                model = self.model_class.from_pretrained(
                    self.model_path,
                    torch_dtype=torch_dtype,
                    variant=variant,
                )
                break
            except Exception as err:
                # Best effort: a failure here just means "try the next variant", but keep the
                # error so the final exception can explain why loading failed.
                last_error = err

        # Identity check: only "nothing was loaded" should count as failure.
        if model is None:
            raise ModelNotFoundException() from last_error

        # calc more accurate size
        self.model_size = calc_model_size_by_data(model)
        return model

    @classproperty
    def save_to_config(cls) -> bool:
        """Class-level flag; always False for ControlNet models."""
        return False

    @classmethod
    def detect_format(cls, path: str):
        """Classify `path` as a diffusers directory or a single-file checkpoint.

        Raises:
            ModelNotFoundException: If `path` does not exist.
            InvalidModelException: If `path` matches neither layout.
        """
        if not os.path.exists(path):
            raise ModelNotFoundException()

        if os.path.isdir(path):
            if os.path.exists(os.path.join(path, "config.json")):
                return ControlNetModelFormat.Diffusers

        if os.path.isfile(path):
            if any(path.endswith(f".{ext}") for ext in ["safetensors", "ckpt", "pt", "pth"]):
                return ControlNetModelFormat.Checkpoint

        raise InvalidModelException(f"Not a valid model: {path}")

    @classmethod
    def convert_if_required(
        cls,
        model_path: str,
        output_path: str,
        config: ModelConfigBase,
        base_model: BaseModelType,
    ) -> str:
        """Return a diffusers-format location for the model, converting checkpoints on demand.

        Checkpoint files are converted (or fetched from the conversion cache) using
        `config.config`; anything else is returned as `model_path` unchanged.
        """
        if cls.detect_format(model_path) == ControlNetModelFormat.Checkpoint:
            return _convert_controlnet_ckpt_and_cache(
                model_path=model_path,
                model_config=config.config,
                output_path=output_path,
                base_model=base_model,
            )
        else:
            return model_path
 def _convert_controlnet_ckpt_and_cache(
    model_path: str,
    output_path: str,
    base_model: BaseModelType,
    model_config: str,
 ) -> str:
    """
    Convert a ControlNet checkpoint to diffusers format, caching the result on disk.

    `model_path` and `model_config` are joined onto the application root path. If `output_path`
    already exists the conversion is skipped and that location is returned as-is. `base_model`
    is accepted but not used here.

    NOTE(review): the return annotation says `str`, but a `Path` object is what is returned.
    NOTE(review): the "Converting ..." message is logged even when the cached copy is reused.
    """
    app_config = InvokeAIAppConfig.get_config()
    checkpoint_file = app_config.root_path / model_path
    destination = Path(output_path)

    logger.info(f"Converting {checkpoint_file} to diffusers format")

    # Only run the conversion when there is no cached result yet.
    if not destination.exists():
        # imported here to avoid circular import errors
        from ..convert_ckpt_to_diffusers import convert_controlnet_to_diffusers

        convert_controlnet_to_diffusers(
            checkpoint_file,
            destination,
            original_config_file=app_config.root_path / model_config,
            image_size=512,
            scan_needed=True,
            from_safetensors=checkpoint_file.suffix == ".safetensors",
        )

    return destination
--- a/invokeai/backend/model_management_OLD/models/ip_adapter.py
+++ b/invokeai/backend/model_management_OLD/models/ip_adapter.py
@ -1,98 +0,0 @@
 import os
 import typing
 from enum import Enum
 from typing import Literal, Optional
 import torch
 from invokeai.backend.ip_adapter.ip_adapter import IPAdapter, IPAdapterPlus, build_ip_adapter
 from invokeai.backend.model_management.models.base import (
    BaseModelType,
    InvalidModelException,
    ModelBase,
    ModelConfigBase,
    ModelType,
    SubModelType,
    calc_model_size_by_fs,
    classproperty,
 )
 class IPAdapterModelFormat(str, Enum):
    # Formats reported by `IPAdapterModel.detect_format`. Members are also `str` instances.
    # The custom IP-Adapter model format defined by InvokeAI: a directory holding both
    # `ip_adapter.bin` and `image_encoder.txt`.
    InvokeAI = "invokeai"
 class IPAdapterModel(ModelBase):
    """Legacy model-manager wrapper for an IP-Adapter stored in the InvokeAI directory layout."""

    # Config schema for an IP-Adapter in InvokeAI format.
    class InvokeAIConfig(ModelConfigBase):
        model_format: Literal[IPAdapterModelFormat.InvokeAI]

    def __init__(self, model_path: str, base_model: BaseModelType, model_type: ModelType):
        """Set up the wrapper; `model_type` must be `ModelType.IPAdapter`."""
        assert model_type == ModelType.IPAdapter
        super().__init__(model_path, base_model, model_type)

        # Initial size derived from `self.model_path`; replaced in `get_model()`.
        self.model_size = calc_model_size_by_fs(self.model_path)

    @classmethod
    def detect_format(cls, path: str) -> str:
        """Return `IPAdapterModelFormat.InvokeAI` if `path` is a valid IP-Adapter directory.

        Raises:
            ModuleNotFoundError: If nothing exists at `path`.
            InvalidModelException: If `path` is not a directory containing both required files.
        """
        if not os.path.exists(path):
            raise ModuleNotFoundError(f"No IP-Adapter model at path '{path}'.")

        if os.path.isdir(path):
            # Weights file first, then the image-encoder pointer file.
            required_files = ("ip_adapter.bin", "image_encoder.txt")
            if all(os.path.exists(os.path.join(path, file_name)) for file_name in required_files):
                return IPAdapterModelFormat.InvokeAI

        raise InvalidModelException(f"Unexpected IP-Adapter model format: {path}")

    @classproperty
    def save_to_config(cls) -> bool:
        """Class-level flag; always True for IP-Adapter models."""
        return True

    def get_size(self, child_type: Optional[SubModelType] = None) -> int:
        """Return the currently recorded model size.

        Raises:
            ValueError: If a `child_type` is given; an IP-Adapter has no submodels.
        """
        if child_type is None:
            return self.model_size
        raise ValueError("There are no child models in an IP-Adapter model.")

    def get_model(
        self,
        torch_dtype: torch.dtype,
        child_type: Optional[SubModelType] = None,
    ) -> typing.Union[IPAdapter, IPAdapterPlus]:
        """Build the IP-Adapter from `ip_adapter.bin` on the CPU and return it.

        As a side effect, `self.model_size` is replaced with the value of `model.calc_size()`.

        Raises:
            ValueError: If `child_type` is not None.
        """
        if child_type is not None:
            raise ValueError("There are no child models in an IP-Adapter model.")

        checkpoint_file = os.path.join(self.model_path, "ip_adapter.bin")
        adapter = build_ip_adapter(
            ip_adapter_ckpt_path=checkpoint_file,
            device=torch.device("cpu"),
            dtype=torch_dtype,
        )

        self.model_size = adapter.calc_size()
        return adapter

    @classmethod
    def convert_if_required(
        cls,
        model_path: str,
        output_path: str,
        config: ModelConfigBase,
        base_model: BaseModelType,
    ) -> str:
        """Return `model_path` unchanged; no conversion is ever performed here.

        `output_path`, `config` and `base_model` are accepted but not used.

        Raises:
            ValueError: If the detected format is not `IPAdapterModelFormat.InvokeAI`.
            Whatever `detect_format` raises for a missing or unrecognised model.
        """
        detected = cls.detect_format(model_path)
        if detected != IPAdapterModelFormat.InvokeAI:
            raise ValueError(f"Unsupported format: '{detected}'.")
        return model_path
 def get_ip_adapter_image_encoder_model_id(model_path: str):
    """Return the image-encoder ID stored with the IP-Adapter at `model_path`.

    The ID is the first line of `<model_path>/image_encoder.txt`, with surrounding whitespace
    removed. Any further lines in the file are ignored.
    """
    pointer_file = os.path.join(model_path, "image_encoder.txt")
    with open(pointer_file, "r") as handle:
        first_line = handle.readline()
    return first_line.strip()
--- a/invokeai/backend/model_management_OLD/models/lora.py
+++ b/invokeai/backend/model_management_OLD/models/lora.py
@ -1,696 +0,0 @@
 import bisect
 import os
 from enum import Enum
 from pathlib import Path
 from typing import Dict, Optional, Union
 import torch
 from safetensors.torch import load_file
 from .base import (
    BaseModelType,
    InvalidModelException,
    ModelBase,
    ModelConfigBase,
    ModelNotFoundException,
    ModelType,
    SubModelType,
    classproperty,
 )
 class LoRAModelFormat(str, Enum):
    # Formats reported by `LoRAModel.detect_format`. Members are also `str` instances.
    # A single file ending in .safetensors / .ckpt / .pt.
    LyCORIS = "lycoris"
    # A directory containing `pytorch_lora_weights.safetensors` or `pytorch_lora_weights.bin`.
    Diffusers = "diffusers"
 class LoRAModel(ModelBase):
    """Legacy model-manager wrapper that loads LoRA-family weights as a `LoRAModelRaw`."""

    # model_size: int

    class Config(ModelConfigBase):
        model_format: LoRAModelFormat  # TODO:

    def __init__(self, model_path: str, base_model: BaseModelType, model_type: ModelType):
        """Set up the wrapper; `model_type` must be `ModelType.Lora`."""
        assert model_type == ModelType.Lora
        super().__init__(model_path, base_model, model_type)

        # Size reported by the filesystem for `self.model_path`; replaced in `get_model()`.
        self.model_size = os.path.getsize(self.model_path)

    def get_size(self, child_type: Optional[SubModelType] = None):
        """Return the currently recorded model size.

        Raises:
            Exception: If a `child_type` is given; a LoRA has no submodels.
        """
        if child_type is None:
            return self.model_size
        raise Exception("There is no child models in lora")

    def get_model(
        self,
        torch_dtype: Optional[torch.dtype],
        child_type: Optional[SubModelType] = None,
    ):
        """Load the weights at `self.model_path` and return them as a `LoRAModelRaw`.

        As a side effect, `self.model_size` is replaced with the value of `model.calc_size()`.

        Raises:
            Exception: If `child_type` is not None.
        """
        if child_type is not None:
            raise Exception("There is no child models in lora")

        lora = LoRAModelRaw.from_checkpoint(
            file_path=self.model_path,
            dtype=torch_dtype,
            base_model=self.base_model,
        )

        self.model_size = lora.calc_size()
        return lora

    @classproperty
    def save_to_config(cls) -> bool:
        """Class-level flag; always True for LoRA models."""
        return True

    @classmethod
    def detect_format(cls, path: str):
        """Classify `path` as a diffusers LoRA directory or a single LyCORIS-style file.

        Raises:
            ModelNotFoundException: If `path` does not exist.
            InvalidModelException: If `path` matches neither layout.
        """
        if not os.path.exists(path):
            raise ModelNotFoundException()

        if os.path.isdir(path):
            weight_files = (os.path.join(path, f"pytorch_lora_weights.{ext}") for ext in ["safetensors", "bin"])
            if any(os.path.exists(candidate) for candidate in weight_files):
                return LoRAModelFormat.Diffusers

        if os.path.isfile(path):
            if path.endswith((".safetensors", ".ckpt", ".pt")):
                return LoRAModelFormat.LyCORIS

        raise InvalidModelException(f"Not a valid model: {path}")

    @classmethod
    def convert_if_required(
        cls,
        model_path: str,
        output_path: str,
        config: ModelConfigBase,
        base_model: BaseModelType,
    ) -> str:
        """Return the path of the weights file to load; nothing is actually converted.

        For a diffusers directory this is the first existing `pytorch_lora_weights.*` file inside
        it (returned as a `Path`, safetensors preferred); otherwise it is `model_path` itself.
        `output_path`, `config` and `base_model` are accepted but not used.

        NOTE(review): if neither weights file exists by the time they are checked, the result is
        None rather than an error.
        """
        if cls.detect_format(model_path) != LoRAModelFormat.Diffusers:
            return model_path

        # return path to the weights file inside the folder
        candidates = (Path(model_path, f"pytorch_lora_weights.{ext}") for ext in ["safetensors", "bin"])
        return next((candidate for candidate in candidates if candidate.exists()), None)
 class LoRALayerBase:
    """Common state and helpers shared by all LoRA-style layer implementations.

    Holds the optional `alpha` scalar, an optional sparse `bias` tensor, the `rank` (filled in by
    subclasses) and the `layer_key` identifying the layer.
    """

    # rank: Optional[int]
    # alpha: Optional[float]
    # bias: Optional[torch.Tensor]
    # layer_key: str

    # @property
    # def scale(self):
    #    return self.alpha / self.rank if (self.alpha and self.rank) else 1.0

    def __init__(self, layer_key: str, values: dict):
        """Read `alpha` and the sparse bias (when all three bias entries are present) from `values`."""
        self.alpha = values["alpha"].item() if "alpha" in values else None

        bias_fields = ("bias_indices", "bias_values", "bias_size")
        if all(field in values for field in bias_fields):
            self.bias = torch.sparse_coo_tensor(
                values["bias_indices"],
                values["bias_values"],
                tuple(values["bias_size"]),
            )
        else:
            self.bias = None

        self.rank = None  # set in layer implementation
        self.layer_key = layer_key

    def get_weight(self, orig_weight: torch.Tensor):
        """Return the layer's weight; must be provided by subclasses."""
        raise NotImplementedError()

    def calc_size(self) -> int:
        """Return the number of bytes held by this base class (the bias only, 0 without one)."""
        if self.bias is None:
            return 0
        return self.bias.nelement() * self.bias.element_size()

    def to(
        self,
        device: Optional[torch.device] = None,
        dtype: Optional[torch.dtype] = None,
    ):
        """Move/cast the bias, if any, to `device` / `dtype` (replacing `self.bias`)."""
        if self.bias is None:
            return
        self.bias = self.bias.to(device=device, dtype=dtype)
 # TODO: find and debug lora/locon with bias
 class LoRALayer(LoRALayerBase):
    """Layer built from an up/down weight pair with an optional `mid` tensor between them."""

    # up: torch.Tensor
    # mid: Optional[torch.Tensor]
    # down: torch.Tensor

    def __init__(self, layer_key: str, values: dict):
        """Read `lora_up.weight`, `lora_down.weight` and, if present, `lora_mid.weight`."""
        super().__init__(layer_key, values)

        self.up = values["lora_up.weight"]
        self.down = values["lora_down.weight"]
        self.mid = values["lora_mid.weight"] if "lora_mid.weight" in values else None

        # Rank is the leading dimension of the down weight.
        self.rank = self.down.shape[0]

    def get_weight(self, orig_weight: torch.Tensor):
        """Return the combined weight; `orig_weight` is not used by this layer type."""
        if self.mid is None:
            # Flatten everything after the first dimension and multiply up @ down.
            flat_up = self.up.reshape(self.up.shape[0], -1)
            flat_down = self.down.reshape(self.down.shape[0], -1)
            return flat_up @ flat_down

        up_2d = self.up.reshape(self.up.shape[0], self.up.shape[1])
        down_2d = self.down.reshape(self.down.shape[0], self.down.shape[1])
        return torch.einsum("m n w h, i m, n j -> i j w h", self.mid, up_2d, down_2d)

    def calc_size(self) -> int:
        """Return the byte size of the base-class state plus every tensor held here."""
        own_tensors = (self.up, self.mid, self.down)
        return super().calc_size() + sum(t.nelement() * t.element_size() for t in own_tensors if t is not None)

    def to(
        self,
        device: Optional[torch.device] = None,
        dtype: Optional[torch.dtype] = None,
    ):
        """Move/cast all tensors of this layer to `device` / `dtype`."""
        super().to(device=device, dtype=dtype)

        self.up = self.up.to(device=device, dtype=dtype)
        self.down = self.down.to(device=device, dtype=dtype)
        if self.mid is None:
            return
        self.mid = self.mid.to(device=device, dtype=dtype)
 class LoHALayer(LoRALayerBase):
    """Layer whose weight is the element-wise product of two factored matrices (`hada_*` keys)."""

    # w1_a: torch.Tensor
    # w1_b: torch.Tensor
    # w2_a: torch.Tensor
    # w2_b: torch.Tensor
    # t1: Optional[torch.Tensor] = None
    # t2: Optional[torch.Tensor] = None

    def __init__(self, layer_key: str, values: dict):
        """Read the four `hada_w*` factors and the optional `hada_t1` / `hada_t2` tensors."""
        super().__init__(layer_key, values)

        self.w1_a = values["hada_w1_a"]
        self.w1_b = values["hada_w1_b"]
        self.w2_a = values["hada_w2_a"]
        self.w2_b = values["hada_w2_b"]

        self.t1 = values["hada_t1"] if "hada_t1" in values else None
        self.t2 = values["hada_t2"] if "hada_t2" in values else None

        # Rank is the leading dimension of w1_b.
        self.rank = self.w1_b.shape[0]

    def get_weight(self, orig_weight: torch.Tensor):
        """Return the combined weight; `orig_weight` is not used by this layer type."""
        if self.t1 is None:
            return (self.w1_a @ self.w1_b) * (self.w2_a @ self.w2_b)

        # With a t1 tensor present, both halves are rebuilt through einsum before multiplying.
        first = torch.einsum("i j k l, j r, i p -> p r k l", self.t1, self.w1_b, self.w1_a)
        second = torch.einsum("i j k l, j r, i p -> p r k l", self.t2, self.w2_b, self.w2_a)
        return first * second

    def calc_size(self) -> int:
        """Return the byte size of the base-class state plus every tensor held here."""
        own_tensors = (self.w1_a, self.w1_b, self.w2_a, self.w2_b, self.t1, self.t2)
        return super().calc_size() + sum(t.nelement() * t.element_size() for t in own_tensors if t is not None)

    def to(
        self,
        device: Optional[torch.device] = None,
        dtype: Optional[torch.dtype] = None,
    ):
        """Move/cast all tensors of this layer to `device` / `dtype`."""
        super().to(device=device, dtype=dtype)

        # Required factors are always present; t1 / t2 only when the checkpoint provided them.
        for attr in ("w1_a", "w1_b", "w2_a", "w2_b"):
            setattr(self, attr, getattr(self, attr).to(device=device, dtype=dtype))
        for attr in ("t1", "t2"):
            tensor = getattr(self, attr)
            if tensor is not None:
                setattr(self, attr, tensor.to(device=device, dtype=dtype))
 class LoKRLayer(LoRALayerBase):
    """Layer whose weight is the Kronecker product (`torch.kron`) of two factors.

    Each factor is stored either whole (`w1` / `w2`) or as an `_a` / `_b` pair; the second factor
    may additionally carry a `t2` tensor.
    """

    # w1: Optional[torch.Tensor] = None
    # w1_a: Optional[torch.Tensor] = None
    # w1_b: Optional[torch.Tensor] = None
    # w2: Optional[torch.Tensor] = None
    # w2_a: Optional[torch.Tensor] = None
    # w2_b: Optional[torch.Tensor] = None
    # t2: Optional[torch.Tensor] = None

    def __init__(self, layer_key: str, values: dict):
        """Read the `lokr_*` entries from `values`; a missing whole factor requires its a/b pair."""
        super().__init__(layer_key, values)

        # First factor: whole tensor, or the (w1_a, w1_b) pair.
        self.w1 = self.w1_a = self.w1_b = None
        if "lokr_w1" in values:
            self.w1 = values["lokr_w1"]
        else:
            self.w1_a = values["lokr_w1_a"]
            self.w1_b = values["lokr_w1_b"]

        # Second factor: whole tensor, or the (w2_a, w2_b) pair.
        self.w2 = self.w2_a = self.w2_b = None
        if "lokr_w2" in values:
            self.w2 = values["lokr_w2"]
        else:
            self.w2_a = values["lokr_w2_a"]
            self.w2_b = values["lokr_w2_b"]

        self.t2 = values["lokr_t2"] if "lokr_t2" in values else None

        # Rank comes from the first available `_b` tensor; None means unscaled.
        rank_source = next((key for key in ("lokr_w1_b", "lokr_w2_b") if key in values), None)
        self.rank = values[rank_source].shape[0] if rank_source is not None else None

    def get_weight(self, orig_weight: torch.Tensor):
        """Return the combined weight; `orig_weight` is not used by this layer type."""
        w1 = self.w1 if self.w1 is not None else self.w1_a @ self.w1_b

        if self.w2 is not None:
            w2 = self.w2
        elif self.t2 is None:
            w2 = self.w2_a @ self.w2_b
        else:
            w2 = torch.einsum("i j k l, i p, j r -> p r k l", self.t2, self.w2_a, self.w2_b)

        # A 4-dimensional second factor needs two trailing singleton dims on the first one.
        if len(w2.shape) == 4:
            w1 = w1.unsqueeze(2).unsqueeze(2)

        return torch.kron(w1, w2.contiguous())

    def calc_size(self) -> int:
        """Return the byte size of the base-class state plus every tensor held here."""
        own_tensors = (self.w1, self.w1_a, self.w1_b, self.w2, self.w2_a, self.w2_b, self.t2)
        return super().calc_size() + sum(t.nelement() * t.element_size() for t in own_tensors if t is not None)

    def to(
        self,
        device: Optional[torch.device] = None,
        dtype: Optional[torch.dtype] = None,
    ):
        """Move/cast all tensors of this layer to `device` / `dtype`."""
        super().to(device=device, dtype=dtype)

        if self.w1 is None:
            self.w1_a = self.w1_a.to(device=device, dtype=dtype)
            self.w1_b = self.w1_b.to(device=device, dtype=dtype)
        else:
            self.w1 = self.w1.to(device=device, dtype=dtype)

        if self.w2 is None:
            self.w2_a = self.w2_a.to(device=device, dtype=dtype)
            self.w2_b = self.w2_b.to(device=device, dtype=dtype)
        else:
            self.w2 = self.w2.to(device=device, dtype=dtype)

        if self.t2 is not None:
            self.t2 = self.t2.to(device=device, dtype=dtype)
 class FullLayer(LoRALayerBase):
    """Layer that stores a complete weight tensor under the single key `diff`."""

    # weight: torch.Tensor

    def __init__(self, layer_key: str, values: dict):
        """Read `diff` from `values`.

        Raises:
            NotImplementedError: If `values` contains any key other than `diff`.
        """
        super().__init__(layer_key, values)

        self.weight = values["diff"]

        unexpected = [key for key in values if key != "diff"]
        if unexpected:
            raise NotImplementedError(f"Unexpected keys in lora diff layer: {unexpected}")

        self.rank = None  # unscaled

    def get_weight(self, orig_weight: torch.Tensor):
        """Return the stored tensor as-is; `orig_weight` is not used."""
        return self.weight

    def calc_size(self) -> int:
        """Return the byte size of the base-class state plus the stored weight."""
        weight_bytes = self.weight.nelement() * self.weight.element_size()
        return super().calc_size() + weight_bytes

    def to(
        self,
        device: Optional[torch.device] = None,
        dtype: Optional[torch.dtype] = None,
    ):
        """Move/cast the stored weight (and base-class state) to `device` / `dtype`."""
        super().to(device=device, dtype=dtype)
        self.weight = self.weight.to(device=device, dtype=dtype)
 class IA3Layer(LoRALayerBase):
    """Layer that rescales the original weight by a learned vector (`weight` / `on_input` keys)."""

    # weight: torch.Tensor
    # on_input: torch.Tensor

    def __init__(self, layer_key: str, values: dict):
        """Read `weight` and `on_input` from `values`."""
        super().__init__(layer_key, values)

        self.weight = values["weight"]
        self.on_input = values["on_input"]

        self.rank = None  # unscaled

    def get_weight(self, orig_weight: torch.Tensor):
        """Return `orig_weight` multiplied by the stored scaling tensor.

        When `on_input` is falsy the scaling tensor is first reshaped to a single column.
        """
        scale = self.weight if self.on_input else self.weight.reshape(-1, 1)
        return orig_weight * scale

    def calc_size(self) -> int:
        """Return the byte size of the base-class state plus both stored tensors."""
        own_tensors = (self.weight, self.on_input)
        return super().calc_size() + sum(t.nelement() * t.element_size() for t in own_tensors)

    def to(
        self,
        device: Optional[torch.device] = None,
        dtype: Optional[torch.dtype] = None,
    ):
        """Move/cast both stored tensors (and base-class state) to `device` / `dtype`."""
        super().to(device=device, dtype=dtype)

        self.weight = self.weight.to(device=device, dtype=dtype)
        self.on_input = self.on_input.to(device=device, dtype=dtype)
 # TODO: rename all methods used in model logic with Info postfix and remove here Raw postfix
 class LoRAModelRaw:  # (torch.nn.Module):
    """A named collection of parsed LoRA-style layers, keyed by layer name."""

    _name: str
    layers: Dict[str, LoRALayer]

    def __init__(
        self,
        name: str,
        layers: Dict[str, LoRALayer],
    ):
        """Store the model name and its layer mapping (the mapping is kept by reference)."""
        self._name = name
        self.layers = layers

    @property
    def name(self):
        """The name given at construction time."""
        return self._name

    def to(
        self,
        device: Optional[torch.device] = None,
        dtype: Optional[torch.dtype] = None,
    ):
        """Move/cast every layer to `device` / `dtype`, one after another."""
        # TODO: try revert if exception?
        for layer in self.layers.values():
            layer.to(device=device, dtype=dtype)

    def calc_size(self) -> int:
        """Return the sum of `calc_size()` over all layers."""
        total = 0
        for layer in self.layers.values():
            total += layer.calc_size()
        return total

    @classmethod
    def _convert_sdxl_keys_to_diffusers_format(cls, state_dict):
        """Convert the keys of an SDXL LoRA state_dict to diffusers format.

        The input state_dict can be in either Stability AI format or diffusers format. If the state_dict is already in
        diffusers format, then this function will have no effect.

        This function is adapted from:
        https://github.com/bmaltais/kohya_ss/blob/2accb1305979ba62f5077a23aabac23b4c37e935/networks/lora_diffusers.py#L385-L409

        Args:
            state_dict (Dict[str, Tensor]): The SDXL LoRA state_dict.

        Raises:
            ValueError: If state_dict contains an unrecognized key, or not all keys could be converted.

        Returns:
            Dict[str, Tensor]: The diffusers-format state_dict.
        """
        converted_count = 0  # Stability AI keys rewritten to diffusers format.
        not_converted_count = 0  # `lora_unet_` keys left untouched.

        # Sorted so that the longest-matching-prefix candidate can be located with bisect. For
        # example, `input_blocks_4_1` is the candidate found when searching for
        # `input_blocks_4_1_proj_in`.
        stability_unet_keys = sorted(SDXL_UNET_STABILITY_TO_DIFFUSERS_MAP)

        new_state_dict = {}
        for full_key, value in state_dict.items():
            if full_key.startswith("lora_unet_"):
                search_key = full_key.replace("lora_unet_", "")
                # The entry just left of the insertion point is the only one that *may* be a
                # prefix of search_key; verify it before using it.
                insert_at = bisect.bisect_right(stability_unet_keys, search_key)
                candidate = stability_unet_keys[insert_at - 1]
                if not search_key.startswith(candidate):
                    new_state_dict[full_key] = value
                    not_converted_count += 1
                    continue
                new_key = full_key.replace(candidate, SDXL_UNET_STABILITY_TO_DIFFUSERS_MAP[candidate])
                new_state_dict[new_key] = value
                converted_count += 1
            elif full_key.startswith(("lora_te1_", "lora_te2_")):
                # The CLIP text encoders have the same keys in both Stability AI and diffusers formats.
                new_state_dict[full_key] = value
            else:
                raise ValueError(f"Unrecognized SDXL LoRA key prefix: '{full_key}'.")

        # A mix of converted and unconverted UNet keys means the file is in neither format.
        if converted_count > 0 and not_converted_count > 0:
            raise ValueError(
                f"The SDXL LoRA could only be partially converted to diffusers format. converted={converted_count},"
                f" not_converted={not_converted_count}"
            )

        return new_state_dict

    @classmethod
    def from_checkpoint(
        cls,
        file_path: Union[str, Path],
        device: Optional[torch.device] = None,
        dtype: Optional[torch.dtype] = None,
        base_model: Optional[BaseModelType] = None,
    ):
        """Load a weights file and parse it into a model of typed layers.

        Args:
            file_path: Weights file; `.safetensors` files are read with `load_file`, anything else
                with `torch.load`.
            device: Target device for the parsed layers (CPU when omitted).
            dtype: Target dtype for the parsed layers (`torch.float32` when omitted).
            base_model: When `BaseModelType.StableDiffusionXL`, keys are first converted to
                diffusers naming.

        Raises:
            Exception: If a layer's keys match none of the known layer kinds.
        """
        target_device = device or torch.device("cpu")
        target_dtype = dtype or torch.float32

        checkpoint = Path(file_path) if isinstance(file_path, str) else file_path

        model = cls(
            name=checkpoint.stem,  # TODO:
            layers={},
        )

        if checkpoint.suffix == ".safetensors":
            raw_state = load_file(checkpoint.absolute().as_posix(), device="cpu")
        else:
            # NOTE(review): torch.load unpickles the file; only safe for trusted checkpoints.
            raw_state = torch.load(checkpoint, map_location="cpu")

        grouped_state = cls._group_state(raw_state)

        if base_model == BaseModelType.StableDiffusionXL:
            grouped_state = cls._convert_sdxl_keys_to_diffusers_format(grouped_state)

        # The order of these checks decides which layer kind wins when several keys are present.
        for layer_key, values in grouped_state.items():
            if "lora_down.weight" in values:  # lora and locon
                layer = LoRALayer(layer_key, values)
            elif "hada_w1_b" in values:  # loha
                layer = LoHALayer(layer_key, values)
            elif "lokr_w1_b" in values or "lokr_w1" in values:  # lokr
                layer = LoKRLayer(layer_key, values)
            elif "diff" in values:  # diff
                layer = FullLayer(layer_key, values)
            elif "weight" in values and "on_input" in values:  # ia3
                layer = IA3Layer(layer_key, values)
            else:
                print(f">> Encountered unknown lora layer module in {model.name}: {layer_key} - {list(values.keys())}")
                raise Exception("Unknown lora format!")

            # lower memory consumption by removing already parsed layer values
            values.clear()

            layer.to(device=target_device, dtype=target_dtype)
            model.layers[layer_key] = layer

        return model

    @staticmethod
    def _group_state(state_dict: dict):
        """Regroup a flat state dict into `{stem: {leaf: value}}`, splitting keys at the first dot."""
        grouped = {}
        for key, value in state_dict.items():
            stem, leaf = key.split(".", 1)
            grouped.setdefault(stem, {})[leaf] = value
        return grouped
 # code from
 # https://github.com/bmaltais/kohya_ss/blob/2accb1305979ba62f5077a23aabac23b4c37e935/networks/lora_diffusers.py#L15C1-L97C32
 def make_sdxl_unet_conversion_map():
    """Create a list of (Stability AI prefix, diffusers prefix) pairs for SDXL UNet state_dict keys.

    Every entry is a pair of dotted key prefixes ending in "."; resnet blocks are expanded into one
    entry per inner sub-layer.
    """
    layer_prefixes = []
    for block in range(3):  # num_blocks is 3 in sdxl
        # Down blocks: two resnet/attention pairs each.
        for idx in range(2):
            sd_input = f"input_blocks.{3*block + idx + 1}"
            layer_prefixes.append((f"{sd_input}.0.", f"down_blocks.{block}.resnets.{idx}."))
            layer_prefixes.append((f"{sd_input}.1.", f"down_blocks.{block}.attentions.{idx}."))

        # Up blocks: three resnet/attention pairs each.
        for idx in range(3):
            sd_output = f"output_blocks.{3*block + idx}"
            layer_prefixes.append((f"{sd_output}.0.", f"up_blocks.{block}.resnets.{idx}."))
            layer_prefixes.append((f"{sd_output}.1.", f"up_blocks.{block}.attentions.{idx}."))

        # One downsampler and one upsampler entry per block index.
        layer_prefixes.append((f"input_blocks.{3*(block+1)}.0.op.", f"down_blocks.{block}.downsamplers.0.conv."))
        layer_prefixes.append((f"output_blocks.{3*block + 2}.2.", f"up_blocks.{block}.upsamplers.0."))

    # Middle block: one attention followed by two resnets.
    layer_prefixes.append(("middle_block.1.", "mid_block.attentions.0."))
    layer_prefixes.extend((f"middle_block.{2*idx}.", f"mid_block.resnets.{idx}.") for idx in range(2))

    # (stable-diffusion, HF Diffusers) names of the sub-layers inside a resnet block.
    resnet_sublayers = (
        ("in_layers.0.", "norm1."),
        ("in_layers.2.", "conv1."),
        ("out_layers.0.", "norm2."),
        ("out_layers.3.", "conv2."),
        ("emb_layers.1.", "time_emb_proj."),
        ("skip_connection.", "conv_shortcut."),
    )

    conversion_map = []
    for sd_prefix, hf_prefix in layer_prefixes:
        if "resnets" not in hf_prefix:
            conversion_map.append((sd_prefix, hf_prefix))
            continue
        conversion_map.extend((sd_prefix + sd_sub, hf_prefix + hf_sub) for sd_sub, hf_sub in resnet_sublayers)

    # Time and label embeddings: two linear layers each.
    conversion_map.extend((f"time_embed.{idx*2}.", f"time_embedding.linear_{idx+1}.") for idx in range(2))
    conversion_map.extend((f"label_emb.0.{idx*2}.", f"add_embedding.linear_{idx+1}.") for idx in range(2))

    # Input and output convolutions / norm.
    conversion_map += [
        ("input_blocks.0.0.", "conv_in."),
        ("out.0.", "conv_norm_out."),
        ("out.2.", "conv_out."),
    ]

    return conversion_map
 # Lookup from Stability AI SDXL UNet key prefixes to their diffusers equivalents, with the
 # trailing "." dropped and the remaining dots turned into underscores on both sides.
 SDXL_UNET_STABILITY_TO_DIFFUSERS_MAP = {
    sd_prefix.rstrip(".").replace(".", "_"): hf_prefix.rstrip(".").replace(".", "_")
    for sd_prefix, hf_prefix in make_sdxl_unet_conversion_map()
 }
--- a/invokeai/backend/model_management_OLD/models/sdxl.py
+++ b/invokeai/backend/model_management_OLD/models/sdxl.py
@ -1,148 +0,0 @@
 import json
 import os
 from enum import Enum
 from pathlib import Path
 from typing import Literal, Optional
 from omegaconf import OmegaConf
 from pydantic import Field
 from invokeai.app.services.config import InvokeAIAppConfig
 from invokeai.backend.model_management.detect_baked_in_vae import has_baked_in_sdxl_vae
 from invokeai.backend.util.logging import InvokeAILogger
 from .base import (
    BaseModelType,
    DiffusersModel,
    InvalidModelException,
    ModelConfigBase,
    ModelType,
    ModelVariantType,
    classproperty,
    read_checkpoint_meta,
 )
 class StableDiffusionXLModelFormat(str, Enum):
    """Storage formats distinguished for Stable Diffusion XL main models."""
    # Reported by StableDiffusionXLModel.detect_format() for a path that is not a directory.
    Checkpoint = "checkpoint"
    # Reported by StableDiffusionXLModel.detect_format() for a directory path.
    Diffusers = "diffusers"
 class StableDiffusionXLModel(DiffusersModel):
    """Main-model handler for Stable Diffusion XL in checkpoint or diffusers form."""
    # TODO: check that configs overwritten properly
    class DiffusersConfig(ModelConfigBase):
        model_format: Literal[StableDiffusionXLModelFormat.Diffusers]
        vae: Optional[str] = Field(None)
        variant: ModelVariantType
    class CheckpointConfig(ModelConfigBase):
        model_format: Literal[StableDiffusionXLModelFormat.Checkpoint]
        vae: Optional[str] = Field(None)
        config: str
        variant: ModelVariantType
    def __init__(self, model_path: str, base_model: BaseModelType, model_type: ModelType):
        """Check the base/type pair, then initialise the parent as an SDXL main model."""
        assert base_model in {BaseModelType.StableDiffusionXL, BaseModelType.StableDiffusionXLRefiner}
        assert model_type == ModelType.Main
        # NOTE(review): a refiner base passes the assert above, yet the parent is
        # always initialised with StableDiffusionXL -- confirm this is intended.
        super().__init__(
            model_path=model_path,
            base_model=BaseModelType.StableDiffusionXL,
            model_type=ModelType.Main,
        )
    @classmethod
    def probe_config(cls, path: str, **kwargs):
        """Inspect the model at ``path`` and build its configuration.
        The UNet input-channel count is read from the legacy YAML config (when
        ``config`` is given in ``kwargs``), from the checkpoint weights, or from
        ``unet/config.json`` of a diffusers folder, and is mapped to a variant.
        When no ``config`` was given, one is selected from the ``model_base``
        keyword (default: StableDiffusionXL) and the detected variant.
        Raises:
            InvalidModelException: a diffusers folder has no ``unet/config.json``.
            Exception: the channel count matches no known variant.
        """
        model_format = cls.detect_format(path)
        ckpt_config_path = kwargs.get("config", None)
        if model_format == StableDiffusionXLModelFormat.Checkpoint:
            if ckpt_config_path:
                ckpt_config = OmegaConf.load(ckpt_config_path)
                in_channels = ckpt_config["model"]["params"]["unet_config"]["params"]["in_channels"]
            else:
                checkpoint = read_checkpoint_meta(path)
                # weights may sit under "state_dict" or at the top level
                checkpoint = checkpoint.get("state_dict", checkpoint)
                # shape[1] of this weight is taken as the input-channel count
                in_channels = checkpoint["model.diffusion_model.input_blocks.0.0.weight"].shape[1]
        elif model_format == StableDiffusionXLModelFormat.Diffusers:
            unet_config_path = os.path.join(path, "unet", "config.json")
            if not os.path.exists(unet_config_path):
                raise InvalidModelException(f"{path} is not a recognized Stable Diffusion diffusers model")
            # JSON is read as UTF-8 explicitly rather than with the platform default
            with open(unet_config_path, "r", encoding="utf-8") as f:
                unet_config = json.load(f)
            in_channels = unet_config["in_channels"]
        else:
            raise NotImplementedError(f"Unknown stable diffusion XL format: {model_format}")
        if in_channels == 9:
            variant = ModelVariantType.Inpaint
        elif in_channels == 5:
            variant = ModelVariantType.Depth
        elif in_channels == 4:
            variant = ModelVariantType.Normal
        else:
            raise Exception("Unknown stable diffusion XL model format")
        if ckpt_config_path is None:
            # avoid circular import
            from .stable_diffusion import _select_ckpt_config
            ckpt_config_path = _select_ckpt_config(kwargs.get("model_base", BaseModelType.StableDiffusionXL), variant)
        return cls.create_config(
            path=path,
            model_format=model_format,
            config=ckpt_config_path,
            variant=variant,
        )
    @classproperty
    def save_to_config(cls) -> bool:
        """Always True for this model class."""
        return True
    @classmethod
    def detect_format(cls, model_path: str):
        """Report Diffusers for a directory and Checkpoint for anything else."""
        if os.path.isdir(model_path):
            return StableDiffusionXLModelFormat.Diffusers
        else:
            return StableDiffusionXLModelFormat.Checkpoint
    @classmethod
    def convert_if_required(
        cls,
        model_path: str,
        output_path: str,
        config: ModelConfigBase,
        base_model: BaseModelType,
    ) -> str:
        """Return a diffusers-format location for the model, converting a checkpoint if needed.
        An existing ``output_path`` is returned untouched. A checkpoint config
        triggers conversion into ``output_path``; any other config returns
        ``model_path`` unchanged.
        """
        # The convert script adapted from the diffusers package uses
        # strings for the base model type. To avoid making too many
        # source code changes, we simply translate here
        if Path(output_path).exists():
            return output_path
        if isinstance(config, cls.CheckpointConfig):
            from invokeai.backend.model_management.models.stable_diffusion import _convert_ckpt_and_cache
            # Hack in VAE-fp16 fix - If model sdxl-vae-fp16-fix is installed,
            # then we bake it into the converted model unless there is already
            # a nonstandard VAE installed.
            kwargs = {}
            app_config = InvokeAIAppConfig.get_config()
            vae_path = app_config.models_path / "sdxl/vae/sdxl-vae-fp16-fix"
            if vae_path.exists() and not has_baked_in_sdxl_vae(Path(model_path)):
                InvokeAILogger.get_logger().warning("No baked-in VAE detected. Inserting sdxl-vae-fp16-fix.")
                kwargs["vae_path"] = vae_path
            return _convert_ckpt_and_cache(
                version=base_model,
                model_config=config,
                output_path=output_path,
                use_safetensors=True,
                **kwargs,
            )
        else:
            return model_path
--- a/invokeai/backend/model_management_OLD/models/stable_diffusion.py
+++ b/invokeai/backend/model_management_OLD/models/stable_diffusion.py
@ -1,337 +0,0 @@
 import json
 import os
 from enum import Enum
 from pathlib import Path
 from typing import Literal, Optional, Union
 from diffusers import StableDiffusionInpaintPipeline, StableDiffusionPipeline
 from omegaconf import OmegaConf
 from pydantic import Field
 import invokeai.backend.util.logging as logger
 from invokeai.app.services.config import InvokeAIAppConfig
 from .base import (
    BaseModelType,
    DiffusersModel,
    InvalidModelException,
    ModelConfigBase,
    ModelNotFoundException,
    ModelType,
    ModelVariantType,
    SilenceWarnings,
    classproperty,
    read_checkpoint_meta,
 )
 from .sdxl import StableDiffusionXLModel
 class StableDiffusion1ModelFormat(str, Enum):
    """Storage formats distinguished for Stable Diffusion 1.x main models."""
    # Reported by StableDiffusion1Model.detect_format() for a .safetensors/.ckpt/.pt file.
    Checkpoint = "checkpoint"
    # Reported by StableDiffusion1Model.detect_format() for a directory holding model_index.json.
    Diffusers = "diffusers"
 class StableDiffusion1Model(DiffusersModel):
    """Main-model handler for Stable Diffusion 1.x in checkpoint or diffusers form."""
    class DiffusersConfig(ModelConfigBase):
        model_format: Literal[StableDiffusion1ModelFormat.Diffusers]
        vae: Optional[str] = Field(None)
        variant: ModelVariantType
    class CheckpointConfig(ModelConfigBase):
        model_format: Literal[StableDiffusion1ModelFormat.Checkpoint]
        vae: Optional[str] = Field(None)
        config: str
        variant: ModelVariantType
    def __init__(self, model_path: str, base_model: BaseModelType, model_type: ModelType):
        """Check the base/type pair, then initialise the parent as an SD-1 main model."""
        assert base_model == BaseModelType.StableDiffusion1
        assert model_type == ModelType.Main
        super().__init__(
            model_path=model_path,
            base_model=BaseModelType.StableDiffusion1,
            model_type=ModelType.Main,
        )
    @classmethod
    def probe_config(cls, path: str, **kwargs):
        """Inspect the model at ``path`` and build its configuration.
        The UNet input-channel count is read from the legacy YAML config (when
        ``config`` is given in ``kwargs``), from the checkpoint weights, or from
        ``unet/config.json`` of a diffusers folder: 9 channels select the
        inpaint variant and 4 the normal one.
        Raises:
            NotImplementedError: a diffusers folder has no ``unet/config.json``.
            Exception: the channel count matches no known variant.
        """
        model_format = cls.detect_format(path)
        ckpt_config_path = kwargs.get("config", None)
        if model_format == StableDiffusion1ModelFormat.Checkpoint:
            if ckpt_config_path:
                ckpt_config = OmegaConf.load(ckpt_config_path)
                # The value must be bound: it selects the variant below. It was
                # previously looked up and thrown away, leaving in_channels unset.
                in_channels = ckpt_config["model"]["params"]["unet_config"]["params"]["in_channels"]
            else:
                checkpoint = read_checkpoint_meta(path)
                # weights may sit under "state_dict" or at the top level
                checkpoint = checkpoint.get("state_dict", checkpoint)
                # shape[1] of this weight is taken as the input-channel count
                in_channels = checkpoint["model.diffusion_model.input_blocks.0.0.weight"].shape[1]
        elif model_format == StableDiffusion1ModelFormat.Diffusers:
            unet_config_path = os.path.join(path, "unet", "config.json")
            if not os.path.exists(unet_config_path):
                raise NotImplementedError(f"{path} is not a supported stable diffusion diffusers format")
            with open(unet_config_path, "r", encoding="utf-8") as f:
                unet_config = json.load(f)
            in_channels = unet_config["in_channels"]
        else:
            raise NotImplementedError(f"Unknown stable diffusion 1.* format: {model_format}")
        if in_channels == 9:
            variant = ModelVariantType.Inpaint
        elif in_channels == 4:
            variant = ModelVariantType.Normal
        else:
            raise Exception("Unkown stable diffusion 1.* model format")
        if ckpt_config_path is None:
            ckpt_config_path = _select_ckpt_config(BaseModelType.StableDiffusion1, variant)
        return cls.create_config(
            path=path,
            model_format=model_format,
            config=ckpt_config_path,
            variant=variant,
        )
    @classproperty
    def save_to_config(cls) -> bool:
        """Always True for this model class."""
        return True
    @classmethod
    def detect_format(cls, model_path: str):
        """Classify ``model_path`` as a diffusers folder or a checkpoint file.
        Raises:
            ModelNotFoundException: the path does not exist.
            InvalidModelException: the path is neither a folder containing
                ``model_index.json`` nor a .safetensors/.ckpt/.pt file.
        """
        if not os.path.exists(model_path):
            raise ModelNotFoundException()
        if os.path.isdir(model_path):
            if os.path.exists(os.path.join(model_path, "model_index.json")):
                return StableDiffusion1ModelFormat.Diffusers
        if os.path.isfile(model_path):
            if model_path.endswith((".safetensors", ".ckpt", ".pt")):
                return StableDiffusion1ModelFormat.Checkpoint
        raise InvalidModelException(f"Not a valid model: {model_path}")
    @classmethod
    def convert_if_required(
        cls,
        model_path: str,
        output_path: str,
        config: ModelConfigBase,
        base_model: BaseModelType,
    ) -> str:
        """Convert a checkpoint config into ``output_path``; otherwise return ``model_path``."""
        if isinstance(config, cls.CheckpointConfig):
            return _convert_ckpt_and_cache(
                version=BaseModelType.StableDiffusion1,
                model_config=config,
                load_safety_checker=False,
                output_path=output_path,
            )
        else:
            return model_path
 class StableDiffusion2ModelFormat(str, Enum):
    """Storage formats distinguished for Stable Diffusion 2.x main models."""
    # Reported by StableDiffusion2Model.detect_format() for a .safetensors/.ckpt/.pt file.
    Checkpoint = "checkpoint"
    # Reported by StableDiffusion2Model.detect_format() for a directory holding model_index.json.
    Diffusers = "diffusers"
 class StableDiffusion2Model(DiffusersModel):
    """Main-model handler for Stable Diffusion 2.x in checkpoint or diffusers form."""
    # TODO: check that configs overwritten properly
    class DiffusersConfig(ModelConfigBase):
        model_format: Literal[StableDiffusion2ModelFormat.Diffusers]
        vae: Optional[str] = Field(None)
        variant: ModelVariantType
    class CheckpointConfig(ModelConfigBase):
        model_format: Literal[StableDiffusion2ModelFormat.Checkpoint]
        vae: Optional[str] = Field(None)
        config: str
        variant: ModelVariantType
    def __init__(self, model_path: str, base_model: BaseModelType, model_type: ModelType):
        """Check the base/type pair, then initialise the parent as an SD-2 main model."""
        assert base_model == BaseModelType.StableDiffusion2
        assert model_type == ModelType.Main
        super().__init__(
            model_path=model_path,
            base_model=BaseModelType.StableDiffusion2,
            model_type=ModelType.Main,
        )
    @classmethod
    def probe_config(cls, path: str, **kwargs):
        """Inspect the model at ``path`` and build its configuration.
        The UNet input-channel count is read from the legacy YAML config (when
        ``config`` is given in ``kwargs``), from the checkpoint weights, or from
        ``unet/config.json`` of a diffusers folder: 9 channels select the
        inpaint variant, 5 the depth variant and 4 the normal one.
        Raises:
            Exception: a diffusers folder has no ``unet/config.json``, or the
                channel count matches no known variant.
        """
        model_format = cls.detect_format(path)
        ckpt_config_path = kwargs.get("config", None)
        if model_format == StableDiffusion2ModelFormat.Checkpoint:
            if ckpt_config_path:
                ckpt_config = OmegaConf.load(ckpt_config_path)
                # The value must be bound: it selects the variant below. It was
                # previously looked up and thrown away, leaving in_channels unset.
                in_channels = ckpt_config["model"]["params"]["unet_config"]["params"]["in_channels"]
            else:
                checkpoint = read_checkpoint_meta(path)
                # weights may sit under "state_dict" or at the top level
                checkpoint = checkpoint.get("state_dict", checkpoint)
                # shape[1] of this weight is taken as the input-channel count
                in_channels = checkpoint["model.diffusion_model.input_blocks.0.0.weight"].shape[1]
        elif model_format == StableDiffusion2ModelFormat.Diffusers:
            unet_config_path = os.path.join(path, "unet", "config.json")
            if not os.path.exists(unet_config_path):
                raise Exception("Not supported stable diffusion diffusers format(possibly onnx?)")
            with open(unet_config_path, "r", encoding="utf-8") as f:
                unet_config = json.load(f)
            in_channels = unet_config["in_channels"]
        else:
            raise NotImplementedError(f"Unknown stable diffusion 2.* format: {model_format}")
        if in_channels == 9:
            variant = ModelVariantType.Inpaint
        elif in_channels == 5:
            variant = ModelVariantType.Depth
        elif in_channels == 4:
            variant = ModelVariantType.Normal
        else:
            raise Exception("Unkown stable diffusion 2.* model format")
        if ckpt_config_path is None:
            ckpt_config_path = _select_ckpt_config(BaseModelType.StableDiffusion2, variant)
        return cls.create_config(
            path=path,
            model_format=model_format,
            config=ckpt_config_path,
            variant=variant,
        )
    @classproperty
    def save_to_config(cls) -> bool:
        """Always True for this model class."""
        return True
    @classmethod
    def detect_format(cls, model_path: str):
        """Classify ``model_path`` as a diffusers folder or a checkpoint file.
        Raises:
            ModelNotFoundException: the path does not exist.
            InvalidModelException: the path is neither a folder containing
                ``model_index.json`` nor a .safetensors/.ckpt/.pt file.
        """
        if not os.path.exists(model_path):
            raise ModelNotFoundException()
        if os.path.isdir(model_path):
            if os.path.exists(os.path.join(model_path, "model_index.json")):
                return StableDiffusion2ModelFormat.Diffusers
        if os.path.isfile(model_path):
            if model_path.endswith((".safetensors", ".ckpt", ".pt")):
                return StableDiffusion2ModelFormat.Checkpoint
        raise InvalidModelException(f"Not a valid model: {model_path}")
    @classmethod
    def convert_if_required(
        cls,
        model_path: str,
        output_path: str,
        config: ModelConfigBase,
        base_model: BaseModelType,
    ) -> str:
        """Convert a checkpoint config into ``output_path``; otherwise return ``model_path``."""
        if isinstance(config, cls.CheckpointConfig):
            return _convert_ckpt_and_cache(
                version=BaseModelType.StableDiffusion2,
                model_config=config,
                output_path=output_path,
            )
        else:
            return model_path
 # TODO: rework
 # pass precision - currently defaulting to fp16
 def _convert_ckpt_and_cache(
    version: BaseModelType,
    model_config: Union[
        StableDiffusion1Model.CheckpointConfig,
        StableDiffusion2Model.CheckpointConfig,
        StableDiffusionXLModel.CheckpointConfig,
    ],
    output_path: str,
    use_save_model: bool = False,
    **kwargs,
 ) -> str:
    """
    Turn a legacy checkpoint into a diffusers model stored at ``output_path``.
    The weights and YAML config named in ``model_config`` are resolved against
    the application config. When ``output_path`` already exists nothing is
    converted. Extra keyword arguments are forwarded to
    ``convert_ckpt_to_diffusers``; ``use_save_model`` is accepted but not read.
    The converted location is returned as a ``Path``.
    """
    app_config = InvokeAIAppConfig.get_config()
    weights = app_config.models_path / model_config.path
    config_file = app_config.root_path / model_config.config
    output_path = Path(output_path)
    if model_config.variant == "inpaint":
        pipeline_class = StableDiffusionInpaintPipeline
    else:
        pipeline_class = StableDiffusionPipeline
    # an earlier conversion is reused as-is
    if output_path.exists():
        return output_path
    # imported here to avoid circular import errors
    from ...util.devices import choose_torch_device, torch_dtype
    from ..convert_ckpt_to_diffusers import convert_ckpt_to_diffusers
    # name handed to the converter as `model_type` for each base model
    converter_type_names = {
        BaseModelType.StableDiffusion1: "FrozenCLIPEmbedder",
        BaseModelType.StableDiffusion2: "FrozenOpenCLIPEmbedder",
        BaseModelType.StableDiffusionXL: "SDXL",
        BaseModelType.StableDiffusionXLRefiner: "SDXL-Refiner",
    }
    logger.info(f"Converting {weights} to diffusers format")
    with SilenceWarnings():
        convert_ckpt_to_diffusers(
            weights,
            output_path,
            model_type=converter_type_names[version],
            model_version=version,
            model_variant=model_config.variant,
            original_config_file=config_file,
            extract_ema=True,
            scan_needed=True,
            pipeline_class=pipeline_class,
            from_safetensors=weights.suffix == ".safetensors",
            precision=torch_dtype(choose_torch_device()),
            **kwargs,
        )
    return output_path
 def _select_ckpt_config(version: BaseModelType, variant: ModelVariantType) -> Optional[str]:
    """
    Pick the legacy YAML config file for a base model / variant pair.
    Returns the file's path as a string -- relative to the application root
    when it lies beneath it -- or ``None`` when no config file is registered
    for the combination.
    """
    ckpt_configs = {
        BaseModelType.StableDiffusion1: {
            ModelVariantType.Normal: "v1-inference.yaml",
            ModelVariantType.Inpaint: "v1-inpainting-inference.yaml",
        },
        BaseModelType.StableDiffusion2: {
            ModelVariantType.Normal: "v2-inference-v.yaml",  # best guess, as we can't differentiate with base(512)
            ModelVariantType.Inpaint: "v2-inpainting-inference.yaml",
            ModelVariantType.Depth: "v2-midas-inference.yaml",
        },
        BaseModelType.StableDiffusionXL: {
            ModelVariantType.Normal: "sd_xl_base.yaml",
            ModelVariantType.Inpaint: None,
            ModelVariantType.Depth: None,
        },
        BaseModelType.StableDiffusionXLRefiner: {
            ModelVariantType.Normal: "sd_xl_refiner.yaml",
            ModelVariantType.Inpaint: None,
            ModelVariantType.Depth: None,
        },
    }
    app_config = InvokeAIAppConfig.get_config()
    # A pair missing from the table and an explicit None entry both mean
    # "no config file"; handle them directly instead of via a blanket except.
    config_name = ckpt_configs.get(version, {}).get(variant)
    if config_name is None:
        return None
    config_path = app_config.legacy_conf_path / config_name
    if config_path.is_relative_to(app_config.root_path):
        config_path = config_path.relative_to(app_config.root_path)
    return str(config_path)
--- a/invokeai/backend/model_management_OLD/models/stable_diffusion_onnx.py
+++ b/invokeai/backend/model_management_OLD/models/stable_diffusion_onnx.py
@ -1,150 +0,0 @@
 from enum import Enum
 from typing import Literal
 from diffusers import OnnxRuntimeModel
 from .base import (
    BaseModelType,
    DiffusersModel,
    IAIOnnxRuntimeModel,
    ModelConfigBase,
    ModelType,
    ModelVariantType,
    SchedulerPredictionType,
    classproperty,
 )
 class StableDiffusionOnnxModelFormat(str, Enum):
    """Format tags for ONNX Stable Diffusion models."""
    # Not returned by either detect_format() in this module (olive detection is still a TODO there).
    Olive = "olive"
    # The value both ONNX model classes' detect_format() currently return.
    Onnx = "onnx"
 class ONNXStableDiffusion1Model(DiffusersModel):
    """ONNX flavour of a Stable Diffusion 1.x model."""
    class Config(ModelConfigBase):
        model_format: Literal[StableDiffusionOnnxModelFormat.Onnx]
        variant: ModelVariantType
    def __init__(self, model_path: str, base_model: BaseModelType, model_type: ModelType):
        """Check the base/type pair, initialise the parent and remap ONNX child types."""
        assert base_model == BaseModelType.StableDiffusion1
        assert model_type == ModelType.ONNX
        super().__init__(
            model_path=model_path,
            base_model=BaseModelType.StableDiffusion1,
            model_type=ModelType.ONNX,
        )
        # every child typed as diffusers' OnnxRuntimeModel is remapped to IAIOnnxRuntimeModel
        onnx_children = [name for name, kind in self.child_types.items() if kind is OnnxRuntimeModel]
        for name in onnx_children:
            self.child_types[name] = IAIOnnxRuntimeModel
        # TODO: check that no optimum models provided
    @classmethod
    def probe_config(cls, path: str, **kwargs):
        """Build the configuration for the model at ``path``.
        The channel count is currently fixed at 4, which maps to the normal variant.
        """
        model_format = cls.detect_format(path)
        in_channels = 4  # TODO:
        variant_by_channels = {
            9: ModelVariantType.Inpaint,
            4: ModelVariantType.Normal,
        }
        if in_channels not in variant_by_channels:
            raise Exception("Unkown stable diffusion 1.* model format")
        return cls.create_config(
            path=path,
            model_format=model_format,
            variant=variant_by_channels[in_channels],
        )
    @classproperty
    def save_to_config(cls) -> bool:
        """Always True for this model class."""
        return True
    @classmethod
    def detect_format(cls, model_path: str):
        """Report the Onnx format for every path."""
        # TODO: Detect onnx vs olive
        return StableDiffusionOnnxModelFormat.Onnx
    @classmethod
    def convert_if_required(
        cls,
        model_path: str,
        output_path: str,
        config: ModelConfigBase,
        base_model: BaseModelType,
    ) -> str:
        """No conversion is performed; ``model_path`` is handed back as-is."""
        return model_path
 class ONNXStableDiffusion2Model(DiffusersModel):
    """ONNX flavour of a Stable Diffusion 2.x model."""
    # TODO: check that configs overwritten properly
    class Config(ModelConfigBase):
        model_format: Literal[StableDiffusionOnnxModelFormat.Onnx]
        variant: ModelVariantType
        prediction_type: SchedulerPredictionType
        upcast_attention: bool
    def __init__(self, model_path: str, base_model: BaseModelType, model_type: ModelType):
        """Check the base/type pair, initialise the parent and remap ONNX child types."""
        assert base_model == BaseModelType.StableDiffusion2
        assert model_type == ModelType.ONNX
        super().__init__(
            model_path=model_path,
            base_model=BaseModelType.StableDiffusion2,
            model_type=ModelType.ONNX,
        )
        # every child typed as diffusers' OnnxRuntimeModel is remapped to IAIOnnxRuntimeModel
        onnx_children = [name for name, kind in self.child_types.items() if kind is OnnxRuntimeModel]
        for name in onnx_children:
            self.child_types[name] = IAIOnnxRuntimeModel
        # TODO: check that no optimum models provided
    @classmethod
    def probe_config(cls, path: str, **kwargs):
        """Build the configuration for the model at ``path``.
        The channel count is currently fixed at 4 (normal variant). The normal
        variant is configured with v-prediction and attention upcasting; any
        other variant with epsilon prediction and no upcasting.
        """
        model_format = cls.detect_format(path)
        in_channels = 4  # TODO:
        variant_by_channels = {
            9: ModelVariantType.Inpaint,
            5: ModelVariantType.Depth,
            4: ModelVariantType.Normal,
        }
        if in_channels not in variant_by_channels:
            raise Exception("Unkown stable diffusion 2.* model format")
        variant = variant_by_channels[in_channels]
        is_normal = variant == ModelVariantType.Normal
        prediction_type = SchedulerPredictionType.VPrediction if is_normal else SchedulerPredictionType.Epsilon
        upcast_attention = True if is_normal else False
        return cls.create_config(
            path=path,
            model_format=model_format,
            variant=variant,
            prediction_type=prediction_type,
            upcast_attention=upcast_attention,
        )
    @classproperty
    def save_to_config(cls) -> bool:
        """Always True for this model class."""
        return True
    @classmethod
    def detect_format(cls, model_path: str):
        """Report the Onnx format for every path."""
        # TODO: Detect onnx vs olive
        return StableDiffusionOnnxModelFormat.Onnx
    @classmethod
    def convert_if_required(
        cls,
        model_path: str,
        output_path: str,
        config: ModelConfigBase,
        base_model: BaseModelType,
    ) -> str:
        """No conversion is performed; ``model_path`` is handed back as-is."""
        return model_path
--- a/invokeai/backend/model_management_OLD/models/t2i_adapter.py
+++ b/invokeai/backend/model_management_OLD/models/t2i_adapter.py
@ -1,102 +0,0 @@
 import os
 from enum import Enum
 from typing import Literal, Optional
 import torch
 from diffusers import T2IAdapter
 from invokeai.backend.model_management.models.base import (
    BaseModelType,
    EmptyConfigLoader,
    InvalidModelException,
    ModelBase,
    ModelConfigBase,
    ModelNotFoundException,
    ModelType,
    SubModelType,
    calc_model_size_by_data,
    calc_model_size_by_fs,
    classproperty,
 )
 class T2IAdapterModelFormat(str, Enum):
    """Storage formats distinguished for T2I-Adapter models (only one is defined)."""
    # Reported by T2IAdapterModel.detect_format() for a directory holding config.json.
    Diffusers = "diffusers"
 class T2IAdapterModel(ModelBase):
    """T2I-Adapter model stored as a diffusers folder."""
    class DiffusersConfig(ModelConfigBase):
        model_format: Literal[T2IAdapterModelFormat.Diffusers]
    def __init__(self, model_path: str, base_model: BaseModelType, model_type: ModelType):
        """Read ``config.json`` to resolve the model class and estimate the size on disk.
        Raises:
            InvalidModelException: ``_class_name`` in the config is not "T2IAdapter".
        """
        assert model_type == ModelType.T2IAdapter
        super().__init__(model_path, base_model, model_type)
        config = EmptyConfigLoader.load_config(self.model_path, config_name="config.json")
        model_class_name = config.get("_class_name", None)
        if model_class_name not in {"T2IAdapter"}:
            raise InvalidModelException(f"Invalid T2I-Adapter model. Unknown _class_name: '{model_class_name}'.")
        self.model_class = self._hf_definition_to_type(["diffusers", model_class_name])
        self.model_size = calc_model_size_by_fs(self.model_path)
    def get_size(self, child_type: Optional[SubModelType] = None):
        """Return the current size estimate; child models are not supported."""
        if child_type is not None:
            raise ValueError(f"T2I-Adapters do not have child models. Invalid child type: '{child_type}'.")
        return self.model_size
    def get_model(
        self,
        torch_dtype: Optional[torch.dtype],
        child_type: Optional[SubModelType] = None,
    ) -> T2IAdapter:
        """Load the adapter, trying the "fp16" weights variant before the default one.
        Raises:
            ValueError: ``child_type`` was given.
            ModelNotFoundException: neither variant could be loaded; the last
                load error is attached as the exception's cause.
        """
        if child_type is not None:
            raise ValueError(f"T2I-Adapters do not have child models. Invalid child type: '{child_type}'.")
        model = None
        last_error = None
        for variant in ["fp16", None]:
            try:
                model = self.model_class.from_pretrained(
                    self.model_path,
                    torch_dtype=torch_dtype,
                    variant=variant,
                )
                break
            except Exception as err:
                # keep trying the next variant, but remember why this one failed
                last_error = err
        if model is None:
            raise ModelNotFoundException(
                f"Unable to load T2I-Adapter model from '{self.model_path}'."
            ) from last_error
        # Calculate a more accurate size after loading the model into memory.
        self.model_size = calc_model_size_by_data(model)
        return model
    @classproperty
    def save_to_config(cls) -> bool:
        """Always False for this model class."""
        return False
    @classmethod
    def detect_format(cls, path: str):
        """Report Diffusers for a directory containing ``config.json``.
        Raises:
            ModelNotFoundException: the path does not exist.
            InvalidModelException: the path has any other layout.
        """
        if not os.path.exists(path):
            raise ModelNotFoundException(f"Model not found at '{path}'.")
        if os.path.isdir(path):
            if os.path.exists(os.path.join(path, "config.json")):
                return T2IAdapterModelFormat.Diffusers
        raise InvalidModelException(f"Unsupported T2I-Adapter format: '{path}'.")
    @classmethod
    def convert_if_required(
        cls,
        model_path: str,
        output_path: str,
        config: ModelConfigBase,
        base_model: BaseModelType,
    ) -> str:
        """Return ``model_path`` for a diffusers model; no conversion exists for other formats."""
        # local name avoids shadowing the builtin `format`
        model_format = cls.detect_format(model_path)
        if model_format == T2IAdapterModelFormat.Diffusers:
            return model_path
        else:
            raise ValueError(f"Unsupported format: '{model_format}'.")
--- a/invokeai/backend/model_management_OLD/models/textual_inversion.py
+++ b/invokeai/backend/model_management_OLD/models/textual_inversion.py
@ -1,87 +0,0 @@
 import os
 from typing import Optional
 import torch
 # TODO: naming
 from ..lora import TextualInversionModel as TextualInversionModelRaw
 from .base import (
    BaseModelType,
    InvalidModelException,
    ModelBase,
    ModelConfigBase,
    ModelNotFoundException,
    ModelType,
    SubModelType,
    classproperty,
 )
 class TextualInversionModel(ModelBase):
    """Textual-inversion embedding kept as a single file or a folder with ``learned_embeds.bin``."""
    # model_size: int
    class Config(ModelConfigBase):
        model_format: None
    def __init__(self, model_path: str, base_model: BaseModelType, model_type: ModelType):
        """Initialise the parent and take a first size estimate from the filesystem."""
        assert model_type == ModelType.TextualInversion
        super().__init__(model_path, base_model, model_type)
        self.model_size = os.path.getsize(self.model_path)
    def get_size(self, child_type: Optional[SubModelType] = None):
        """Return the current size estimate; child models are not supported."""
        if child_type is None:
            return self.model_size
        raise Exception("There is no child models in textual inversion")
    def get_model(
        self,
        torch_dtype: Optional[torch.dtype],
        child_type: Optional[SubModelType] = None,
    ):
        """Load the embedding and refresh ``model_size`` from the loaded tensor.
        Raises:
            Exception: ``child_type`` was given.
            ModelNotFoundException: the embedding file does not exist.
        """
        if child_type is not None:
            raise Exception("There is no child models in textual inversion")
        # a folder is expected to hold the weights in learned_embeds.bin
        if os.path.isdir(self.model_path):
            checkpoint_path = os.path.join(self.model_path, "learned_embeds.bin")
        else:
            checkpoint_path = self.model_path
        if not os.path.exists(checkpoint_path):
            raise ModelNotFoundException()
        model = TextualInversionModelRaw.from_checkpoint(
            file_path=checkpoint_path,
            dtype=torch_dtype,
        )
        element_count = model.embedding.nelement()
        bytes_per_element = model.embedding.element_size()
        self.model_size = element_count * bytes_per_element
        return model
    @classproperty
    def save_to_config(cls) -> bool:
        """Always False for this model class."""
        return False
    @classmethod
    def detect_format(cls, path: str):
        """Validate ``path`` as a textual inversion; the format itself is always ``None``.
        Raises:
            ModelNotFoundException: the path does not exist.
            InvalidModelException: the path is neither a folder containing
                ``learned_embeds.bin`` nor a .safetensors/.ckpt/.pt/.bin file.
        """
        if not os.path.exists(path):
            raise ModelNotFoundException()
        if os.path.isdir(path) and os.path.exists(os.path.join(path, "learned_embeds.bin")):
            return None  # diffusers-ti
        if os.path.isfile(path) and path.endswith((".safetensors", ".ckpt", ".pt", ".bin")):
            return None
        raise InvalidModelException(f"Not a valid model: {path}")
    @classmethod
    def convert_if_required(
        cls,
        model_path: str,
        output_path: str,
        config: ModelConfigBase,
        base_model: BaseModelType,
    ) -> str:
        """No conversion is performed; ``model_path`` is handed back as-is."""
        return model_path
--- a/invokeai/backend/model_management_OLD/models/vae.py
+++ b/invokeai/backend/model_management_OLD/models/vae.py
@ -1,179 +0,0 @@
 import os
 from enum import Enum
 from pathlib import Path
 from typing import Optional
 import safetensors
 import torch
 from omegaconf import OmegaConf
 from invokeai.app.services.config import InvokeAIAppConfig
 from .base import (
    BaseModelType,
    EmptyConfigLoader,
    InvalidModelException,
    ModelBase,
    ModelConfigBase,
    ModelNotFoundException,
    ModelType,
    ModelVariantType,
    SubModelType,
    calc_model_size_by_data,
    calc_model_size_by_fs,
    classproperty,
 )
 class VaeModelFormat(str, Enum):
    """Storage formats distinguished for standalone VAE models."""
    # Reported by VaeModel.detect_format() for a .safetensors/.ckpt/.pt file.
    Checkpoint = "checkpoint"
    # Reported by VaeModel.detect_format() for a directory holding config.json.
    Diffusers = "diffusers"
 class VaeModel(ModelBase):
    """Standalone VAE kept as a diffusers folder or a single checkpoint file."""
    # vae_class: Type
    # model_size: int
    class Config(ModelConfigBase):
        model_format: VaeModelFormat
    def __init__(self, model_path: str, base_model: BaseModelType, model_type: ModelType):
        """Read ``config.json`` to resolve the VAE class and estimate the size on disk.
        Raises:
            Exception: the config cannot be loaded, or the class / size lookup fails.
        """
        assert model_type == ModelType.Vae
        super().__init__(model_path, base_model, model_type)
        try:
            vae_config = EmptyConfigLoader.load_config(self.model_path, config_name="config.json")
        except Exception:
            raise Exception("Invalid vae model! (config.json not found or invalid)")
        try:
            # a config without _class_name is treated as AutoencoderKL
            class_name = vae_config.get("_class_name", "AutoencoderKL")
            self.vae_class = self._hf_definition_to_type(["diffusers", class_name])
            self.model_size = calc_model_size_by_fs(self.model_path)
        except Exception:
            raise Exception("Invalid vae model! (Unkown vae type)")
    def get_size(self, child_type: Optional[SubModelType] = None):
        """Return the current size estimate; child models are not supported."""
        if child_type is None:
            return self.model_size
        raise Exception("There is no child models in vae model")
    def get_model(
        self,
        torch_dtype: Optional[torch.dtype],
        child_type: Optional[SubModelType] = None,
    ):
        """Load the VAE with ``from_pretrained`` and refresh ``model_size`` from the loaded model."""
        if child_type is not None:
            raise Exception("There is no child models in vae model")
        loaded = self.vae_class.from_pretrained(
            self.model_path,
            torch_dtype=torch_dtype,
        )
        # the in-memory figure replaces the filesystem estimate
        self.model_size = calc_model_size_by_data(loaded)
        return loaded
    @classproperty
    def save_to_config(cls) -> bool:
        """Always False for this model class."""
        return False
    @classmethod
    def detect_format(cls, path: str):
        """Classify ``path`` as a diffusers folder or a checkpoint file.
        Raises:
            ModelNotFoundException: the path does not exist.
            InvalidModelException: the path is neither a folder containing
                ``config.json`` nor a .safetensors/.ckpt/.pt file.
        """
        if not os.path.exists(path):
            raise ModelNotFoundException(f"Does not exist as local file: {path}")
        if os.path.isdir(path) and os.path.exists(os.path.join(path, "config.json")):
            return VaeModelFormat.Diffusers
        if os.path.isfile(path) and path.endswith((".safetensors", ".ckpt", ".pt")):
            return VaeModelFormat.Checkpoint
        raise InvalidModelException(f"Not a valid model: {path}")
    @classmethod
    def convert_if_required(
        cls,
        model_path: str,
        output_path: str,
        config: ModelConfigBase,  # empty config or config of parent model
        base_model: BaseModelType,
    ) -> str:
        """Convert a checkpoint VAE into ``output_path``; any other format returns ``model_path``."""
        if cls.detect_format(model_path) != VaeModelFormat.Checkpoint:
            return model_path
        return _convert_vae_ckpt_and_cache(
            weights_path=model_path,
            output_path=output_path,
            base_model=base_model,
            model_config=config,
        )
 # TODO: rework
 def _convert_vae_ckpt_and_cache(
    weights_path: str,
    output_path: str,
    base_model: BaseModelType,
    model_config: ModelConfigBase,
 ) -> str:
    """
    Convert a checkpoint VAE into a diffusers AutoencoderKL and cache it on disk.
    The converted model is saved to ``output_path``; when that path already
    exists nothing is converted. Only the Stable Diffusion 1 and 2 bases are
    supported. ``model_config`` is accepted but not read here. The converted
    location is returned as a ``Path``.
    Raises:
        Exception: ``base_model`` is not a supported base.
    """
    app_config = InvokeAIAppConfig.get_config()
    weights_path = app_config.root_dir / weights_path
    output_path = Path(output_path)
    # this size used only in when tiling enabled to separate input in tiles
    # sizes in configs from stable diffusion githubs(1 and 2) set to 256
    # on huggingface it:
    # 1.5 - 512
    # 1.5-inpainting - 256
    # 2-inpainting - 512
    # 2-depth - 256
    # 2-base - 512
    # 2 - 768
    # 2.1-base - 768
    # 2.1 - 768
    image_size = 512
    # return cached version if it exists
    if output_path.exists():
        return output_path
    if base_model in {BaseModelType.StableDiffusion1, BaseModelType.StableDiffusion2}:
        from .stable_diffusion import _select_ckpt_config
        # all sd models use same vae settings
        config_file = _select_ckpt_config(base_model, ModelVariantType.Normal)
    else:
        raise Exception(f"Vae conversion not supported for model type: {base_model}")
    # this avoids circular import error
    from ..convert_ckpt_to_diffusers import convert_ldm_vae_to_diffusers
    if weights_path.suffix == ".safetensors":
        # `import safetensors` alone does not load the `torch` submodule, so
        # import the loader explicitly instead of relying on another module
        # having imported it first.
        from safetensors.torch import load_file
        checkpoint = load_file(weights_path, device="cpu")
    else:
        # NOTE(security): torch.load unpickles the file; only use it on
        # checkpoints from a trusted source.
        checkpoint = torch.load(weights_path, map_location="cpu")
    # sometimes weights are hidden under "state_dict", and sometimes not
    if "state_dict" in checkpoint:
        checkpoint = checkpoint["state_dict"]
    config = OmegaConf.load(app_config.root_path / config_file)
    vae_model = convert_ldm_vae_to_diffusers(
        checkpoint=checkpoint,
        vae_config=config,
        image_size=image_size,
    )
    vae_model.save_pretrained(output_path, safe_serialization=True)
    return output_path
--- a/invokeai/backend/model_management_OLD/seamless.py
+++ b/invokeai/backend/model_management_OLD/seamless.py
@ -1,84 +0,0 @@
 from __future__ import annotations
 from contextlib import contextmanager
 from typing import Callable, List, Union
 import torch.nn as nn
 from diffusers.models.autoencoders.autoencoder_kl import AutoencoderKL
 from diffusers.models.unets.unet_2d_condition import UNet2DConditionModel
 def _conv_forward_asymmetric(self, input, weight, bias):
    """
    Patch for Conv2d._conv_forward that supports asymmetric padding
    """
    working = nn.functional.pad(input, self.asymmetric_padding["x"], mode=self.asymmetric_padding_mode["x"])
    working = nn.functional.pad(working, self.asymmetric_padding["y"], mode=self.asymmetric_padding_mode["y"])
    return nn.functional.conv2d(
        working,
        weight,
        bias,
        self.stride,
        nn.modules.utils._pair(0),
        self.dilation,
        self.groups,
    )
@contextmanager
 def set_seamless(model: Union[UNet2DConditionModel, AutoencoderKL], seamless_axes: List[str]):
    """
    Context manager that temporarily patches the convolution layers of `model`
    so that padding is applied separately per axis.

    For every patched nn.Conv2d / nn.ConvTranspose2d module, the padding mode
    is "circular" on each axis named in `seamless_axes` ("x" and/or "y") and
    "constant" on the other axis. On exit (including on error) the original
    `_conv_forward` of each patched module is restored and the temporary
    `asymmetric_padding*` attributes are removed.

    :param model: The UNet or VAE whose convolution layers are patched
    :param seamless_axes: Axes to pad circularly; membership of "x" and "y" is tested
    """
    # Callable: (input: Tensor, weight: Tensor, bias: Optional[Tensor]) -> Tensor
    # Each entry pairs a patched module with the `_conv_forward` it had before patching.
    to_restore: list[tuple[nn.Conv2d | nn.ConvTranspose2d, Callable]] = []
    try:
        # Hard coded to skip down block layers, allowing for seamless tiling at the expense of prompt adherence
        skipped_layers = 1
        for m_name, m in model.named_modules():
            # Only convolution modules are patched.
            if not isinstance(m, (nn.Conv2d, nn.ConvTranspose2d)):
                continue
            if isinstance(model, UNet2DConditionModel) and m_name.startswith("down_blocks.") and ".resnets." in m_name:
                # down_blocks.1.resnets.1.conv1
                # NOTE: the unpacking below expects exactly five dot-separated parts in the module name.
                _, block_num, _, resnet_num, submodule_name = m_name.split(".")
                block_num = int(block_num)
                resnet_num = int(resnet_num)
                # Leave the last `skipped_layers` down blocks unpatched.
                if block_num >= len(model.down_blocks) - skipped_layers:
                    continue
                # Skip the second resnet (could be configurable)
                if resnet_num > 0:
                    continue
                # Skip the resnet's "conv2" submodule (could be configurable)
                if submodule_name == "conv2":
                    continue
            m.asymmetric_padding_mode = {}
            m.asymmetric_padding = {}
            m.asymmetric_padding_mode["x"] = "circular" if ("x" in seamless_axes) else "constant"
            # x padding: first two entries of the module's padding tuple, nothing on the other axis.
            m.asymmetric_padding["x"] = (
                m._reversed_padding_repeated_twice[0],
                m._reversed_padding_repeated_twice[1],
                0,
                0,
            )
            m.asymmetric_padding_mode["y"] = "circular" if ("y" in seamless_axes) else "constant"
            # y padding: last two entries of the module's padding tuple, nothing on the other axis.
            m.asymmetric_padding["y"] = (
                0,
                0,
                m._reversed_padding_repeated_twice[2],
                m._reversed_padding_repeated_twice[3],
            )
            # Remember the current forward so the `finally` clause can put it back.
            to_restore.append((m, m._conv_forward))
            # Bind the patched forward to this module instance.
            m._conv_forward = _conv_forward_asymmetric.__get__(m, nn.Conv2d)
        yield
    finally:
        # Undo every patch that was applied, even if patching or the caller's body raised.
        for module, orig_conv_forward in to_restore:
            module._conv_forward = orig_conv_forward
            if hasattr(module, "asymmetric_padding_mode"):
                del module.asymmetric_padding_mode
            if hasattr(module, "asymmetric_padding"):
                del module.asymmetric_padding
--- a/invokeai/backend/model_management_OLD/util.py
+++ b/invokeai/backend/model_management_OLD/util.py
@ -1,79 +0,0 @@
 # Copyright (c) 2023 The InvokeAI Development Team
 """Utilities used by the Model Manager"""
 def lora_token_vector_length(checkpoint: dict) -> int:
    """
    Given a checkpoint in memory, return the lora token vector length.

    The checkpoint keys are scanned in iteration order and the scan stops at the
    first recognised key that yields a length. When both ``lora_te1_`` and
    ``lora_te2_`` text-encoder keys are found, the result is the sum of their
    two lengths.

    :param checkpoint: The checkpoint, a mapping of key name to tensor-like
           objects that expose ``.shape``
    :return: The token vector length, or None if no recognised key is present
    """

    def _get_shape_1(key: str, tensor, checkpoint):
        """Return the token vector dimension implied by one entry, or None if the key is not recognised."""
        if "." not in key:
            return None  # wrong key format
        model_key, lora_key = key.split(".", 1)

        # lora/locon, loha (don't worry about hada_t1/hada_t2 as they are used only in 4d shapes)
        # and "diff" weights all carry the length in shape[1]
        if lora_key in ("lora_down.weight", "hada_w1_b", "hada_w2_b", "diff"):
            return tensor.shape[1]

        # lokr (don't worry about lokr_t2 as it is used only in 4d shapes)
        if "lokr_" in lora_key:
            factors = []
            for factor_name in ("lokr_w1", "lokr_w2"):
                # Prefer the full matrix and fall back to its "_b" factor. Both lookups need
                # the "." separator between the model key and the factor name.
                for candidate in (f"{model_key}.{factor_name}", f"{model_key}.{factor_name}_b"):
                    if candidate in checkpoint:
                        factors.append(checkpoint[candidate])
                        break
                else:
                    return None  # unknown format
            return factors[0].shape[1] * factors[1].shape[1]

        # ia3 can be detected only by shape[0] in text encoder
        if lora_key == "weight" and "lora_unet_" not in model_key:
            return tensor.shape[0]

        return None

    token_length = None
    lora_te1_length = None
    lora_te2_length = None
    for key, tensor in checkpoint.items():
        if key.startswith("lora_unet_"):
            # "time_emb_proj.lora_down" recognizes the format at https://civitai.com/models/224641
            if "_attn2_to_k." in key or "_attn2_to_v." in key or "time_emb_proj.lora_down" in key:
                token_length = _get_shape_1(key, tensor, checkpoint)
        elif key.startswith("lora_te") and "_self_attn_" in key:
            tmp_length = _get_shape_1(key, tensor, checkpoint)
            if key.startswith("lora_te_"):
                token_length = tmp_length
            elif key.startswith("lora_te1_"):
                lora_te1_length = tmp_length
            elif key.startswith("lora_te2_"):
                lora_te2_length = tmp_length

        # Two separate text encoders: the total length is the sum of both.
        if lora_te1_length is not None and lora_te2_length is not None:
            token_length = lora_te1_length + lora_te2_length

        if token_length is not None:
            break

    return token_length
--- a/invokeai/backend/model_manager/init.py
+++ b/invokeai/backend/model_manager/init.py
@ -1,5 +1,4 @@
 """Re-export frequently-used symbols from the Model Manager backend."""
 from .config import (
    AnyModel,
    AnyModelConfig,
@ -33,3 +32,42 @@ __all__ = [
    "SchedulerPredictionType",
    "SubModelType",
 ]
 ########## to help populate the openapi_schema with format enums for each config ###########
 # This code is no longer necessary?
 # leave it here just in case
 #
 # import inspect
 # from enum import Enum
 # from typing import Any, Iterable, Dict, get_args, Set
 # def _expand(something: Any) -> Iterable[type]:
 #     if isinstance(something, type):
 #         yield something
 #     else:
 #         for x in get_args(something):
 #             for y in _expand(x):
 #                 yield y
 # def _find_format(cls: type) -> Iterable[Enum]:
 #     if hasattr(inspect, "get_annotations"):
 #         fields = inspect.get_annotations(cls)
 #     else:
 #         fields = cls.__annotations__
 #     if "format" in fields:
 #         for x in get_args(fields["format"]):
 #             yield x
 #     for parent_class in cls.__bases__:
 #         for x in _find_format(parent_class):
 #             yield x
 #     return None
 # def get_model_config_formats() -> Dict[str, Set[Enum]]:
 #     result: Dict[str, Set[Enum]] = {}
 #     for model_config in _expand(AnyModelConfig):
 #         for field in _find_format(model_config):
 #             if field is None:
 #                 continue
 #             if not result.get(model_config.__qualname__):
 #                 result[model_config.__qualname__] = set()
 #             result[model_config.__qualname__].add(field)
 #     return result
--- a/invokeai/backend/model_manager/load/init.py
+++ b/invokeai/backend/model_manager/load/init.py
@ -6,12 +6,22 @@ from importlib import import_module
 from pathlib import Path
 from .convert_cache.convert_cache_default import ModelConvertCache
-from .load_base import AnyModelLoader, LoadedModel
+from .load_base import LoadedModel, ModelLoaderBase
 from .load_default import ModelLoader
 from .model_cache.model_cache_default import ModelCache
 from .model_loader_registry import ModelLoaderRegistry, ModelLoaderRegistryBase
 # This registers the subclasses that implement loaders of specific model types
 # Every "*.py" file in the sibling "model_loaders" directory, except "__init__", is imported
 # by its stem; the imports are performed for their side effects only.
 loaders = [x.stem for x in Path(Path(__file__).parent, "model_loaders").glob("*.py") if x.stem != "__init__"]
 for module in loaders:
    import_module(f"{__package__}.model_loaders.{module}")
-__all__ = ["AnyModelLoader", "LoadedModel", "ModelCache", "ModelConvertCache"]
+__all__ = [
    "LoadedModel",
    "ModelCache",
    "ModelConvertCache",
    "ModelLoaderBase",
    "ModelLoader",
    "ModelLoaderRegistryBase",
    "ModelLoaderRegistry",
 ]
--- a/invokeai/backend/model_manager/load/load_base.py
+++ b/invokeai/backend/model_manager/load/load_base.py
@ -1,37 +1,22 @@
 # Copyright (c) 2024, Lincoln D. Stein and the InvokeAI Development Team
 """
 Base class for model loading in InvokeAI.
 Use like this:
  loader = AnyModelLoader(...)
  loaded_model = loader.get_model('019ab39adfa1840455')
  with loaded_model as model:  # context manager moves model into VRAM
       # do something with loaded_model
 """
 import hashlib
 from abc import ABC, abstractmethod
 from dataclasses import dataclass
 from logging import Logger
 from pathlib import Path
-from typing import Any, Callable, Dict, Optional, Tuple, Type
+from typing import Any, Optional
 from invokeai.app.services.config import InvokeAIAppConfig
 from invokeai.backend.model_manager.config import (
    AnyModel,
    AnyModelConfig,
    BaseModelType,
    ModelConfigBase,
    ModelFormat,
    ModelType,
    SubModelType,
    VaeCheckpointConfig,
    VaeDiffusersConfig,
 )
 from invokeai.backend.model_manager.load.convert_cache.convert_cache_base import ModelConvertCacheBase
 from invokeai.backend.model_manager.load.model_cache.model_cache_base import ModelCacheBase, ModelLockerBase
 from invokeai.backend.util.logging import InvokeAILogger
@dataclass
@ -56,6 +41,14 @@ class LoadedModel:
        return self._locker.model
 # TODO(MM2):
 # Some "intermediary" subclasses in the ModelLoaderBase class hierarchy define methods that their subclasses don't
 # know about. I think the problem may be related to this class being an ABC.
 #
 # For example, GenericDiffusersLoader defines `get_hf_load_class()`, and StableDiffusionDiffusersModel attempts to
 # call it. However, the method is not defined in the ABC, so it is not guaranteed to be implemented.
 class ModelLoaderBase(ABC):
    """Abstract base class for loading models into RAM/VRAM."""
@ -71,7 +64,7 @@ class ModelLoaderBase(ABC):
        pass
    @abstractmethod
-    def load_model(self, model_config: ModelConfigBase, submodel_type: Optional[SubModelType] = None) -> LoadedModel:
+    def load_model(self, model_config: AnyModelConfig, submodel_type: Optional[SubModelType] = None) -> LoadedModel:
        """
        Return a model given its configuration.
@ -90,106 +83,3 @@ class ModelLoaderBase(ABC):
    ) -> int:
        """Return size in bytes of the model, calculated before loading."""
        pass
 # TO DO: Better name?
 class AnyModelLoader:
    """Pick the loader subclass registered for a model's base, type and format, and use it to load the model."""

    # Maps "base-type-format" keys to the loader subclass registered for that combination.
    _registry: Dict[str, Type[ModelLoaderBase]] = {}
    _logger: Logger = InvokeAILogger.get_logger()

    def __init__(
        self,
        app_config: InvokeAIAppConfig,
        logger: Logger,
        ram_cache: ModelCacheBase[AnyModel],
        convert_cache: ModelConvertCacheBase,
    ):
        """Store the dependencies that are handed to each loader implementation."""
        self._app_config = app_config
        self._logger = logger
        self._ram_cache = ram_cache
        self._convert_cache = convert_cache

    @property
    def ram_cache(self) -> ModelCacheBase[AnyModel]:
        """Return the RAM cache used by the loaders."""
        return self._ram_cache

    @property
    def convert_cache(self) -> ModelConvertCacheBase:
        """Return the convert cache used by the loaders."""
        return self._convert_cache

    def load_model(self, model_config: ModelConfigBase, submodel_type: Optional[SubModelType] = None) -> LoadedModel:
        """
        Return a model given its configuration.

        :param model_config: configuration record of the model to load
        :param submodel_type: a SubModelType enum indicating the portion of
               the model to retrieve (e.g. SubModelType.Vae)
        """
        loader_class, model_config, submodel_type = self.__class__.get_implementation(model_config, submodel_type)
        loader = loader_class(
            app_config=self._app_config,
            logger=self._logger,
            ram_cache=self._ram_cache,
            convert_cache=self._convert_cache,
        )
        return loader.load_model(model_config, submodel_type)

    @staticmethod
    def _to_registry_key(base: BaseModelType, type: ModelType, format: ModelFormat) -> str:
        """Build the registry key "<base>-<type>-<format>" from the enum values."""
        parts = (base.value, type.value, format.value)
        return "-".join(parts)

    @classmethod
    def get_implementation(
        cls, config: ModelConfigBase, submodel_type: Optional[SubModelType]
    ) -> Tuple[Type[ModelLoaderBase], ModelConfigBase, Optional[SubModelType]]:
        """
        Get subclass of ModelLoaderBase registered to handle base and type.

        A loader registered for the config's specific base is preferred; otherwise the
        loader registered under the wildcard base ``BaseModelType.Any`` is used.
        """
        # VAE overrides are resolved first because they change the model type and
        # therefore the implementation that must be returned.
        resolved_config, submodel_type = cls._handle_subtype_overrides(config, submodel_type)

        specific_key = cls._to_registry_key(resolved_config.base, resolved_config.type, resolved_config.format)
        wildcard_key = cls._to_registry_key(BaseModelType.Any, resolved_config.type, resolved_config.format)
        implementation = cls._registry.get(specific_key) or cls._registry.get(wildcard_key)
        if implementation:
            return implementation, resolved_config, submodel_type

        raise NotImplementedError(
            f"No subclass of LoadedModel is registered for base={config.base}, type={config.type}, format={config.format}"
        )

    @classmethod
    def _handle_subtype_overrides(
        cls, config: ModelConfigBase, submodel_type: Optional[SubModelType]
    ) -> Tuple[ModelConfigBase, Optional[SubModelType]]:
        """
        Swap in a standalone VAE config when the VAE submodel is requested and the config names one.

        In that case the returned submodel type is None; otherwise both arguments are returned unchanged.
        """
        if submodel_type != SubModelType.Vae or getattr(config, "vae", None) is None:
            return config, submodel_type

        vae_path = Path(config.vae)
        if vae_path.suffix in [".pt", ".safetensors", ".ckpt"]:
            config_class = VaeCheckpointConfig
        else:
            config_class = VaeDiffusersConfig
        # The key of the synthesized config is the md5 digest of the VAE's posix path.
        path_digest = hashlib.md5(vae_path.as_posix().encode("utf-8")).hexdigest()
        vae_config = config_class(path=vae_path.as_posix(), name=vae_path.stem, base=config.base, key=path_digest)
        return vae_config, None

    @classmethod
    def register(
        cls, type: ModelType, format: ModelFormat, base: BaseModelType = BaseModelType.Any
    ) -> Callable[[Type[ModelLoaderBase]], Type[ModelLoaderBase]]:
        """Define a decorator which registers the subclass of loader."""

        def decorator(subclass: Type[ModelLoaderBase]) -> Type[ModelLoaderBase]:
            cls._logger.debug(f"Registering class {subclass.__name__} to load models of type {base}/{type}/{format}")
            registry_key = cls._to_registry_key(base, type, format)
            # Refuse to silently replace a loader that already claimed this combination.
            if registry_key in cls._registry:
                raise Exception(
                    f"{subclass.__name__} is trying to register as a loader for {base}/{type}/{format}, but this type of model has already been registered by {cls._registry[registry_key].__name__}"
                )
            cls._registry[registry_key] = subclass
            return subclass

        return decorator
--- a/invokeai/backend/model_manager/load/load_default.py
+++ b/invokeai/backend/model_manager/load/load_default.py
@ -1,13 +1,9 @@
 # Copyright (c) 2024, Lincoln D. Stein and the InvokeAI Development Team
 """Default implementation of model loading in InvokeAI."""
 import sys
 from logging import Logger
 from pathlib import Path
-from typing import Any, Dict, Optional, Tuple
+from typing import Optional, Tuple
 from diffusers import ModelMixin
 from diffusers.configuration_utils import ConfigMixin
 from invokeai.app.services.config import InvokeAIAppConfig
 from invokeai.backend.model_manager import (
@ -25,17 +21,6 @@ from invokeai.backend.model_manager.load.optimizations import skip_torch_weight_
 from invokeai.backend.util.devices import choose_torch_device, torch_dtype
 class ConfigLoader(ConfigMixin):
    """ConfigMixin subclass used to read a diffusers configuration file by name."""

    @classmethod
    def load_config(cls, *args: Any, **kwargs: Any) -> Dict[str, Any]:
        """
        Load a diffusers ConfigMixin configuration.

        The required ``config_name`` keyword is removed from ``kwargs`` and stored on the
        class before the remaining arguments are forwarded to the parent ``load_config``.
        """
        requested_name = kwargs.pop("config_name")
        cls.config_name = requested_name
        # Diffusers doesn't provide typing info
        loaded_config: Dict[str, Any] = super().load_config(*args, **kwargs)  # type: ignore
        return loaded_config
 # TO DO: The loader is not thread safe!
 class ModelLoader(ModelLoaderBase):
    """Default implementation of ModelLoaderBase."""
@ -137,43 +122,6 @@ class ModelLoader(ModelLoaderBase):
            variant=config.repo_variant if hasattr(config, "repo_variant") else None,
        )
    def _load_diffusers_config(self, model_path: Path, config_name: str = "config.json") -> Dict[str, Any]:
        """Read the configuration file `config_name` for the model at `model_path` via ConfigLoader."""
        config_dict: Dict[str, Any] = ConfigLoader.load_config(model_path, config_name=config_name)
        return config_dict
    # TO DO: Add exception handling
    def _hf_definition_to_type(self, module: str, class_name: str) -> ModelMixin:  # fix with correct type
        """
        Look up `class_name` in an already-imported module and return the attribute found.

        "diffusers" and "transformers" are searched directly; any other module name is
        looked up in ``diffusers.pipelines`` instead.
        """
        top_level_packages = ["diffusers", "transformers"]
        namespace = sys.modules[module] if module in top_level_packages else sys.modules["diffusers"].pipelines
        resolved: ModelMixin = getattr(namespace, class_name)
        return resolved
    # TO DO: Add exception handling
    def _get_hf_load_class(self, model_path: Path, submodel_type: Optional[SubModelType] = None) -> ModelMixin:
        """
        Return the class needed to load the model (or one of its submodels) at `model_path`.

        With a submodel type, the class is taken from the submodel's entry in model_index.json.
        Without one, it is taken from "_class_name" in config.json, or from the first entry of
        "architectures" when the config's model_type is "clip_vision_model".

        :raises InvalidModelConfigException: when a KeyError occurs during the lookup, or when
                config.json names no class
        """
        if not submodel_type:
            try:
                config = self._load_diffusers_config(model_path, config_name="config.json")
                class_name = config.get("_class_name")
                if class_name:
                    return self._hf_definition_to_type(module="diffusers", class_name=class_name)
                if config.get("model_type") == "clip_vision_model":
                    class_name = config.get("architectures")[0]
                    return self._hf_definition_to_type(module="transformers", class_name=class_name)
                # Reaching this point means no class name could be found in the config.
                raise InvalidModelConfigException("Unable to decifer Load Class based on given config.json")
            except KeyError as e:
                raise InvalidModelConfigException("An expected config.json file is missing from this model.") from e

        try:
            config = self._load_diffusers_config(model_path, config_name="model_index.json")
            module, class_name = config[submodel_type.value]
            return self._hf_definition_to_type(module=module, class_name=class_name)
        except KeyError as e:
            raise InvalidModelConfigException(
                f'The "{submodel_type}" submodel is not available for this model.'
            ) from e
    # This needs to be implemented in subclasses that handle checkpoints
    def _convert_model(self, config: AnyModelConfig, model_path: Path, output_path: Path) -> Path:
        """
        Placeholder that always raises NotImplementedError in this class.

        Per the comment above, subclasses that handle checkpoints are expected to override it.
        """
        raise NotImplementedError
--- a/invokeai/backend/model_manager/load/memory_snapshot.py
+++ b/invokeai/backend/model_manager/load/memory_snapshot.py
@ -55,7 +55,7 @@ class MemorySnapshot:
            vram = None
        try:
-            malloc_info = LibcUtil().mallinfo2()  # type: ignore
+            malloc_info = LibcUtil().mallinfo2()
        except (OSError, AttributeError):
            # OSError: This is expected in environments that do not have the 'libc.so.6' shared library.
            # AttributeError: This is expected in environments that have `libc.so.6` but do not have the `mallinfo2` (e.g. glibc < 2.33)
--- a/invokeai/backend/model_manager/load/model_loader_registry.py
+++ b/invokeai/backend/model_manager/load/model_loader_registry.py
@ -0,0 +1,122 @@
 # Copyright (c) 2024 Lincoln D. Stein and the InvokeAI Development team
 """
 This module implements a system in which model loaders register the
 type, base and format of models that they know how to load.
 Use like this:
  cls, model_config, submodel_type = ModelLoaderRegistry.get_implementation(model_config, submodel_type)  # type: ignore
  loaded_model = cls(
       app_config=app_config,
       logger=logger,
       ram_cache=ram_cache,
       convert_cache=convert_cache
    ).load_model(model_config, submodel_type)
 """
 import hashlib
 from abc import ABC, abstractmethod
 from pathlib import Path
 from typing import Callable, Dict, Optional, Tuple, Type
 from ..config import (
    AnyModelConfig,
    BaseModelType,
    ModelConfigBase,
    ModelFormat,
    ModelType,
    SubModelType,
    VaeCheckpointConfig,
    VaeDiffusersConfig,
 )
 from . import ModelLoaderBase
 class ModelLoaderRegistryBase(ABC):
    """Abstract interface through which model loaders register the type, base and format they handle."""
    @classmethod
    @abstractmethod
    def register(
        cls, type: ModelType, format: ModelFormat, base: BaseModelType = BaseModelType.Any
    ) -> Callable[[Type[ModelLoaderBase]], Type[ModelLoaderBase]]:
        """
        Define a decorator which registers a loader subclass.

        :param type: Model type the decorated loader handles
        :param format: Model format the decorated loader handles
        :param base: Base model the decorated loader handles (defaults to BaseModelType.Any)
        :return: A decorator that takes a ModelLoaderBase subclass and returns a ModelLoaderBase subclass
        """
    @classmethod
    @abstractmethod
    def get_implementation(
        cls, config: AnyModelConfig, submodel_type: Optional[SubModelType]
    ) -> Tuple[Type[ModelLoaderBase], ModelConfigBase, Optional[SubModelType]]:
        """
        Get the subclass of ModelLoaderBase registered to handle the config's base, type and format.

        :param config: Model configuration record, as returned by ModelRecordService
        :param submodel_type: Submodel to fetch (main models only)
        :return: tuple(loader_class, model_config, submodel_type)

        Note that the returned model config may be different from the one that was
        passed in, in the event that a submodel type is provided.
        """
 class ModelLoaderRegistry(ModelLoaderRegistryBase):
    """
    This class allows model loaders to register their type, base and format.

    It is the concrete implementation of ModelLoaderRegistryBase. The registry is kept
    at class level, so every registration is shared by all users of this class.
    """

    # Maps "base-type-format" keys to the loader subclass registered for that combination.
    _registry: Dict[str, Type[ModelLoaderBase]] = {}

    @classmethod
    def register(
        cls, type: ModelType, format: ModelFormat, base: BaseModelType = BaseModelType.Any
    ) -> Callable[[Type[ModelLoaderBase]], Type[ModelLoaderBase]]:
        """
        Define a decorator which registers the subclass of loader.

        :param type: Model type the decorated loader handles
        :param format: Model format the decorated loader handles
        :param base: Base model the decorated loader handles (defaults to BaseModelType.Any)
        :raises Exception: if another loader is already registered for the same combination
        """

        def decorator(subclass: Type[ModelLoaderBase]) -> Type[ModelLoaderBase]:
            key = cls._to_registry_key(base, type, format)
            # Refuse to silently replace a loader that already claimed this combination.
            if key in cls._registry:
                raise Exception(
                    f"{subclass.__name__} is trying to register as a loader for {base}/{type}/{format}, but this type of model has already been registered by {cls._registry[key].__name__}"
                )
            cls._registry[key] = subclass
            return subclass

        return decorator

    @classmethod
    def get_implementation(
        cls, config: AnyModelConfig, submodel_type: Optional[SubModelType]
    ) -> Tuple[Type[ModelLoaderBase], ModelConfigBase, Optional[SubModelType]]:
        """
        Get subclass of ModelLoaderBase registered to handle base and type.

        A loader registered for the config's specific base is preferred; otherwise the
        loader registered under the wildcard base ``BaseModelType.Any`` is used.

        :param config: Model configuration record
        :param submodel_type: Submodel to fetch, if any
        :return: tuple(loader_class, model_config, submodel_type); the config and submodel
                 type may differ from the arguments when a VAE override applies
        :raises NotImplementedError: if no loader is registered for the resolved config
        """
        # We have to handle VAE overrides here because this will change the model type and the corresponding implementation returned
        resolved_config, submodel_type = cls._handle_subtype_overrides(config, submodel_type)

        specific_key = cls._to_registry_key(resolved_config.base, resolved_config.type, resolved_config.format)
        wildcard_key = cls._to_registry_key(BaseModelType.Any, resolved_config.type, resolved_config.format)
        implementation = cls._registry.get(specific_key) or cls._registry.get(wildcard_key)
        if not implementation:
            # Report the config that was actually looked up, which may be the VAE override.
            raise NotImplementedError(
                f"No subclass of ModelLoaderBase is registered for base={resolved_config.base}, type={resolved_config.type}, format={resolved_config.format}"
            )
        return implementation, resolved_config, submodel_type

    @classmethod
    def _handle_subtype_overrides(
        cls, config: AnyModelConfig, submodel_type: Optional[SubModelType]
    ) -> Tuple[ModelConfigBase, Optional[SubModelType]]:
        """
        Swap in a standalone VAE config when the VAE submodel is requested and the config names one.

        In that case the returned submodel type is None; otherwise both arguments are returned unchanged.
        """
        if submodel_type != SubModelType.Vae or getattr(config, "vae", None) is None:
            return config, submodel_type

        model_path = Path(config.vae)
        config_class = (
            VaeCheckpointConfig if model_path.suffix in [".pt", ".safetensors", ".ckpt"] else VaeDiffusersConfig
        )
        # The key of the synthesized config is the md5 digest of the VAE's posix path.
        path_digest = hashlib.md5(model_path.as_posix().encode("utf-8")).hexdigest()
        new_conf = config_class(path=model_path.as_posix(), name=model_path.stem, base=config.base, key=path_digest)
        return new_conf, None

    @staticmethod
    def _to_registry_key(base: BaseModelType, type: ModelType, format: ModelFormat) -> str:
        """Build the registry key "<base>-<type>-<format>" from the enum values."""
        return "-".join([base.value, type.value, format.value])
--- a/invokeai/backend/model_manager/load/model_loaders/controlnet.py
+++ b/invokeai/backend/model_manager/load/model_loaders/controlnet.py
@ -13,13 +13,13 @@ from invokeai.backend.model_manager import (
    ModelType,
 )
 from invokeai.backend.model_manager.convert_ckpt_to_diffusers import convert_controlnet_to_diffusers
 from invokeai.backend.model_manager.load.load_base import AnyModelLoader
 from .. import ModelLoaderRegistry
 from .generic_diffusers import GenericDiffusersLoader
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.ControlNet, format=ModelFormat.Diffusers)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.ControlNet, format=ModelFormat.Diffusers)
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.ControlNet, format=ModelFormat.Checkpoint)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.ControlNet, format=ModelFormat.Checkpoint)
 class ControlnetLoader(GenericDiffusersLoader):
    """Class to load ControlNet models."""
--- a/invokeai/backend/model_manager/load/model_loaders/generic_diffusers.py
+++ b/invokeai/backend/model_manager/load/model_loaders/generic_diffusers.py
@ -1,24 +1,27 @@
 # Copyright (c) 2024, Lincoln D. Stein and the InvokeAI Development Team
 """Class for simple diffusers model loading in InvokeAI."""
 import sys
 from pathlib import Path
-from typing import Optional
+from typing import Any, Dict, Optional
 from diffusers import ConfigMixin, ModelMixin
 from invokeai.backend.model_manager import (
    AnyModel,
    BaseModelType,
    InvalidModelConfigException,
    ModelFormat,
    ModelRepoVariant,
    ModelType,
    SubModelType,
 )
-from ..load_base import AnyModelLoader
+from .. import ModelLoader, ModelLoaderRegistry
 from ..load_default import ModelLoader
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.CLIPVision, format=ModelFormat.Diffusers)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.CLIPVision, format=ModelFormat.Diffusers)
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.T2IAdapter, format=ModelFormat.Diffusers)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.T2IAdapter, format=ModelFormat.Diffusers)
 class GenericDiffusersLoader(ModelLoader):
    """Class to load simple diffusers models."""
@ -28,9 +31,60 @@ class GenericDiffusersLoader(ModelLoader):
        model_variant: Optional[ModelRepoVariant] = None,
        submodel_type: Optional[SubModelType] = None,
    ) -> AnyModel:
-        model_class = self._get_hf_load_class(model_path)
+        model_class = self.get_hf_load_class(model_path)
        if submodel_type is not None:
            raise Exception(f"There are no submodels in models of type {model_class}")
        variant = model_variant.value if model_variant else None
        result: AnyModel = model_class.from_pretrained(model_path, torch_dtype=self._torch_dtype, variant=variant)  # type: ignore
        return result
    # TO DO: Add exception handling
    def get_hf_load_class(self, model_path: Path, submodel_type: Optional[SubModelType] = None) -> ModelMixin:
        """
        Given the model path and submodel, returns the diffusers ModelMixin subclass needed to load.

        With a submodel type, the class is taken from the submodel's entry in model_index.json.
        Without one, it is taken from "_class_name" in config.json; when the config's model_type
        is "clip_vision_model", the first entry of "architectures" is used instead.

        :param model_path: Directory holding the model's configuration file(s)
        :param submodel_type: Submodel whose load class is wanted, if any
        :raises InvalidModelConfigException: when a KeyError occurs during the lookup, when a
                clip_vision_model config lists no architectures, or when config.json names no class
        """
        if submodel_type:
            try:
                config = self._load_diffusers_config(model_path, config_name="model_index.json")
                module, class_name = config[submodel_type.value]
                result = self._hf_definition_to_type(module=module, class_name=class_name)
            except KeyError as e:
                raise InvalidModelConfigException(
                    f'The "{submodel_type}" submodel is not available for this model.'
                ) from e
        else:
            try:
                config = self._load_diffusers_config(model_path, config_name="config.json")
                class_name = config.get("_class_name", None)
                if class_name:
                    result = self._hf_definition_to_type(module="diffusers", class_name=class_name)
                if config.get("model_type", None) == "clip_vision_model":
                    architectures = config.get("architectures")
                    # Validate explicitly: an assert would be stripped under -O, and an empty
                    # list would otherwise surface as a bare IndexError.
                    if not architectures:
                        raise InvalidModelConfigException(
                            'The config.json of this clip_vision_model does not list any "architectures".'
                        )
                    class_name = architectures[0]
                    result = self._hf_definition_to_type(module="transformers", class_name=class_name)
                if not class_name:
                    raise InvalidModelConfigException("Unable to decifer Load Class based on given config.json")
            except KeyError as e:
                raise InvalidModelConfigException("An expected config.json file is missing from this model.") from e
        return result
    # TO DO: Add exception handling
    def _hf_definition_to_type(self, module: str, class_name: str) -> ModelMixin:  # fix with correct type
        """
        Resolve `class_name` to an attribute of an already-imported Hugging Face module.

        The lookup uses the "diffusers" or "transformers" module when `module` names one of
        them, and ``diffusers.pipelines`` for every other module name.
        """
        if module in ["diffusers", "transformers"]:
            search_namespace = sys.modules[module]
        else:
            search_namespace = sys.modules["diffusers"].pipelines
        load_class: ModelMixin = getattr(search_namespace, class_name)
        return load_class
    def _load_diffusers_config(self, model_path: Path, config_name: str = "config.json") -> Dict[str, Any]:
        """Load the configuration file named `config_name` for the model at `model_path` via ConfigLoader."""
        loaded: Dict[str, Any] = ConfigLoader.load_config(model_path, config_name=config_name)
        return loaded
 class ConfigLoader(ConfigMixin):
    """Thin ConfigMixin subclass for loading a named diffusers configuration file."""

    @classmethod
    def load_config(cls, *args: Any, **kwargs: Any) -> Dict[str, Any]:
        """
        Load a diffusers ConfigMixin configuration.

        ``config_name`` must be passed as a keyword. It is popped from ``kwargs`` and assigned
        to the class attribute of the same name before delegating to the parent ``load_config``.
        """
        name_of_config = kwargs.pop("config_name")
        cls.config_name = name_of_config
        # Diffusers doesn't provide typing info
        config_dict: Dict[str, Any] = super().load_config(*args, **kwargs)  # type: ignore
        return config_dict
--- a/invokeai/backend/model_manager/load/model_loaders/ip_adapter.py
+++ b/invokeai/backend/model_manager/load/model_loaders/ip_adapter.py
@ -15,11 +15,10 @@ from invokeai.backend.model_manager import (
    ModelType,
    SubModelType,
 )
-from invokeai.backend.model_manager.load.load_base import AnyModelLoader
+from invokeai.backend.model_manager.load import ModelLoader, ModelLoaderRegistry
 from invokeai.backend.model_manager.load.load_default import ModelLoader
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.IPAdapter, format=ModelFormat.InvokeAI)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.IPAdapter, format=ModelFormat.InvokeAI)
 class IPAdapterInvokeAILoader(ModelLoader):
    """Class to load IP Adapter diffusers models."""
--- a/invokeai/backend/model_manager/load/model_loaders/lora.py
+++ b/invokeai/backend/model_manager/load/model_loaders/lora.py
@ -18,13 +18,13 @@ from invokeai.backend.model_manager import (
    SubModelType,
 )
 from invokeai.backend.model_manager.load.convert_cache import ModelConvertCacheBase
 from invokeai.backend.model_manager.load.load_base import AnyModelLoader
 from invokeai.backend.model_manager.load.load_default import ModelLoader
 from invokeai.backend.model_manager.load.model_cache.model_cache_base import ModelCacheBase
 from .. import ModelLoader, ModelLoaderRegistry
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.Lora, format=ModelFormat.Diffusers)
+
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.Lora, format=ModelFormat.Lycoris)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.Lora, format=ModelFormat.Diffusers)
@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.Lora, format=ModelFormat.Lycoris)
 class LoraLoader(ModelLoader):
    """Class to load LoRA models."""
--- a/invokeai/backend/model_manager/load/model_loaders/onnx.py
+++ b/invokeai/backend/model_manager/load/model_loaders/onnx.py
@ -13,13 +13,14 @@ from invokeai.backend.model_manager import (
    ModelType,
    SubModelType,
 )
-from invokeai.backend.model_manager.load.load_base import AnyModelLoader
+
-from invokeai.backend.model_manager.load.load_default import ModelLoader
+from .. import ModelLoaderRegistry
 from .generic_diffusers import GenericDiffusersLoader
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.ONNX, format=ModelFormat.Onnx)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.ONNX, format=ModelFormat.Onnx)
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.ONNX, format=ModelFormat.Olive)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.ONNX, format=ModelFormat.Olive)
-class OnnyxDiffusersModel(ModelLoader):
+class OnnyxDiffusersModel(GenericDiffusersLoader):
    """Class to load onnx models."""
    def _load_model(
@ -30,7 +31,7 @@ class OnnyxDiffusersModel(ModelLoader):
    ) -> AnyModel:
        if not submodel_type is not None:
            raise Exception("A submodel type must be provided when loading onnx pipelines.")
-        load_class = self._get_hf_load_class(model_path, submodel_type)
+        load_class = self.get_hf_load_class(model_path, submodel_type)
        variant = model_variant.value if model_variant else None
        model_path = model_path / submodel_type.value
        result: AnyModel = load_class.from_pretrained(
--- a/invokeai/backend/model_manager/load/model_loaders/stable_diffusion.py
+++ b/invokeai/backend/model_manager/load/model_loaders/stable_diffusion.py
@ -19,13 +19,14 @@ from invokeai.backend.model_manager import (
 )
 from invokeai.backend.model_manager.config import MainCheckpointConfig
 from invokeai.backend.model_manager.convert_ckpt_to_diffusers import convert_ckpt_to_diffusers
-from invokeai.backend.model_manager.load.load_base import AnyModelLoader
+
-from invokeai.backend.model_manager.load.load_default import ModelLoader
+from .. import ModelLoaderRegistry
 from .generic_diffusers import GenericDiffusersLoader
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.Main, format=ModelFormat.Diffusers)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.Main, format=ModelFormat.Diffusers)
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.Main, format=ModelFormat.Checkpoint)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.Main, format=ModelFormat.Checkpoint)
-class StableDiffusionDiffusersModel(ModelLoader):
+class StableDiffusionDiffusersModel(GenericDiffusersLoader):
    """Class to load main models."""
    model_base_to_model_type = {
@ -43,7 +44,7 @@ class StableDiffusionDiffusersModel(ModelLoader):
    ) -> AnyModel:
        if not submodel_type is not None:
            raise Exception("A submodel type must be provided when loading main pipelines.")
-        load_class = self._get_hf_load_class(model_path, submodel_type)
+        load_class = self.get_hf_load_class(model_path, submodel_type)
        variant = model_variant.value if model_variant else None
        model_path = model_path / submodel_type.value
        result: AnyModel = load_class.from_pretrained(
--- a/invokeai/backend/model_manager/load/model_loaders/textual_inversion.py
+++ b/invokeai/backend/model_manager/load/model_loaders/textual_inversion.py
@ -5,7 +5,6 @@
 from pathlib import Path
 from typing import Optional, Tuple
 from invokeai.backend.textual_inversion import TextualInversionModelRaw
 from invokeai.backend.model_manager import (
    AnyModel,
    AnyModelConfig,
@ -15,12 +14,15 @@ from invokeai.backend.model_manager import (
    ModelType,
    SubModelType,
 )
-from invokeai.backend.model_manager.load.load_base import AnyModelLoader
+from invokeai.backend.textual_inversion import TextualInversionModelRaw
-from invokeai.backend.model_manager.load.load_default import ModelLoader
+
 from .. import ModelLoader, ModelLoaderRegistry
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.TextualInversion, format=ModelFormat.EmbeddingFile)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.TextualInversion, format=ModelFormat.EmbeddingFile)
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.TextualInversion, format=ModelFormat.EmbeddingFolder)
+@ModelLoaderRegistry.register(
    base=BaseModelType.Any, type=ModelType.TextualInversion, format=ModelFormat.EmbeddingFolder
 )
 class TextualInversionLoader(ModelLoader):
    """Class to load TI models."""
--- a/invokeai/backend/model_manager/load/model_loaders/vae.py
+++ b/invokeai/backend/model_manager/load/model_loaders/vae.py
@ -14,14 +14,14 @@ from invokeai.backend.model_manager import (
    ModelType,
 )
 from invokeai.backend.model_manager.convert_ckpt_to_diffusers import convert_ldm_vae_to_diffusers
 from invokeai.backend.model_manager.load.load_base import AnyModelLoader
 from .. import ModelLoaderRegistry
 from .generic_diffusers import GenericDiffusersLoader
-@AnyModelLoader.register(base=BaseModelType.Any, type=ModelType.Vae, format=ModelFormat.Diffusers)
+@ModelLoaderRegistry.register(base=BaseModelType.Any, type=ModelType.Vae, format=ModelFormat.Diffusers)
-@AnyModelLoader.register(base=BaseModelType.StableDiffusion1, type=ModelType.Vae, format=ModelFormat.Checkpoint)
+@ModelLoaderRegistry.register(base=BaseModelType.StableDiffusion1, type=ModelType.Vae, format=ModelFormat.Checkpoint)
-@AnyModelLoader.register(base=BaseModelType.StableDiffusion2, type=ModelType.Vae, format=ModelFormat.Checkpoint)
+@ModelLoaderRegistry.register(base=BaseModelType.StableDiffusion2, type=ModelType.Vae, format=ModelFormat.Checkpoint)
 class VaeLoader(GenericDiffusersLoader):
    """Class to load VAE models."""
--- a/invokeai/backend/model_manager/load/optimizations.py
+++ b/invokeai/backend/model_manager/load/optimizations.py
@ -1,16 +1,16 @@
 from contextlib import contextmanager
 from typing import Any, Generator
 import torch
-def _no_op(*args, **kwargs):
+def _no_op(*args: Any, **kwargs: Any) -> None:
    pass
@contextmanager
-def skip_torch_weight_init():
+def skip_torch_weight_init() -> Generator[None, None, None]:
-    """A context manager that monkey-patches several of the common torch layers (torch.nn.Linear, torch.nn.Conv1d, etc.)
+    """Monkey patch several of the common torch layers (torch.nn.Linear, torch.nn.Conv1d, etc.) to skip weight initialization.
    to skip weight initialization.
    By default, `torch.nn.Linear` and `torch.nn.ConvNd` layers initialize their weights (according to a particular
    distribution) when __init__ is called. This weight initialization step can take a significant amount of time, and is
@ -18,13 +18,14 @@ def skip_torch_weight_init():
    monkey-patches common torch layers to skip the weight initialization step.
    """
    torch_modules = [torch.nn.Linear, torch.nn.modules.conv._ConvNd, torch.nn.Embedding]
-    saved_functions = [m.reset_parameters for m in torch_modules]
+    saved_functions = [hasattr(m, "reset_parameters") and m.reset_parameters for m in torch_modules]
    try:
        for torch_module in torch_modules:
            assert hasattr(torch_module, "reset_parameters")
            torch_module.reset_parameters = _no_op
        yield None
    finally:
        for torch_module, saved_function in zip(torch_modules, saved_functions, strict=True):
            assert hasattr(torch_module, "reset_parameters")
            torch_module.reset_parameters = saved_function
--- a/invokeai/backend/model_manager/merge.py
+++ b/invokeai/backend/model_manager/merge.py
@ -13,7 +13,7 @@ from typing import Any, List, Optional, Set
 import torch
 from diffusers import AutoPipelineForText2Image
-from diffusers import logging as dlogging
+from diffusers.utils import logging as dlogging
 from invokeai.app.services.model_install import ModelInstallServiceBase
 from invokeai.backend.util.devices import choose_torch_device, torch_dtype
@ -76,7 +76,7 @@ class ModelMerger(object):
                custom_pipeline="checkpoint_merger",
                torch_dtype=dtype,
                variant=variant,
-            )
+            )  # type: ignore
            merged_pipe = pipe.merge(
                pretrained_model_name_or_path_list=model_paths,
                alpha=alpha,
--- a/invokeai/backend/model_manager/metadata/metadata_base.py
+++ b/invokeai/backend/model_manager/metadata/metadata_base.py
@ -54,8 +54,8 @@ class LicenseRestrictions(BaseModel):
    AllowDifferentLicense: bool = Field(
        description="if true, derivatives of this model be redistributed under a different license", default=False
    )
-    AllowCommercialUse: CommercialUsage = Field(
+    AllowCommercialUse: Optional[CommercialUsage] = Field(
-        description="Type of commercial use allowed or 'No' if no commercial use is allowed.", default_factory=set
+        description="Type of commercial use allowed or 'No' if no commercial use is allowed.", default=None
    )
@ -139,7 +139,10 @@ class CivitaiMetadata(ModelMetadataWithFiles):
    @property
    def allow_commercial_use(self) -> bool:
        """Return True if commercial use is allowed."""
-        return self.restrictions.AllowCommercialUse != CommercialUsage("None")
+        if self.restrictions.AllowCommercialUse is None:
            return False
        else:
            return self.restrictions.AllowCommercialUse != CommercialUsage("None")
    @property
    def allow_derivatives(self) -> bool:
--- a/invokeai/backend/model_manager/probe.py
+++ b/invokeai/backend/model_manager/probe.py
@ -8,7 +8,6 @@ import torch
 from picklescan.scanner import scan_file_path
 import invokeai.backend.util.logging as logger
 from .util.model_util import lora_token_vector_length, read_checkpoint_meta
 from invokeai.backend.util.util import SilenceWarnings
 from .config import (
@ -23,6 +22,7 @@ from .config import (
    SchedulerPredictionType,
 )
 from .hash import FastModelHash
 from .util.model_util import lora_token_vector_length, read_checkpoint_meta
 CkptType = Dict[str, Any]
@ -53,6 +53,7 @@ LEGACY_CONFIGS: Dict[BaseModelType, Dict[ModelVariantType, Union[str, Dict[Sched
    },
 }
 class ProbeBase(object):
    """Base class for probes."""
--- a/invokeai/backend/model_manager/search.py
+++ b/invokeai/backend/model_manager/search.py
@ -116,9 +116,9 @@ class ModelSearch(ModelSearchBase):
       # returns all models that have 'anime' in the path
    """
-    models_found: Optional[Set[Path]] = Field(default=None)
+    models_found: Set[Path] = Field(default_factory=set)
-    scanned_dirs: Optional[Set[Path]] = Field(default=None)
+    scanned_dirs: Set[Path] = Field(default_factory=set)
-    pruned_paths: Optional[Set[Path]] = Field(default=None)
+    pruned_paths: Set[Path] = Field(default_factory=set)
    def search_started(self) -> None:
        self.models_found = set()
--- a/invokeai/backend/model_manager/util/libc_util.py
+++ b/invokeai/backend/model_manager/util/libc_util.py
@ -35,7 +35,7 @@ class Struct_mallinfo2(ctypes.Structure):
        ("keepcost", ctypes.c_size_t),
    ]
-    def __str__(self):
+    def __str__(self) -> str:
        s = ""
        s += f"{'arena': <10}= {(self.arena/2**30):15.5f}   # Non-mmapped space allocated (GB) (uordblks + fordblks)\n"
        s += f"{'ordblks': <10}= {(self.ordblks): >15}   # Number of free chunks\n"
@ -62,7 +62,7 @@ class LibcUtil:
    TODO: Improve cross-OS compatibility of this class.
    """
-    def __init__(self):
+    def __init__(self) -> None:
        self._libc = ctypes.cdll.LoadLibrary("libc.so.6")
    def mallinfo2(self) -> Struct_mallinfo2:
@ -72,4 +72,5 @@ class LibcUtil:
        """
        mallinfo2 = self._libc.mallinfo2
        mallinfo2.restype = Struct_mallinfo2
-        return mallinfo2()
+        result: Struct_mallinfo2 = mallinfo2()
        return result
--- a/invokeai/backend/model_manager/util/model_util.py
+++ b/invokeai/backend/model_manager/util/model_util.py
@ -1,12 +1,15 @@
 """Utilities for parsing model files, used mostly by probe.py"""
 import json
 import torch
 from typing import Union
 from pathlib import Path
 from typing import Dict, Optional, Union
 import safetensors
 import torch
 from picklescan.scanner import scan_file_path
-def _fast_safetensors_reader(path: str):
+
 def _fast_safetensors_reader(path: str) -> Dict[str, torch.Tensor]:
    checkpoint = {}
    device = torch.device("meta")
    with open(path, "rb") as f:
@ -37,10 +40,12 @@ def _fast_safetensors_reader(path: str):
    return checkpoint
-def read_checkpoint_meta(path: Union[str, Path], scan: bool = False):
+
 def read_checkpoint_meta(path: Union[str, Path], scan: bool = False) -> Dict[str, torch.Tensor]:
    if str(path).endswith(".safetensors"):
        try:
-            checkpoint = _fast_safetensors_reader(path)
+            path_str = path.as_posix() if isinstance(path, Path) else path
            checkpoint = _fast_safetensors_reader(path_str)
        except Exception:
            # TODO: create issue for support "meta"?
            checkpoint = safetensors.torch.load_file(path, device="cpu")
@ -52,14 +57,15 @@ def read_checkpoint_meta(path: Union[str, Path], scan: bool = False):
        checkpoint = torch.load(path, map_location=torch.device("meta"))
    return checkpoint
-def lora_token_vector_length(checkpoint: dict) -> int:
+
 def lora_token_vector_length(checkpoint: Dict[str, torch.Tensor]) -> Optional[int]:
    """
    Given a checkpoint in memory, return the lora token vector length
    :param checkpoint: The checkpoint
    """
-    def _get_shape_1(key: str, tensor, checkpoint) -> int:
+    def _get_shape_1(key: str, tensor: torch.Tensor, checkpoint: Dict[str, torch.Tensor]) -> Optional[int]:
        lora_token_vector_length = None
        if "." not in key:
--- a/invokeai/backend/onnx/onnx_runtime.py
+++ b/invokeai/backend/onnx/onnx_runtime.py
@ -8,6 +8,7 @@ import numpy as np
 import onnx
 from onnx import numpy_helper
 from onnxruntime import InferenceSession, SessionOptions, get_available_providers
 from ..raw_model import RawModel
 ONNX_WEIGHTS_NAME = "model.onnx"
@ -15,7 +16,7 @@ ONNX_WEIGHTS_NAME = "model.onnx"
 # NOTE FROM LS: This was copied from Stalker's original implementation.
 # I have not yet gone through and fixed all the type hints
-class IAIOnnxRuntimeModel:
+class IAIOnnxRuntimeModel(RawModel):
    class _tensor_access:
        def __init__(self, model):  # type: ignore
            self.model = model
--- a/invokeai/backend/raw_model.py
+++ b/invokeai/backend/raw_model.py
@ -10,5 +10,6 @@ The term 'raw' was introduced to describe a wrapper around a torch.nn.Module
 that adds additional methods and attributes.
 """
 class RawModel:
    """Base class for 'Raw' model wrappers."""
--- a/invokeai/backend/stable_diffusion/seamless.py
+++ b/invokeai/backend/stable_diffusion/seamless.py
@ -1,10 +1,11 @@
 from __future__ import annotations
 from contextlib import contextmanager
-from typing import List, Union
+from typing import Callable, List, Union
 import torch.nn as nn
-from diffusers.models import AutoencoderKL, UNet2DConditionModel
+from diffusers.models.autoencoders.autoencoder_kl import AutoencoderKL
 from diffusers.models.unets.unet_2d_condition import UNet2DConditionModel
 def _conv_forward_asymmetric(self, input, weight, bias):
@ -26,70 +27,51 @@ def _conv_forward_asymmetric(self, input, weight, bias):
@contextmanager
 def set_seamless(model: Union[UNet2DConditionModel, AutoencoderKL], seamless_axes: List[str]):
    # Callable: (input: Tensor, weight: Tensor, bias: Optional[Tensor]) -> Tensor
    to_restore: list[tuple[nn.Conv2d | nn.ConvTranspose2d, Callable]] = []
    try:
-        to_restore = []
+        # Hard coded to skip down block layers, allowing for seamless tiling at the expense of prompt adherence
-
+        skipped_layers = 1
        for m_name, m in model.named_modules():
-            if isinstance(model, UNet2DConditionModel):
+            if not isinstance(m, (nn.Conv2d, nn.ConvTranspose2d)):
-                if ".attentions." in m_name:
+                continue
            if isinstance(model, UNet2DConditionModel) and m_name.startswith("down_blocks.") and ".resnets." in m_name:
                # down_blocks.1.resnets.1.conv1
                _, block_num, _, resnet_num, submodule_name = m_name.split(".")
                block_num = int(block_num)
                resnet_num = int(resnet_num)
                if block_num >= len(model.down_blocks) - skipped_layers:
                    continue
-                if ".resnets." in m_name:
+                # Skip the second resnet (could be configurable)
-                    if ".conv2" in m_name:
+                if resnet_num > 0:
                        continue
                    if ".conv_shortcut" in m_name:
                        continue
            """
            if isinstance(model, UNet2DConditionModel):
                if False and ".upsamplers." in m_name:
                    continue
-                if False and ".downsamplers." in m_name:
+                # Skip Conv2d layers (could be configurable)
                if submodule_name == "conv2":
                    continue
-                if True and ".resnets." in m_name:
+            m.asymmetric_padding_mode = {}
-                    if True and ".conv1" in m_name:
+            m.asymmetric_padding = {}
-                        if False and "down_blocks" in m_name:
+            m.asymmetric_padding_mode["x"] = "circular" if ("x" in seamless_axes) else "constant"
-                            continue
+            m.asymmetric_padding["x"] = (
-                        if False and "mid_block" in m_name:
+                m._reversed_padding_repeated_twice[0],
-                            continue
+                m._reversed_padding_repeated_twice[1],
-                        if False and "up_blocks" in m_name:
+                0,
-                            continue
+                0,
            )
            m.asymmetric_padding_mode["y"] = "circular" if ("y" in seamless_axes) else "constant"
            m.asymmetric_padding["y"] = (
                0,
                0,
                m._reversed_padding_repeated_twice[2],
                m._reversed_padding_repeated_twice[3],
            )
-                    if True and ".conv2" in m_name:
+            to_restore.append((m, m._conv_forward))
-                        continue
+            m._conv_forward = _conv_forward_asymmetric.__get__(m, nn.Conv2d)
                    if True and ".conv_shortcut" in m_name:
                        continue
                if True and ".attentions." in m_name:
                    continue
                if False and m_name in ["conv_in", "conv_out"]:
                    continue
            """
            if isinstance(m, (nn.Conv2d, nn.ConvTranspose2d)):
                m.asymmetric_padding_mode = {}
                m.asymmetric_padding = {}
                m.asymmetric_padding_mode["x"] = "circular" if ("x" in seamless_axes) else "constant"
                m.asymmetric_padding["x"] = (
                    m._reversed_padding_repeated_twice[0],
                    m._reversed_padding_repeated_twice[1],
                    0,
                    0,
                )
                m.asymmetric_padding_mode["y"] = "circular" if ("y" in seamless_axes) else "constant"
                m.asymmetric_padding["y"] = (
                    0,
                    0,
                    m._reversed_padding_repeated_twice[2],
                    m._reversed_padding_repeated_twice[3],
                )
                to_restore.append((m, m._conv_forward))
                m._conv_forward = _conv_forward_asymmetric.__get__(m, nn.Conv2d)
        yield
--- a/invokeai/backend/textual_inversion.py
+++ b/invokeai/backend/textual_inversion.py
@ -8,8 +8,10 @@ from compel.embeddings_provider import BaseTextualInversionManager
 from safetensors.torch import load_file
 from transformers import CLIPTokenizer
 from typing_extensions import Self
 from .raw_model import RawModel
 class TextualInversionModelRaw(RawModel):
    embedding: torch.Tensor  # [n, 768]|[n, 1280]
    embedding_2: Optional[torch.Tensor] = None  # [n, 768]|[n, 1280]   - for SDXL models
--- a/invokeai/backend/util/test_utils.py
+++ b/invokeai/backend/util/test_utils.py
@ -42,7 +42,7 @@ def install_and_load_model(
    # If the requested model is already installed, return its LoadedModel
    with contextlib.suppress(UnknownModelException):
        # TODO: Replace with wrapper call
-        loaded_model: LoadedModel = model_manager.load.load_model_by_attr(
+        loaded_model: LoadedModel = model_manager.load_model_by_attr(
            model_name=model_name, base_model=base_model, model_type=model_type
        )
        return loaded_model
@ -53,7 +53,7 @@ def install_and_load_model(
    assert job.complete
    try:
-        loaded_model = model_manager.load.load_model_by_config(job.config_out)
+        loaded_model = model_manager.load_model_by_config(job.config_out)
        return loaded_model
    except UnknownModelException as e:
        raise Exception(
--- a/tests/backend/model_manager/model_loading/test_model_load.py
+++ b/tests/backend/model_manager/model_loading/test_model_load.py
@ -4,18 +4,27 @@ Test model loading
 from pathlib import Path
-from invokeai.app.services.model_install import ModelInstallServiceBase
+from invokeai.app.services.model_manager import ModelManagerServiceBase
 from invokeai.app.services.model_load import ModelLoadServiceBase
 from invokeai.backend.textual_inversion import TextualInversionModelRaw
 from tests.backend.model_manager.model_manager_fixtures import *  # noqa F403
-def test_loading(mm2_installer: ModelInstallServiceBase, mm2_loader: ModelLoadServiceBase, embedding_file: Path):
+
-    store = mm2_installer.record_store
+def test_loading(mm2_model_manager: ModelManagerServiceBase, embedding_file: Path):
    store = mm2_model_manager.store
    matches = store.search_by_attr(model_name="test_embedding")
    assert len(matches) == 0
-    key = mm2_installer.register_path(embedding_file)
+    key = mm2_model_manager.install.register_path(embedding_file)
-    loaded_model = mm2_loader.load_model_by_config(store.get_model(key))
+    loaded_model = mm2_model_manager.load_model_by_config(store.get_model(key))
    assert loaded_model is not None
    assert loaded_model.config.key == key
    with loaded_model as model:
        assert isinstance(model, TextualInversionModelRaw)
    loaded_model_2 = mm2_model_manager.load_model_by_key(key)
    assert loaded_model.config.key == loaded_model_2.config.key
    loaded_model_3 = mm2_model_manager.load_model_by_attr(
        model_name=loaded_model.config.name,
        model_type=loaded_model.config.type,
        base_model=loaded_model.config.base,
    )
    assert loaded_model.config.key == loaded_model_3.config.key
--- a/tests/backend/model_manager/model_manager_fixtures.py
+++ b/tests/backend/model_manager/model_manager_fixtures.py
@ -6,17 +6,17 @@ from pathlib import Path
 from typing import Any, Dict, List
 import pytest
 from pytest import FixtureRequest
 from pydantic import BaseModel
 from pytest import FixtureRequest
 from requests.sessions import Session
 from requests_testadapter import TestAdapter, TestSession
 from invokeai.app.services.config import InvokeAIAppConfig
-from invokeai.app.services.download import DownloadQueueServiceBase, DownloadQueueService
+from invokeai.app.services.download import DownloadQueueService, DownloadQueueServiceBase
 from invokeai.app.services.events.events_base import EventServiceBase
 from invokeai.app.services.model_manager import ModelManagerServiceBase, ModelManagerService
 from invokeai.app.services.model_load import ModelLoadServiceBase, ModelLoadService
 from invokeai.app.services.model_install import ModelInstallService, ModelInstallServiceBase
 from invokeai.app.services.model_load import ModelLoadService, ModelLoadServiceBase
 from invokeai.app.services.model_manager import ModelManagerService, ModelManagerServiceBase
 from invokeai.app.services.model_metadata import ModelMetadataStoreBase, ModelMetadataStoreSQL
 from invokeai.app.services.model_records import ModelRecordServiceBase, ModelRecordServiceSQL
 from invokeai.backend.model_manager.config import (
@ -95,9 +95,7 @@ def mm2_app_config(mm2_root_dir: Path) -> InvokeAIAppConfig:
@pytest.fixture
-def mm2_download_queue(mm2_session: Session,
+def mm2_download_queue(mm2_session: Session, request: FixtureRequest) -> DownloadQueueServiceBase:
                       request: FixtureRequest
                       ) -> DownloadQueueServiceBase:
    download_queue = DownloadQueueService(requests_session=mm2_session)
    download_queue.start()
@ -107,30 +105,34 @@ def mm2_download_queue(mm2_session: Session,
    request.addfinalizer(stop_queue)
    return download_queue
@pytest.fixture
 def mm2_metadata_store(mm2_record_store: ModelRecordServiceSQL) -> ModelMetadataStoreBase:
    return mm2_record_store.metadata_store
@pytest.fixture
 def mm2_loader(mm2_app_config: InvokeAIAppConfig, mm2_record_store: ModelRecordServiceBase) -> ModelLoadServiceBase:
    ram_cache = ModelCache(
        logger=InvokeAILogger.get_logger(),
        max_cache_size=mm2_app_config.ram_cache_size,
-        max_vram_cache_size=mm2_app_config.vram_cache_size
+        max_vram_cache_size=mm2_app_config.vram_cache_size,
    )
    convert_cache = ModelConvertCache(mm2_app_config.models_convert_cache_path)
-    return ModelLoadService(app_config=mm2_app_config,
+    return ModelLoadService(
-                            record_store=mm2_record_store,
+        app_config=mm2_app_config,
-                            ram_cache=ram_cache,
+        ram_cache=ram_cache,
-                            convert_cache=convert_cache,
+        convert_cache=convert_cache,
-                          )
+    )
@pytest.fixture
-def mm2_installer(mm2_app_config: InvokeAIAppConfig,
+def mm2_installer(
-                  mm2_download_queue: DownloadQueueServiceBase,
+    mm2_app_config: InvokeAIAppConfig,
-                  mm2_session: Session,
+    mm2_download_queue: DownloadQueueServiceBase,
-                  request: FixtureRequest,
+    mm2_session: Session,
-                  ) -> ModelInstallServiceBase:
+    request: FixtureRequest,
 ) -> ModelInstallServiceBase:
    logger = InvokeAILogger.get_logger()
    db = create_mock_sqlite_database(mm2_app_config, logger)
    events = DummyEventService()
@ -213,15 +215,13 @@ def mm2_record_store(mm2_app_config: InvokeAIAppConfig) -> ModelRecordServiceBas
    store.add_model("test_config_5", raw5)
    return store
@pytest.fixture
-def mm2_model_manager(mm2_record_store: ModelRecordServiceBase,
+def mm2_model_manager(
-                      mm2_installer: ModelInstallServiceBase,
+    mm2_record_store: ModelRecordServiceBase, mm2_installer: ModelInstallServiceBase, mm2_loader: ModelLoadServiceBase
-                      mm2_loader: ModelLoadServiceBase) -> ModelManagerServiceBase:
+) -> ModelManagerServiceBase:
-    return ModelManagerService(
+    return ModelManagerService(store=mm2_record_store, install=mm2_installer, load=mm2_loader)
-        store=mm2_record_store,
+
        install=mm2_installer,
        load=mm2_loader
    )
@pytest.fixture
 def mm2_session(embedding_file: Path, diffusers_dir: Path) -> Session:
@ -306,5 +306,3 @@ def mm2_session(embedding_file: Path, diffusers_dir: Path) -> Session:
                ),
            )
    return sess
--- a/tests/backend/model_manager/test_lora.py
+++ b/tests/backend/model_manager/test_lora.py
@ -5,8 +5,8 @@
 import pytest
 import torch
 from invokeai.backend.model_patcher import ModelPatcher
 from invokeai.backend.lora import LoRALayer, LoRAModelRaw
 from invokeai.backend.model_patcher import ModelPatcher
@pytest.mark.parametrize(
--- a/tests/backend/model_manager/test_memory_snapshot.py
+++ b/tests/backend/model_manager/test_memory_snapshot.py
@ -1,7 +1,8 @@
 import pytest
 from invokeai.backend.model_manager.util.libc_util import Struct_mallinfo2
 from invokeai.backend.model_manager.load.memory_snapshot import MemorySnapshot, get_pretty_snapshot_diff
 from invokeai.backend.model_manager.util.libc_util import Struct_mallinfo2
 def test_memory_snapshot_capture():
    """Smoke test of MemorySnapshot.capture()."""