mirror of
https://github.com/invoke-ai/InvokeAI
synced 2024-08-30 20:32:17 +00:00
fix(mm): remove vram check
This check prematurely reports insufficient VRAM on Windows. See #6106 for details.
This commit is contained in:
parent
540d506ec9
commit
a09d705e4c
@ -269,9 +269,6 @@ class ModelCache(ModelCacheBase[AnyModel]):
|
|||||||
if torch.device(source_device).type == torch.device(target_device).type:
|
if torch.device(source_device).type == torch.device(target_device).type:
|
||||||
return
|
return
|
||||||
|
|
||||||
# may raise an exception here if insufficient GPU VRAM
|
|
||||||
self._check_free_vram(target_device, cache_entry.size)
|
|
||||||
|
|
||||||
start_model_to_time = time.time()
|
start_model_to_time = time.time()
|
||||||
snapshot_before = self._capture_memory_snapshot()
|
snapshot_before = self._capture_memory_snapshot()
|
||||||
cache_entry.model.to(target_device)
|
cache_entry.model.to(target_device)
|
||||||
@ -420,24 +417,3 @@ class ModelCache(ModelCacheBase[AnyModel]):
|
|||||||
mps.empty_cache()
|
mps.empty_cache()
|
||||||
|
|
||||||
self.logger.debug(f"After making room: cached_models={len(self._cached_models)}")
|
self.logger.debug(f"After making room: cached_models={len(self._cached_models)}")
|
||||||
|
|
||||||
def _free_vram(self, device: torch.device) -> int:
|
|
||||||
vram_device = ( # mem_get_info() needs an indexed device
|
|
||||||
device if device.index is not None else torch.device(str(device), index=0)
|
|
||||||
)
|
|
||||||
free_mem, _ = torch.cuda.mem_get_info(vram_device)
|
|
||||||
for _, cache_entry in self._cached_models.items():
|
|
||||||
if cache_entry.loaded and not cache_entry.locked:
|
|
||||||
free_mem += cache_entry.size
|
|
||||||
return free_mem
|
|
||||||
|
|
||||||
def _check_free_vram(self, target_device: torch.device, needed_size: int) -> None:
|
|
||||||
if target_device.type != "cuda":
|
|
||||||
return
|
|
||||||
free_mem = self._free_vram(target_device)
|
|
||||||
if needed_size > free_mem:
|
|
||||||
needed_gb = round(needed_size / GIG, 2)
|
|
||||||
free_gb = round(free_mem / GIG, 2)
|
|
||||||
raise torch.cuda.OutOfMemoryError(
|
|
||||||
f"Insufficient VRAM to load model, requested {needed_gb}GB but only had {free_gb}GB free"
|
|
||||||
)
|
|
||||||
|
Loading…
Reference in New Issue
Block a user