Mirror of https://github.com/invoke-ai/InvokeAI, synced 2024-08-30 20:32:17 +00:00
report VRAM usage stats during initial model loading (#419)
This commit is contained in:
parent f6284777e6
commit dd2aedacaf
@@ -501,12 +501,22 @@ class Generate:
     def _load_model_from_config(self, config, ckpt):
         print(f'>> Loading model from {ckpt}')
+
+        # for usage statistics
+        device_type = choose_torch_device()
+        if device_type == 'cuda':
+            torch.cuda.reset_peak_memory_stats()
+        tic = time.time()
+
+        # this does the work
         pl_sd = torch.load(ckpt, map_location='cpu')
         sd = pl_sd['state_dict']
         model = instantiate_from_config(config.model)
         m, u = model.load_state_dict(sd, strict=False)
         model.to(self.device)
         model.eval()

         if self.full_precision:
             print(
                 '>> Using slower but more accurate full-precision math (--full_precision)'
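
The added block uses PyTorch's CUDA memory instrumentation: torch.cuda.reset_peak_memory_stats() zeroes the peak-allocation counter before the load, and torch.cuda.max_memory_allocated() / torch.cuda.memory_allocated() (both in bytes) are read afterwards. A minimal standalone sketch of the same measurement pattern, with a hypothetical tensor workload standing in for model loading (requires a CUDA device):

import time
import torch

if torch.cuda.is_available():
    torch.cuda.reset_peak_memory_stats()  # zero the peak-allocation counter
tic = time.time()

# stand-in workload: allocate and use a large tensor on the GPU
x = torch.randn(4096, 4096, device='cuda')
y = x @ x

toc = time.time()
print('elapsed: %4.2fs' % (toc - tic))
if torch.cuda.is_available():
    # peak bytes allocated since the reset vs. bytes currently held
    print('peak VRAM:    %4.2fG' % (torch.cuda.max_memory_allocated() / 1e9))
    print('current VRAM: %4.2fG' % (torch.cuda.memory_allocated() / 1e9))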
@@ -516,6 +526,20 @@ class Generate:
                 '>> Using half precision math. Call with --full_precision to use more accurate but VRAM-intensive full precision.'
             )
             model.half()
+
+        # usage statistics
+        toc = time.time()
+        print(
+            f'>> Model loaded in', '%4.2fs' % (toc - tic)
+        )
+        if device_type == 'cuda':
+            print(
+                '>> Max VRAM used to load the model:',
+                '%4.2fG' % (torch.cuda.max_memory_allocated() / 1e9),
+                '\n>> Current VRAM usage:'
+                '%4.2fG' % (torch.cuda.memory_allocated() / 1e9),
+            )
+
         return model

     def _load_img(self, path, width, height, fit=False):
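
One subtlety in the added print: the '\n>> Current VRAM usage:' literal and the '%4.2fG' literal on the next line are separated only by a line break, not a comma, so Python concatenates the two adjacent string literals into a single format string before applying %. The output is still correct; the current-usage label and value simply print as one argument instead of two.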
@@ -91,11 +91,7 @@ def main():
         print(">> changed to seamless tiling mode")

     # preload the model
-    tic = time.time()
     t2i.load_model()
-    print(
-        f'>> model loaded in', '%4.2fs' % (time.time() - tic)
-    )

     if not infile:
         print(
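
The second hunk removes the script's own timing code because load_model() (via _load_model_from_config above) now reports both load time and VRAM usage itself. The device_type check in the first hunk depends on a choose_torch_device() helper imported elsewhere in the file; a hypothetical sketch of such a helper, assuming it simply prefers CUDA, then MPS, then CPU (the repository's actual implementation may differ):

import torch

def choose_torch_device() -> str:
    '''Return the best available torch device type (hypothetical sketch).'''
    if torch.cuda.is_available():
        return 'cuda'
    mps = getattr(torch.backends, 'mps', None)  # present in torch >= 1.12
    if mps is not None and mps.is_available():
        return 'mps'
    return 'cpu'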