From a4b029d03c952067287a9e5b0ceb2c2a58d18cc0 Mon Sep 17 00:00:00 2001
From: Lincoln Stein
Date: Tue, 15 Aug 2023 18:21:31 -0400
Subject: [PATCH] write RAM usage and change after each generation

---
 invokeai/app/services/invocation_stats.py | 50 ++++++++++++++++-------
 1 file changed, 36 insertions(+), 14 deletions(-)

diff --git a/invokeai/app/services/invocation_stats.py b/invokeai/app/services/invocation_stats.py
index 50320a6611..9d50375c09 100644
--- a/invokeai/app/services/invocation_stats.py
+++ b/invokeai/app/services/invocation_stats.py
@@ -29,6 +29,7 @@ The abstract base class for this class is InvocationStatsServiceBase. An impleme
 writes to the system log is stored in InvocationServices.performance_statistics.
 """
 
+import psutil
 import time
 from abc import ABC, abstractmethod
 from contextlib import AbstractContextManager
@@ -83,13 +84,14 @@ class InvocationStatsServiceBase(ABC):
         pass
 
     @abstractmethod
-    def update_invocation_stats(
-        self,
-        graph_id: str,
-        invocation_type: str,
-        time_used: float,
-        vram_used: float,
-    ):
+    def update_invocation_stats(self,
+                                graph_id: str,
+                                invocation_type: str,
+                                time_used: float,
+                                vram_used: float,
+                                ram_used: float,
+                                ram_changed: float,
+                                ):
         """
         Add timing information on execution of a node. Usually used internally.
 
@@ -97,6 +99,8 @@
         :param invocation_type: String literal type of the node
         :param time_used: Time used by node's execution (sec)
         :param vram_used: Maximum VRAM used during execution (GB)
+        :param ram_used: Current RAM used (GB)
+        :param ram_changed: Change in RAM usage over the course of the run (GB)
         """
         pass
 
@@ -140,18 +144,23 @@
             self.collector = collector
             self.graph_id = graph_id
             self.start_time = 0
+            self.ram_info = None
 
         def __enter__(self):
            self.start_time = time.time()
            if torch.cuda.is_available():
                torch.cuda.reset_peak_memory_stats()
+           self.ram_info = psutil.virtual_memory()
 
        def __exit__(self, *args):
            self.collector.update_invocation_stats(
-                self.graph_id,
-                self.invocation.type,
-                time.time() - self.start_time,
-                torch.cuda.max_memory_allocated() / 1e9 if torch.cuda.is_available() else 0.0,
+                graph_id=self.graph_id,
+                invocation_type=self.invocation.type,
+                time_used=time.time() - self.start_time,
+                vram_used=torch.cuda.max_memory_allocated() / 1e9 if torch.cuda.is_available() else 0.0,
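+                # psutil figures are system-wide: ram_used is total RAM in use now,
+                # and ram_changed is the difference from the __enter__ snapshot (GB).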
+                ram_used=psutil.virtual_memory().used / 1e9,
+                ram_changed=(psutil.virtual_memory().used - self.ram_info.used) / 1e9,
             )
 
     def collect_stats(
@@ -179,13 +188,23 @@
         except KeyError:
             logger.warning(f"Attempted to clear statistics for unknown graph {graph_execution_id}")
 
-    def update_invocation_stats(self, graph_id: str, invocation_type: str, time_used: float, vram_used: float):
+    def update_invocation_stats(self,
+                                graph_id: str,
+                                invocation_type: str,
+                                time_used: float,
+                                vram_used: float,
+                                ram_used: float,
+                                ram_changed: float,
+                                ):
         """
         Add timing information on execution of a node. Usually used internally.
 
         :param graph_id: ID of the graph that is currently executing
         :param invocation_type: String literal type of the node
-        :param time_used: Floating point seconds used by node's exection
+        :param time_used: Time used by node's execution (sec)
+        :param vram_used: Maximum VRAM used during execution (GB)
+        :param ram_used: Current RAM used (GB)
+        :param ram_changed: Change in RAM usage over the course of the run (GB)
         """
         if not self._stats[graph_id].nodes.get(invocation_type):
             self._stats[graph_id].nodes[invocation_type] = NodeStats()
@@ -193,6 +212,8 @@
         stats.calls += 1
         stats.time_used += time_used
         stats.max_vram = max(stats.max_vram, vram_used)
+        stats.ram_used = ram_used
+        stats.ram_changed = ram_changed
 
     def log_stats(self):
         """
@@ -214,8 +235,9 @@
                 total_time += stats.time_used
 
             logger.info(f"TOTAL GRAPH EXECUTION TIME: {total_time:7.3f}s")
+            logger.info(f"Current RAM used: {stats.ram_used:4.2f}G (delta={stats.ram_changed:4.2f}G)")
             if torch.cuda.is_available():
-                logger.info("Current VRAM utilization " + "%4.2fG" % (torch.cuda.memory_allocated() / 1e9))
+                logger.info(f"Current VRAM used: {torch.cuda.memory_allocated() / 1e9:4.2f}G")
 
             completed.add(graph_id)
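
A minimal standalone sketch of the measurement pattern this patch applies,
assuming only that psutil is installed; the name RamTracker and the demo
allocation are illustrative, not part of the InvokeAI API:

    import time

    import psutil


    class RamTracker:
        """Report system RAM used, and its change, across the enclosed block."""

        def __enter__(self):
            self.start_time = time.time()
            # snapshot system memory before the work starts
            self.ram_info = psutil.virtual_memory()
            return self

        def __exit__(self, *args):
            vm = psutil.virtual_memory()
            ram_used = vm.used / 1e9  # system-wide RAM in use now (GB)
            ram_changed = (vm.used - self.ram_info.used) / 1e9  # delta over the block (GB)
            print(f"{time.time() - self.start_time:7.3f}s  RAM used: {ram_used:4.2f}G (delta={ram_changed:4.2f}G)")


    if __name__ == "__main__":
        with RamTracker():
            buf = bytearray(512 * 1024 * 1024)  # ~0.5 GB allocation, visible in the delta

Because psutil reports system-wide memory, the delta is only an approximation
of what the block itself allocated; activity in other processes can shift it.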