[hotfix] add deconstructor for stateful tensor (#848)

* add deconstructor for stateful tensor
* fix colo init context
2022-04-24 15:03:04 +08:00 · 2022-04-24 15:03:04 +08:00 · 0dea140760
parent 0f7ed8c192
commit 0dea140760
3 changed files with 20 additions and 12 deletions
--- a/colossalai/gemini/gemini_context.py
+++ b/colossalai/gemini/gemini_context.py
@ -33,13 +33,16 @@ class GeminiMemoryManager(object):
    def register_new_instance(self):
        """Increase the instance counter ``_cnter`` by one."""
        self._cnter = self._cnter + 1
    def delete_instance(self):
        """Decrease the instance counter ``_cnter`` by one."""
        self._cnter = self._cnter - 1
    def print_info(self):
-        print(
+        print(f"Total number: {self.total_number}",
            f"Total number: {self.total_number}",
              f"Total CPU memory occupation: {self.total_mem['cpu']}",
-            f"Total CUDA memory occupation: {self.total_mem['cuda']}\n", sep='\n')
+              f"Total CUDA memory occupation: {self.total_mem['cuda']}\n",
              sep='\n')
        for state in self.states_cls:
-            print(
+            print(f"{state}: CPU memory occupation: {self.state_mem['cpu'][state]}",
-                f"{state}: CPU memory occupation: {self.state_mem['cpu'][state]}",
+                  f"{state}: CUDA memory occupation: {self.state_mem['cuda'][state]}\n",
-                f"{state}: CUDA memory occupation: {self.state_mem['cuda'][state]}\n", sep='\n')
+                  sep='\n')
--- a/colossalai/gemini/stateful_tensor.py
+++ b/colossalai/gemini/stateful_tensor.py
@ -202,3 +202,8 @@ class StatefulTensor(object):
        # update the information of each state
        manager.state_mem[from_type][state] -= size
        manager.state_mem[to_type][state] += size
    def __del__(self):
        """Finalizer: reset this tensor and unregister it from the manager.

        Runs when the interpreter is about to destroy the object. It first
        calls ``set_null()`` and then notifies the class-level manager
        ``StatefulTensor.GST_MGR`` through ``delete_instance()``.
        """
        # NOTE(review): presumably set_null() drops the payload and updates
        # the manager's memory accounting -- confirm against set_null().
        self.set_null()
        StatefulTensor.GST_MGR.delete_instance()
        # No `del self` here: it would only unbind the local name `self`
        # inside this call and has no effect on the object's destruction.
--- a/colossalai/utils/model/colo_init_context.py
+++ b/colossalai/utils/model/colo_init_context.py
@ -12,7 +12,7 @@ class ColoInitContext(InsertPostInitMethodToModuleSubClasses):
        super().__init__()
        self._lazy_memory_allocate = lazy_memory_allocate
-    def _post_init_method(self, module: torch.nn.Module):
+    def _post_init_method(self, module: torch.nn.Module, *args, **kwargs):
        """
        The function to call at the end of the constructor of each module.
        FIXME(fjr) The module may be passed to this function multiple times?