# ColossalAI/colossalai/utils/model/utils.py

# This code has been adapted from the DeepSpeed library.
# Copyright (c) Microsoft Corporation.
# Licensed under the MIT License.

import functools
from typing import Optional

import torch


def substitute_init_recursively(cls, func, visited: set):
    """Apply ``func`` once to every class found below ``cls`` in its subclass tree.

    The tree returned by ``__subclasses__()`` is walked depth-first, and the
    descendants of a class are handled before the class itself. ``cls`` itself
    is never passed to ``func``.

    Args:
        cls (type): root class whose subclass tree is walked
        func (Callable): called with each class that is not yet in ``visited``
        visited (set): classes that have already been handled; updated in place
    """
    for child in cls.__subclasses__():
        # Descend first so the deepest classes are processed before their parents.
        substitute_init_recursively(child, func, visited)
        if child in visited:
            # Already recorded in ``visited``; do not call ``func`` again.
            continue
        func(child)
        visited.add(child)


def call_to_str(base, *args, **kwargs):
    """Render a call expression as text.

    Args:
        base (str): name of the call
        args (tuple, optional): positional arguments of the call
        kwargs (dict, optional): keyword arguments of the call

    Returns:
        str: text of the form ``base(arg, ..., key=value, ...)``, where every
        argument value is rendered with ``repr``
    """
    positional = [repr(value) for value in args]
    keyword = [f'{key}={value!r}' for key, value in kwargs.items()]
    # Positional arguments come first, then keyword arguments, all comma separated.
    return f"{base}({', '.join(positional + keyword)})"


class InsertPostInitMethodToModuleSubClasses(object):
    """Context manager that runs a hook after ``__init__`` of ``torch.nn.Module`` subclasses.

    On entry, ``__init__`` of every existing subclass of ``torch.nn.Module`` is wrapped so
    that ``self._post_init_method(module, *args, **kwargs)`` is called right after the
    original ``__init__`` returns. ``torch.nn.Module.__init_subclass__`` is replaced as well,
    so subclasses created while the context is active get the same wrapping. On exit the
    saved ``__init__`` functions and the saved ``__init_subclass__`` are put back.

    Every class in the hierarchy is wrapped individually, so the hook runs once per wrapped
    ``__init__`` that executes: a subclass ``__init__`` that calls a wrapped parent
    ``__init__`` triggers the hook more than once for the same module.

    Inheriting classes customise the behaviour by overriding ``_post_init_method``,
    ``_pre_context_exec`` and ``_post_context_exec``.

    Args:
        default_dtype (torch.dtype, optional): if given, it is installed with
            ``torch.set_default_dtype`` on entry and the previous default dtype is
            restored on exit.
    """

    def __init__(self, default_dtype: Optional[torch.dtype] = None):
        # Filled in by ``__enter__`` when a default dtype override was requested.
        self._old_default_dtype = None
        self._default_dtype = default_dtype

    def __enter__(self):
        r"""
        Enter the context scope.

        Optionally switches the torch default dtype, wraps ``__init__`` of all existing
        and future ``torch.nn.Module`` subclasses, then calls ``_pre_context_exec``.

        Returns:
            InsertPostInitMethodToModuleSubClasses: the context object itself.
        """
        if self._default_dtype is not None:
            self._old_default_dtype = torch.get_default_dtype()
            torch.set_default_dtype(self._default_dtype)

        def preprocess_after(f):
            # Build a replacement ``__init__`` that calls ``f`` and then the post-init hook.

            @functools.wraps(f)
            def wrapper(module: torch.nn.Module, *args, **kwargs):
                f(module, *args, **kwargs)
                self._post_init_method(module, *args, **kwargs)

            return wrapper

        def _enable_class(cls):
            # Keep the current ``__init__`` so that ``__exit__`` can put it back.
            cls._old_init = cls.__init__
            cls.__init__ = preprocess_after(cls.__init__)

        # The function is called during init subclass.
        def _init_subclass(cls, **kwargs):
            # ``__init_subclass__`` runs after the class namespace has been populated, so an
            # ``__init__`` written in the class body is already present in ``vars(cls)``.
            # Record it as this class's own ``_old_init``; otherwise ``__exit__`` would either
            # find no ``_old_init`` at all or pick up an ancestor's and overwrite this class's
            # own ``__init__`` with it.
            # A class without its own ``__init__`` is deliberately left without its own
            # ``_old_init``: ``cls.__init__`` may resolve to a parent's wrapper here, and
            # restoring that wrapper on exit would keep the hook alive after the context.
            if '__init__' in vars(cls):
                cls._old_init = cls.__init__
            cls.__init__ = preprocess_after(cls.__init__)

        # Replace .__init__() for all existing subclasses of torch.nn.Module
        # Execute self._post_init_method after the default init function.
        substitute_init_recursively(torch.nn.modules.module.Module, _enable_class, set())

        # holding on to the current __init_subclass__ for exit
        torch.nn.modules.module.Module._old_init_subclass = (torch.nn.modules.module.Module.__init_subclass__)
        # Replace .__init__() for future subclasses of torch.nn.Module
        torch.nn.modules.module.Module.__init_subclass__ = classmethod(_init_subclass)

        self._pre_context_exec()
        return self

    def __exit__(self, exc_type, exc_value, traceback):
        """Leave the context scope and undo the patching done in ``__enter__``.

        Restores the default dtype (if it was overridden), the saved ``__init__`` of every
        ``torch.nn.Module`` subclass and the saved ``__init_subclass__``, then calls
        ``_post_context_exec``.

        Returns:
            ``False`` when an exception is in flight, so that it propagates to the caller;
            ``None`` otherwise.

        Raises:
            AttributeError: if a subclass has no ``_old_init`` to restore from.
        """

        if self._default_dtype is not None:
            torch.set_default_dtype(self._old_default_dtype)

        def _disable_class(cls):
            # ``hasattr`` also finds an inherited ``_old_init``. A class created inside the
            # context without its own ``__init__`` therefore falls back to its ancestor's
            # saved ``__init__``, and only raises when no ancestor has one.
            if not hasattr(cls, '_old_init'):
                raise AttributeError(
                    f"_old_init is not found in the {cls.__name__}, please make sure that you have imported {cls.__name__} before entering the context."
                )
            cls.__init__ = cls._old_init

        # Restore .__init__() for all existing subclasses of torch.nn.Module
        substitute_init_recursively(torch.nn.modules.module.Module, _disable_class, set())

        # Restore the __init_subclass__ that was active before entering the context
        torch.nn.modules.module.Module.__init_subclass__ = (torch.nn.modules.module.Module._old_init_subclass)

        self._post_context_exec()
        # The patching has been undone; returning False lets a pending exception propagate.
        if exc_type is not None:
            return False

    # To be implemented by inheriting classes
    def _post_init_method(self, module, *args, **kwargs):
        """Hook called after a wrapped ``__init__`` with the module and the ``__init__`` arguments."""
        pass

    def _pre_context_exec(self):
        """Hook called at the end of ``__enter__``, after the patching is in place."""
        pass

    def _post_context_exec(self):
        """Hook called at the end of ``__exit__``, after the patching has been undone."""
        pass
[doc] add deepspeed citation and copyright (#2996) * [doc] add deepspeed citation and copyright * [doc] add deepspeed citation and copyright * [doc] add deepspeed citation and copyright 2 years ago			`# This code has been adapted from the DeepSpeed library.`
			`# Copyright (c) Microsoft Corporation.`
			`# Licensed under the MIT License.`

[refactor] moving InsertPostInitMethodToModuleSubClasses to utils. (#824) 3 years ago			`import functools`
			`from typing import Optional`

[doc] add deepspeed citation and copyright (#2996) * [doc] add deepspeed citation and copyright * [doc] add deepspeed citation and copyright * [doc] add deepspeed citation and copyright 2 years ago			`import torch`

[refactor] moving InsertPostInitMethodToModuleSubClasses to utils. (#824) 3 years ago
[hotfix] fix init context (#1543) * fix init context * fix lazy init ctx 2 years ago			`def substitute_init_recursively(cls, func, visited: set):`
[refactor] moving InsertPostInitMethodToModuleSubClasses to utils. (#824) 3 years ago			`for subcls in cls.__subclasses__():`
[hotfix] fix init context (#1543) * fix init context * fix lazy init ctx 2 years ago			`substitute_init_recursively(subcls, func, visited)`
			`if subcls not in visited:`
			`func(subcls)`
			`visited.add(subcls)`
[refactor] moving InsertPostInitMethodToModuleSubClasses to utils. (#824) 3 years ago

[pipelinable]use pipelinable context to initialize non-pipeline model (#816) * [CLI] add CLI launcher * Revert "[CLI] add CLI launcher" This reverts commit df7e6506d4500af6a9220ef7fe4d3c7b1daebd4c. * [pipeline]add module lazy init feature to support large model initization. * [pipeline]add to_layer_list and partition method to support arbitrary non-pp model * refactor the module structure * polish * [pipelinable]add unit test for pipelinable * polish * polish * Fix CodeFactor issues. 3 years ago			`def call_to_str(base, *args, **kwargs):`
			`"""Construct a string representation of a call.`

			`Args:`
			`base (str): name of the call`
			args (tuple, optional): args to ``base``
			kwargs (dict, optional): kwargs supplied to ``base``

			`Returns:`
			`str: A string representation of base(*args, **kwargs)`
			`"""`
			`name = f'{base}('`
			`if args:`
			`name += ', '.join(repr(arg) for arg in args)`
			`if kwargs:`
			`name += ', '`
			`if kwargs:`
			`name += ', '.join(f'{key}={repr(arg)}' for key, arg in kwargs.items())`
			`name += ')'`
			`return name`


[refactor] moving InsertPostInitMethodToModuleSubClasses to utils. (#824) 3 years ago			`class InsertPostInitMethodToModuleSubClasses(object):`

			`def __init__(self, default_dtype: Optional[torch.dtype] = None):`
			`self._old_default_dtype = None`
			`self._default_dtype = default_dtype`

			`def __enter__(self):`
			`r"""`
			`Enter the context scope.`
			`"""`
			`if self._default_dtype is not None:`
			`self._old_default_dtype = torch.get_default_dtype()`
			`torch.set_default_dtype(self._default_dtype)`

			`def preprocess_after(f):`

			`@functools.wraps(f)`
			`def wrapper(module: torch.nn.Module, *args, **kwargs):`
			`f(module, *args, **kwargs)`
[pipelinable]use pipelinable context to initialize non-pipeline model (#816) * [CLI] add CLI launcher * Revert "[CLI] add CLI launcher" This reverts commit df7e6506d4500af6a9220ef7fe4d3c7b1daebd4c. * [pipeline]add module lazy init feature to support large model initization. * [pipeline]add to_layer_list and partition method to support arbitrary non-pp model * refactor the module structure * polish * [pipelinable]add unit test for pipelinable * polish * polish * Fix CodeFactor issues. 3 years ago			`self._post_init_method(module, *args, **kwargs)`
[refactor] moving InsertPostInitMethodToModuleSubClasses to utils. (#824) 3 years ago
			`return wrapper`

			`def _enable_class(cls):`
			`cls._old_init = cls.__init__`
			`cls.__init__ = preprocess_after(cls.__init__)`

			`# The function is called during init subclass.`
			`def _init_subclass(cls, **kwargs):`
			`cls.__init__ = preprocess_after(cls.__init__)`

			`# Replace .__init__() for all existing subclasses of torch.nn.Module`
fix typo with colossalai/trainer utils zero (#3908) 1 year ago			`# Execution self._post_init_method after the default init function.`
[hotfix] fix init context (#1543) * fix init context * fix lazy init ctx 2 years ago			`substitute_init_recursively(torch.nn.modules.module.Module, _enable_class, set())`
[refactor] moving InsertPostInitMethodToModuleSubClasses to utils. (#824) 3 years ago
			`# holding on to the current __init__subclass__ for exit`
			`torch.nn.modules.module.Module._old_init_subclass = (torch.nn.modules.module.Module.__init_subclass__)`
			`# Replace .__init__() for future subclasses of torch.nn.Module`
			`torch.nn.modules.module.Module.__init_subclass__ = classmethod(_init_subclass)`

			`self._pre_context_exec()`
[context] maintain the context object in with statement (#1073) 3 years ago			`return self`
[refactor] moving InsertPostInitMethodToModuleSubClasses to utils. (#824) 3 years ago
			`def __exit__(self, exc_type, exc_value, traceback):`

			`if self._default_dtype is not None:`
			`torch.set_default_dtype(self._old_default_dtype)`

			`def _disable_class(cls):`
[zero] added error message to handle on-the-fly import of torch Module class (#1135) * [zero] added error message to handle on-the-fly import of torch Module class * polish code 2 years ago			`if not hasattr(cls, '_old_init'):`
			`raise AttributeError(`
			`f"_old_init is not found in the {cls.__name__}, please make sure that you have imported {cls.__name__} before entering the context."`
			`)`
[refactor] moving InsertPostInitMethodToModuleSubClasses to utils. (#824) 3 years ago			`cls.__init__ = cls._old_init`

			`# Replace .__init__() for all existing subclasses of torch.nn.Module`
[hotfix] fix init context (#1543) * fix init context * fix lazy init ctx 2 years ago			`substitute_init_recursively(torch.nn.modules.module.Module, _disable_class, set())`
[refactor] moving InsertPostInitMethodToModuleSubClasses to utils. (#824) 3 years ago
			`# Replace .__init__() for future subclasses of torch.nn.Module`
			`torch.nn.modules.module.Module.__init_subclass__ = (torch.nn.modules.module.Module._old_init_subclass)`

			`self._post_context_exec()`
			`# Now that we cleaned up the metaclass injection, raise the exception.`
			`if exc_type is not None:`
			`return False`

			`# To be implemented by inheriting classes`
[pipelinable]use pipelinable context to initialize non-pipeline model (#816) * [CLI] add CLI launcher * Revert "[CLI] add CLI launcher" This reverts commit df7e6506d4500af6a9220ef7fe4d3c7b1daebd4c. * [pipeline]add module lazy init feature to support large model initization. * [pipeline]add to_layer_list and partition method to support arbitrary non-pp model * refactor the module structure * polish * [pipelinable]add unit test for pipelinable * polish * polish * Fix CodeFactor issues. 3 years ago			`def _post_init_method(self, module, *args, **kwargs):`
[refactor] moving InsertPostInitMethodToModuleSubClasses to utils. (#824) 3 years ago			`pass`

			`def _pre_context_exec(self):`
			`pass`

			`def _post_context_exec(self):`
			`pass`