# ColossalAI/colossalai/fx/profiler/memory.py

import torch
from torch.fx import Node
from typing import Union, Dict, List, Tuple
from operator import add, floordiv, getitem, mul, neg, setitem, sub, pos
from . import META_COMPATIBILITY

__all__ = ['activation_size', 'parameter_size', 'is_inplace']

# Operator tables used to classify graph nodes. Which tables exist depends on
# META_COMPATIBILITY (imported from the package): aten overloads when it is
# truthy, plain Python callables / method names otherwise. Every table that is
# defined is also appended to `__all__`.
if META_COMPATIBILITY:
    aten = torch.ops.aten

    # NOTE(review): the consumers of this list are outside this file; the name
    # suggests ops that need special-casing by the profiler -- confirm there.
    WEIRD_OPS = [
        torch.where,
    ]

    # aten overloads that `is_inplace` reports as in-place when they appear as
    # the target of a `call_function` node.
    INPLACE_ATEN = [
        aten.add_.Tensor,
        aten.sub_.Tensor,
        aten.div_.Tensor,
        aten.div_.Scalar,
        aten.mul_.Tensor,
        aten.bernoulli_.float,

        # inplace reshaping
        aten.copy_.default,
        aten.detach.default,
        aten.t.default,
        aten.transpose.int,
        aten.view.default,
        aten._unsafe_view.default,
    ]

    # Normalization kernels; consumed outside this file.
    NORMALIZATION_ATEN = [
        aten.native_batch_norm.default,
        aten.native_layer_norm.default,
        # aten.max_pool2d_with_indices.default,
    ]

    # Clone kernels; consumed outside this file.
    CLONE_ATEN = [
        aten.clone.default,
    ]

    __all__ += ['INPLACE_ATEN', 'WEIRD_OPS', 'NORMALIZATION_ATEN', 'CLONE_ATEN']

else:
    # Fallback tables for when META_COMPATIBILITY is falsy.
    # TODO fill out the inplace ops
    INPLACE_OPS = [
        add,
        sub,
        mul,
        floordiv,
        neg,
        pos,
        getitem,
        setitem,
        getattr,
        torch.Tensor.cpu,
    ]

    # Names of `call_method` targets that are classified as in-place.
    # TODO: list all call_methods that are inplace here
    INPLACE_METHOD = [
        'transpose',
        'permute',
        # TODO: reshape may return a copy of the data if the data is not contiguous
        'reshape',
        'dim',
        'flatten',
        'size',
        'view',
        'unsqueeze',
        'to',
        'type',
    ]

    # Names of `call_method` targets that are classified as not in-place.
    # TODO: list all call_methods that are not inplace here
    NON_INPLACE_METHOD = [
        'chunk',
        'contiguous',
        'expand',
        'mean',
        'split',
    ]
    __all__ += ['INPLACE_OPS', 'INPLACE_METHOD', 'NON_INPLACE_METHOD']


def activation_size(out: Union[torch.Tensor, Dict, List, Tuple, int]) -> int:
    """Compute the number of bytes occupied by an activation.

    Containers are walked recursively; anything that is neither a tensor nor a
    dict/list/tuple contributes nothing.

    Args:
        out (Union[torch.Tensor, Dict, List, Tuple, int]): The output of a
            `torch.nn.Module` or `torch.nn.functional` call.

    Returns:
        int: The activation size in bytes
    """
    if isinstance(out, torch.Tensor):
        # Per-element width is looked up from the dtype via an empty probe tensor.
        bytes_per_element = torch.tensor([], dtype=out.dtype).element_size()
        return out.numel() * bytes_per_element
    if isinstance(out, dict):
        # Only the values count towards the size; keys are ignored.
        return activation_size(list(out.values()))
    if isinstance(out, (tuple, list)):
        return sum(activation_size(item) for item in out)
    return 0


def parameter_size(mod: torch.nn.Module) -> int:
    """Compute the number of bytes occupied by a module's parameters.

    Args:
        mod (torch.nn.Module): The module whose `parameters()` are summed.

    Returns:
        int: The total parameter size in bytes
    """
    # Per-element width is looked up from each parameter's dtype via an empty
    # probe tensor, then multiplied by the element count.
    return sum(
        p.numel() * torch.tensor([], dtype=p.dtype).element_size()
        for p in mod.parameters()
    )


def is_inplace(n: Node):
    """Report whether a torch.fx.Node represents an in-place operation.

    Args:
        n (Node): torch.fx.Node

    Returns:
        bool: indicates whether this op is inplace. For `call_module` nodes this
            is the submodule's `inplace` attribute; for `call_function` nodes it
            is the `inplace` kwarg, overridden to True when the target is listed
            in `INPLACE_ATEN`. Every other node kind yields False.
    """
    if n.op == "call_module":
        submodule = n.graph.owning_module.get_submodule(n.target)
        return getattr(submodule, "inplace", False)

    if n.op != "call_function":
        return False

    # INPLACE_ATEN only exists when META_COMPATIBILITY is truthy, so the flag
    # must be checked first.
    if META_COMPATIBILITY and n.target in INPLACE_ATEN:
        return True
    return n.kwargs.get("inplace", False)
[fx] provide a stable but not accurate enough version of profiler. (#1547) * [fx] compute memory stat and flop count for MetaInfoProp. * [fx] modify node attribute. * [fx] modify ckpt_chen. * [fx] fix compatibility. * [fx] fix import error. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip if torch 1.11.0. * [fx] recover MetaInfoProp support for PyTorch 1.11. * [fx] provide a stable but not accurate enough version of profiler. * [fx] provide a stable but not accurate enough version of profiler. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix import error. 2022-09-07 03:21:04 +00:00			`import torch`
[fx/tuning] tune performance on rotor with meta info. (#1599) 2022-09-15 06:46:36 +00:00			`from torch.fx import Node`
[fx] provide a stable but not accurate enough version of profiler. (#1547) * [fx] compute memory stat and flop count for MetaInfoProp. * [fx] modify node attribute. * [fx] modify ckpt_chen. * [fx] fix compatibility. * [fx] fix import error. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip if torch 1.11.0. * [fx] recover MetaInfoProp support for PyTorch 1.11. * [fx] provide a stable but not accurate enough version of profiler. * [fx] provide a stable but not accurate enough version of profiler. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix import error. 2022-09-07 03:21:04 +00:00			`from typing import Union, Dict, List, Tuple`
			`from operator import add, floordiv, getitem, mul, neg, setitem, sub, pos`
			`from . import META_COMPATIBILITY`

[fx/tuning] tune performance on rotor with meta info. (#1599) 2022-09-15 06:46:36 +00:00			`__all__ = ['activation_size', 'parameter_size', 'is_inplace']`
[fx] provide a stable but not accurate enough version of profiler. (#1547) * [fx] compute memory stat and flop count for MetaInfoProp. * [fx] modify node attribute. * [fx] modify ckpt_chen. * [fx] fix compatibility. * [fx] fix import error. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip if torch 1.11.0. * [fx] recover MetaInfoProp support for PyTorch 1.11. * [fx] provide a stable but not accurate enough version of profiler. * [fx] provide a stable but not accurate enough version of profiler. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix import error. 2022-09-07 03:21:04 +00:00
			`if META_COMPATIBILITY:`
			`aten = torch.ops.aten`

			`WEIRD_OPS = [`
			`torch.where,`
			`]`

			`INPLACE_ATEN = [`
			`aten.add_.Tensor,`
			`aten.sub_.Tensor,`
			`aten.div_.Tensor,`
			`aten.div_.Scalar,`
			`aten.mul_.Tensor,`
			`aten.bernoulli_.float,`

			`# inplace reshaping`
[fx/tuning] tune performance on rotor with meta info. (#1599) 2022-09-15 06:46:36 +00:00			`aten.copy_.default,`
[fx] provide a stable but not accurate enough version of profiler. (#1547) * [fx] compute memory stat and flop count for MetaInfoProp. * [fx] modify node attribute. * [fx] modify ckpt_chen. * [fx] fix compatibility. * [fx] fix import error. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip if torch 1.11.0. * [fx] recover MetaInfoProp support for PyTorch 1.11. * [fx] provide a stable but not accurate enough version of profiler. * [fx] provide a stable but not accurate enough version of profiler. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix import error. 2022-09-07 03:21:04 +00:00			`aten.detach.default,`
			`aten.t.default,`
			`aten.transpose.int,`
			`aten.view.default,`
			`aten._unsafe_view.default,`
			`]`

[fx/tuning] tune performance on rotor with meta info. (#1599) 2022-09-15 06:46:36 +00:00			`NORMALIZATION_ATEN = [`
			`aten.native_batch_norm.default,`
			`aten.native_layer_norm.default,`
			`# aten.max_pool2d_with_indices.default,`
			`]`

			`CLONE_ATEN = [`
			`aten.clone.default,`
			`]`

			`__all__ += ['INPLACE_ATEN', 'WEIRD_OPS', 'NORMALIZATION_ATEN', 'CLONE_ATEN']`
[fx] provide a stable but not accurate enough version of profiler. (#1547) * [fx] compute memory stat and flop count for MetaInfoProp. * [fx] modify node attribute. * [fx] modify ckpt_chen. * [fx] fix compatibility. * [fx] fix import error. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip test for MetaInfoProp. * [fx] skip if torch 1.11.0. * [fx] recover MetaInfoProp support for PyTorch 1.11. * [fx] provide a stable but not accurate enough version of profiler. * [fx] provide a stable but not accurate enough version of profiler. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix compatibility in tests. * [fx] fix import error. 2022-09-07 03:21:04 +00:00
			`else:`
			`# TODO fill out the inplace ops`
			`INPLACE_OPS = [`
			`add,`
			`sub,`
			`mul,`
			`floordiv,`
			`neg,`
			`pos,`
			`getitem,`
			`setitem,`
			`getattr,`
			`torch.Tensor.cpu,`
			`]`

			`# TODO: list all call_methods that are inplace here`
			`INPLACE_METHOD = [`
			`'transpose',`
			`'permute',`
			`# TODO: reshape may return a copy of the data if the data is not contiguous`
			`'reshape',`
			`'dim',`
			`'flatten',`
			`'size',`
			`'view',`
			`'unsqueeze',`
			`'to',`
			`'type',`
			`'flatten',`
			`]`

			`# TODO: list all call_methods that are not inplace here`
			`NON_INPLACE_METHOD = [`
			`'chunk',`
			`'contiguous',`
			`'expand',`
			`'mean',`
			`'split',`
			`]`
			`__all__ += ['INPLACE_OPS', 'INPLACE_METHOD', 'NON_INPLACE_METHOD']`


			`def activation_size(out: Union[torch.Tensor, Dict, List, Tuple, int]) -> int:`
			`"""Calculate activation size of a node.`

			`Args:`
			activation (Union[torch.Tensor, Dict, List, Tuple, int]): The activation of a `torch.nn.Module` or `torch.nn.functional`

			`Returns:`
			`int: The activation size`
			`"""`
			`act_size = 0`
			`if isinstance(out, torch.Tensor):`
			`act_size += out.numel() * torch.tensor([], dtype=out.dtype).element_size()`
			`elif isinstance(out, dict):`
			`value_list = [v for _, v in out.items()]`
			`act_size += activation_size(value_list)`
			`elif isinstance(out, tuple) or isinstance(out, list):`
			`for element in out:`
			`act_size += activation_size(element)`
			`return act_size`


			`def parameter_size(mod: torch.nn.Module) -> int:`
			`"""Calculate param size of a node.`

			`Args:`
			mod (torch.nn.Module): The target `torch.nn.Module`

			`Returns:`
			`int: The param size`
			`"""`
			`param_size = 0`
			`for param in mod.parameters():`
			`param_size += param.numel() * torch.tensor([], dtype=param.dtype).element_size()`
			`return param_size`
[fx/tuning] tune performance on rotor with meta info. (#1599) 2022-09-15 06:46:36 +00:00

			`def is_inplace(n: Node):`
			`"""Get the inplace argument from torch.fx.Node`

			`Args:`
			`node (Node): torch.fx.Node`

			`Returns:`
			`bool: indicates whether this op is inplace`
			`"""`
			`inplace = False`
			`if n.op == "call_function":`
			`inplace = n.kwargs.get("inplace", False)`
			`if META_COMPATIBILITY and n.target in INPLACE_ATEN:`
			`inplace = True`
			`elif n.op == "call_module":`
			`inplace = getattr(n.graph.owning_module.get_submodule(n.target), "inplace", False)`

			`return inplace`