ColossalAI/colossalai/zero/legacy/gemini/ophooks/_shard_grad_ophook.py

import torch

from colossalai.legacy.registry import OPHOOKS

from . import BaseOpHook


@OPHOOKS.register_module
class ShardGradMemTracerHook(BaseOpHook):
    """
    Operator hook that sets up sharded gradients in the pre-BWD hook point.

    Only ``pre_bwd_exec`` does any work: it calls ``setup()`` on the
    ``_sharded_grad`` attribute of every parameter of the given module.
    The remaining hook points (``pre_fwd_exec``, ``post_fwd_exec``,
    ``post_bwd_exec`` and ``post_iter``) are no-ops.

    The class is registered in ``OPHOOKS`` through ``register_module``.
    """

    def __init__(self):
        super().__init__()

    def pre_fwd_exec(self, module: torch.nn.Module, *args):
        """No-op: nothing is done before the forward operator runs."""

    def post_fwd_exec(self, module: torch.nn.Module, *args):
        """No-op: nothing is done after the forward operator runs."""

    def pre_bwd_exec(self, module: torch.nn.Module, input, output):
        """
        Call ``setup()`` on the sharded gradient of each parameter of ``module``.

        Args:
            module: module whose parameters are visited via ``module.parameters()``.
            input: unused by this hook.
            output: unused by this hook.

        Raises:
            AssertionError: if a parameter has no ``_sharded_grad`` attribute
                (only when assertions are enabled).
        """
        for weight in module.parameters():
            # Every parameter is expected to carry a `_sharded_grad` attribute
            # by the time this hook fires.
            assert hasattr(weight, "_sharded_grad")
            sharded_grad = weight._sharded_grad
            sharded_grad.setup()

    def post_bwd_exec(self, module: torch.nn.Module, input):
        """No-op: nothing is done after the backward operator runs."""

    def post_iter(self):
        """No-op: nothing is done at the end of an iteration."""
[zero] add sharded grad and refactor grad hooks for ShardedModel (#287) 2022-03-02 10:28:29 +00:00			`import torch`
[Gemini] rename hooks related to runtime mem tracer (#2076) 2022-12-05 07:00:03 +00:00
[legacy] move builder and registry to legacy (#4603) 2023-09-04 11:56:42 +00:00			`from colossalai.legacy.registry import OPHOOKS`
[zero] add sharded grad and refactor grad hooks for ShardedModel (#287) 2022-03-02 10:28:29 +00:00
			`from . import BaseOpHook`


			`@OPHOOKS.register_module`
[Gemini] rename hooks related to runtime mem tracer (#2076) 2022-12-05 07:00:03 +00:00			`class ShardGradMemTracerHook(BaseOpHook):`
[zero] add sharded grad and refactor grad hooks for ShardedModel (#287) 2022-03-02 10:28:29 +00:00			`"""`
[doc] Fix typo under colossalai and doc(#3618) * Fixed several spelling errors under colossalai * Fix the spelling error in colossalai and docs directory * Cautious Changed the spelling error under the example folder * Update runtime_preparation_pass.py revert autograft to autograd * Update search_chunk.py utile to until * Update check_installation.py change misteach to mismatch in line 91 * Update 1D_tensor_parallel.md revert to perceptron * Update 2D_tensor_parallel.md revert to perceptron in line 73 * Update 2p5D_tensor_parallel.md revert to perceptron in line 71 * Update 3D_tensor_parallel.md revert to perceptron in line 80 * Update README.md revert to resnet in line 42 * Update reorder_graph.py revert to indice in line 7 * Update p2p.py revert to megatron in line 94 * Update initialize.py revert to torchrun in line 198 * Update routers.py change to detailed in line 63 * Update routers.py change to detailed in line 146 * Update README.md revert random number in line 402 2023-04-26 03:38:43 +00:00			`A hook to process sharded param before and after FWD and BWD operator executing.`
[zero] add sharded grad and refactor grad hooks for ShardedModel (#287) 2022-03-02 10:28:29 +00:00			`"""`

			`def __init__(self):`
			`super().__init__()`

			`def pre_fwd_exec(self, module: torch.nn.Module, *args):`
			`pass`

			`def post_fwd_exec(self, module: torch.nn.Module, *args):`
			`pass`

			`def pre_bwd_exec(self, module: torch.nn.Module, input, output):`
			`for param in module.parameters():`
			`assert hasattr(param, '_sharded_grad')`
			`param._sharded_grad.setup()`

			`def post_bwd_exec(self, module: torch.nn.Module, input):`
			`pass`

			`def post_iter(self):`
			`pass`