ColossalAI/colossalai/fx/tracer/meta_patch/patched_module.py

import math
import torch
from .registry import meta_patched_module


@meta_patched_module.register(torch.nn.Linear)
def torch_nn_linear(self, input):
    last_dim = input.shape[-1]
    assert last_dim == self.in_features, f'Expected hidden size {self.in_features} but got {last_dim} for the torch.nn.Linear patch'
    return torch.empty(input.shape[:-1] + (self.out_features,), device="meta")


@meta_patched_module.register(torch.nn.LayerNorm)
@meta_patched_module.register(torch.nn.GroupNorm)
@meta_patched_module.register(torch.nn.BatchNorm1d)
@meta_patched_module.register(torch.nn.BatchNorm2d)
@meta_patched_module.register(torch.nn.BatchNorm3d)
def torch_nn_normalize(self, input):
    # check shape
    if isinstance(self, torch.nn.BatchNorm1d):
        assert input.dim() in [2, 3]
    elif isinstance(self, torch.nn.BatchNorm2d):
        assert input.dim() == 4
    elif isinstance(self, torch.nn.BatchNorm3d):
        assert input.dim() == 5

    # normalization maintain the same shape as the input
    return input.clone()


@meta_patched_module.register(torch.nn.Embedding)
def torch_nn_embedding(self, input):
    result_shape = input.shape[:-1] + (self.embedding_dim,)
    return torch.empty(result_shape, device='meta')


@meta_patched_module.register(torch.nn.Conv1d)
def torch_nn_conv1d(self, input):
    # the output shape is calculated using the formula stated
    # at https://pytorch.org/docs/stable/generated/torch.nn.Conv1d.html#torch.nn.Conv1d
    l_in = input.shape[-1]
    c_out = self.out_channels
    l_out = math.floor((l_in + 2 * self.padding[0] - self.dilation[0] *
                        (self.kernel_size[0] - 1) - 1) / self.stride[0] + 1)
    result_shape = input.shape[:-2] + (
        c_out,
        l_out,
    )
    return torch.empty(result_shape, device='meta')


@meta_patched_module.register(torch.nn.Conv2d)
def torch_nn_conv2d(self, input):
    # the output shape is calculated using the formula stated
    # at https://pytorch.org/docs/stable/generated/torch.nn.Conv1d.html#torch.nn.Conv2d
    h_in, w_in = input.shape[-2:]
    c_out = self.out_channels
    h_out = math.floor((h_in + 2 * self.padding[0] - self.dilation[0] *
                        (self.kernel_size[0] - 1) - 1) / self.stride[0] + 1)
    w_out = math.floor((w_in + 2 * self.padding[1] - self.dilation[1] *
                        (self.kernel_size[1] - 1) - 1) / self.stride[1] + 1)
    result_shape = input.shape[:-3] + (
        c_out,
        h_out,
        w_out,
    )
    return torch.empty(result_shape, device='meta')


@meta_patched_module.register(torch.nn.Conv3d)
def torch_nn_conv3d(self, input):
    # the output shape is calculated using the formula stated
    # at https://pytorch.org/docs/stable/generated/torch.nn.Conv1d.html#torch.nn.Conv3d
    d_in, h_in, w_in = input.shape[-3:]
    c_out = self.out_channels
    d_out = math.floor((d_in + 2 * self.padding[0] - self.dilation[0] *
                        (self.kernel_size[0] - 1) - 1) / self.stride[0] + 1)
    h_out = math.floor((h_in + 2 * self.padding[1] - self.dilation[1] *
                        (self.kernel_size[1] - 1) - 1) / self.stride[1] + 1)
    w_out = math.floor((w_in + 2 * self.padding[2] - self.dilation[2] *
                        (self.kernel_size[2] - 1) - 1) / self.stride[2] + 1)
    result_shape = input.shape[:-4] + (
        c_out,
        d_out,
        h_out,
        w_out,
    )
    return torch.empty(result_shape, device='meta')
[fx] patched conv and normalization (#1188) 2022-06-29 10:58:38 +00:00			`import math`
[fx] supported data-dependent control flow in model tracing (#1185) * [fx] supported data-dependent control flow in model tracing * polish code 2022-06-29 07:05:25 +00:00			`import torch`
			`from .registry import meta_patched_module`


			`@meta_patched_module.register(torch.nn.Linear)`
			`def torch_nn_linear(self, input):`
[fx] patched conv and normalization (#1188) 2022-06-29 10:58:38 +00:00			`last_dim = input.shape[-1]`
			`assert last_dim == self.in_features, f'Expected hidden size {self.in_features} but got {last_dim} for the torch.nn.Linear patch'`
[fx] supported data-dependent control flow in model tracing (#1185) * [fx] supported data-dependent control flow in model tracing * polish code 2022-06-29 07:05:25 +00:00			`return torch.empty(input.shape[:-1] + (self.out_features,), device="meta")`
[fx] patched conv and normalization (#1188) 2022-06-29 10:58:38 +00:00

			`@meta_patched_module.register(torch.nn.LayerNorm)`
			`@meta_patched_module.register(torch.nn.GroupNorm)`
			`@meta_patched_module.register(torch.nn.BatchNorm1d)`
			`@meta_patched_module.register(torch.nn.BatchNorm2d)`
			`@meta_patched_module.register(torch.nn.BatchNorm3d)`
			`def torch_nn_normalize(self, input):`
			`# check shape`
			`if isinstance(self, torch.nn.BatchNorm1d):`
			`assert input.dim() in [2, 3]`
			`elif isinstance(self, torch.nn.BatchNorm2d):`
			`assert input.dim() == 4`
			`elif isinstance(self, torch.nn.BatchNorm3d):`
			`assert input.dim() == 5`

			`# normalization maintain the same shape as the input`
			`return input.clone()`


			`@meta_patched_module.register(torch.nn.Embedding)`
			`def torch_nn_embedding(self, input):`
			`result_shape = input.shape[:-1] + (self.embedding_dim,)`
			`return torch.empty(result_shape, device='meta')`


			`@meta_patched_module.register(torch.nn.Conv1d)`
			`def torch_nn_conv1d(self, input):`
			`# the output shape is calculated using the formula stated`
			`# at https://pytorch.org/docs/stable/generated/torch.nn.Conv1d.html#torch.nn.Conv1d`
			`l_in = input.shape[-1]`
			`c_out = self.out_channels`
			`l_out = math.floor((l_in + 2 * self.padding[0] - self.dilation[0] *`
			`(self.kernel_size[0] - 1) - 1) / self.stride[0] + 1)`
			`result_shape = input.shape[:-2] + (`
			`c_out,`
			`l_out,`
			`)`
			`return torch.empty(result_shape, device='meta')`


			`@meta_patched_module.register(torch.nn.Conv2d)`
			`def torch_nn_conv2d(self, input):`
			`# the output shape is calculated using the formula stated`
			`# at https://pytorch.org/docs/stable/generated/torch.nn.Conv1d.html#torch.nn.Conv2d`
			`h_in, w_in = input.shape[-2:]`
			`c_out = self.out_channels`
			`h_out = math.floor((h_in + 2 * self.padding[0] - self.dilation[0] *`
			`(self.kernel_size[0] - 1) - 1) / self.stride[0] + 1)`
			`w_out = math.floor((w_in + 2 * self.padding[1] - self.dilation[1] *`
			`(self.kernel_size[1] - 1) - 1) / self.stride[1] + 1)`
			`result_shape = input.shape[:-3] + (`
			`c_out,`
			`h_out,`
			`w_out,`
			`)`
			`return torch.empty(result_shape, device='meta')`


			`@meta_patched_module.register(torch.nn.Conv3d)`
			`def torch_nn_conv3d(self, input):`
			`# the output shape is calculated using the formula stated`
			`# at https://pytorch.org/docs/stable/generated/torch.nn.Conv1d.html#torch.nn.Conv3d`
			`d_in, h_in, w_in = input.shape[-3:]`
			`c_out = self.out_channels`
			`d_out = math.floor((d_in + 2 * self.padding[0] - self.dilation[0] *`
			`(self.kernel_size[0] - 1) - 1) / self.stride[0] + 1)`
			`h_out = math.floor((h_in + 2 * self.padding[1] - self.dilation[1] *`
			`(self.kernel_size[1] - 1) - 1) / self.stride[1] + 1)`
			`w_out = math.floor((w_in + 2 * self.padding[2] - self.dilation[2] *`
			`(self.kernel_size[2] - 1) - 1) / self.stride[2] + 1)`
			`result_shape = input.shape[:-4] + (`
			`c_out,`
			`d_out,`
			`h_out,`
			`w_out,`
			`)`
			`return torch.empty(result_shape, device='meta')`