ColossalAI/colossalai/booster/plugin/plugin_base.py


from abc import ABC, abstractmethod
from typing import Callable, Dict, Iterator, List, Optional, Tuple

import torch.nn as nn
from torch.optim import Optimizer
from torch.optim.lr_scheduler import _LRScheduler as LRScheduler
from torch.utils.data import DataLoader, Dataset

from colossalai.checkpoint_io import CheckpointIO
from colossalai.interface import OptimizerWrapper

__all__ = ["Plugin"]

class Plugin(ABC):
    @abstractmethod
    def supported_devices(self) -> List[str]:
        """
        List of device types supported by this plugin.
        """

    @abstractmethod
    def supported_precisions(self) -> List[str]:
        """
        List of precisions supported by this plugin.
        """

    @abstractmethod
    def control_precision(self) -> bool:
        """
        Whether the plugin controls the precision of the model and optimizer.
        """

    @abstractmethod
    def control_device(self) -> bool:
        """
        Whether the plugin controls the device placement of the model.
        """

    @abstractmethod
    def support_no_sync(self) -> bool:
        """
        Whether the plugin supports the `no_sync` context manager.
        """

    @abstractmethod
    def support_lora(self) -> bool:
        """
        Whether the plugin supports LoRA fine-tuning.
        """

    @abstractmethod
    def configure(
        self,
        model: nn.Module,
        optimizer: Optional[Optimizer] = None,
        criterion: Optional[Callable] = None,
        dataloader: Optional[DataLoader] = None,
        lr_scheduler: Optional[LRScheduler] = None,
    ) -> Tuple[nn.Module, OptimizerWrapper, Callable, DataLoader, LRScheduler]:
        """
        Wrap the given components so that they are ready for distributed execution and return them.
        """

    @abstractmethod
    def control_checkpoint_io(self) -> bool:
        """
        Whether the plugin controls the checkpoint io.
        """

    @abstractmethod
    def get_checkpoint_io(self) -> CheckpointIO:
        """
        Get checkpoint io object for this plugin, only invoked when control_checkpoint_io is True.
        """

    @abstractmethod
    def no_sync(self, model: nn.Module, optimizer: OptimizerWrapper) -> Iterator[None]:
        """
        Context manager to disable gradient synchronization.
        """

    @abstractmethod
    def enable_lora(self, model: nn.Module, pretrained_dir: str, lora_config: Dict) -> nn.Module:
        """
        Add LoRA modules to the model passed in. Should only be called in booster.enable_lora().
        """

    @abstractmethod
    def prepare_dataloader(
        self,
        dataset: Dataset,
        batch_size: int,
        shuffle: bool = False,
        seed: int = 1024,
        drop_last: bool = False,
        pin_memory: bool = False,
        num_workers: int = 0,
        **kwargs,
    ):
        """
        Prepare a dataloader for distributed training. The dataset will be wrapped in a
        `torch.utils.data.DataLoader`.
        """