2023-06-19 05:53:17 +00:00
|
|
|
import importlib
|
|
|
|
from dataclasses import dataclass
|
|
|
|
|
2023-05-22 07:02:17 +00:00
|
|
|
import torch.nn as nn
|
|
|
|
|
2023-07-05 07:13:00 +00:00
|
|
|
from .base_policy import Policy
|
2023-06-15 09:55:42 +00:00
|
|
|
|
2023-06-30 02:56:29 +00:00
|
|
|
# Public names exported by a star-import of this module; the registry dict
# and the `_fullname` helper are intentionally left out.
__all__ = ["PolicyLocation", "get_autopolicy", "import_policy"]
|
|
|
|
|
2023-05-24 02:26:46 +00:00
|
|
|
|
2023-06-19 05:53:17 +00:00
|
|
|
@dataclass
class PolicyLocation:
    """
    PolicyLocation describes the location of a policy class.

    Args:
        file_name (str): The file name of the policy under colossalai.shardformer.policies
        class_name (str): The class name of the policy class
    """
    # Module name (without package prefix) that contains the policy class.
    file_name: str
    # Attribute name of the policy class inside that module.
    class_name: str
|
|
|
|
|
|
|
|
|
|
|
|
# We deliberately do not import every policy module here: each policy file
# imports its own model zoo library, so importing them all would pull in every
# supported model family. Instead, this registry maps the fully qualified class
# name of a model to the location of its policy, and only the policy file that
# is actually needed gets imported on demand.
_POLICY_LIST = {
    # BERT
    "transformers.models.bert.modeling_bert.BertModel":
        PolicyLocation(file_name="bert", class_name="BertModelPolicy"),
    "transformers.models.bert.modeling_bert.BertForPreTraining":
        PolicyLocation(file_name="bert", class_name="BertForPreTrainingPolicy"),
    "transformers.models.bert.modeling_bert.BertLMHeadModel":
        PolicyLocation(file_name="bert", class_name="BertLMHeadModelPolicy"),
    "transformers.models.bert.modeling_bert.BertForMaskedLM":
        PolicyLocation(file_name="bert", class_name="BertForMaskedLMPolicy"),
    "transformers.models.bert.modeling_bert.BertForSequenceClassification":
        PolicyLocation(file_name="bert", class_name="BertForSequenceClassificationPolicy"),
    "transformers.models.bert.modeling_bert.BertForTokenClassification":
        PolicyLocation(file_name="bert", class_name="BertForTokenClassificationPolicy"),
    "transformers.models.bert.modeling_bert.BertForNextSentencePrediction":
        PolicyLocation(file_name="bert", class_name="BertForNextSentencePredictionPolicy"),
    "transformers.models.bert.modeling_bert.BertForMultipleChoice":
        PolicyLocation(file_name="bert", class_name="BertForMultipleChoicePolicy"),
    "transformers.models.bert.modeling_bert.BertForQuestionAnswering":
        PolicyLocation(file_name="bert", class_name="BertForQuestionAnsweringPolicy"),

    # LLaMA
    "transformers.models.llama.modeling_llama.LlamaModel":
        PolicyLocation(file_name="llama", class_name="LlamaModelPolicy"),
    "transformers.models.llama.modeling_llama.LlamaForCausalLM":
        PolicyLocation(file_name="llama", class_name="LlamaForCausalLMPolicy"),
    "transformers.models.llama.modeling_llama.LlamaForSequenceClassification":
        PolicyLocation(file_name="llama", class_name="LlamaForSequenceClassificationPolicy"),

    # T5
    "transformers.models.t5.modeling_t5.T5Model":
        PolicyLocation(file_name="t5", class_name="T5ModelPolicy"),
    "transformers.models.t5.modeling_t5.T5ForConditionalGeneration":
        PolicyLocation(file_name="t5", class_name="T5ForConditionalGenerationPolicy"),
    "transformers.models.t5.modeling_t5.T5EncoderModel":
        PolicyLocation(file_name="t5", class_name="T5EncoderPolicy"),

    # GPT2
    "transformers.models.gpt2.modeling_gpt2.GPT2Model":
        PolicyLocation(file_name="gpt2", class_name="GPT2ModelPolicy"),
    "transformers.models.gpt2.modeling_gpt2.GPT2LMHeadModel":
        PolicyLocation(file_name="gpt2", class_name="GPT2LMHeadModelPolicy"),
    "transformers.models.gpt2.modeling_gpt2.GPT2DoubleHeadsModel":
        PolicyLocation(file_name="gpt2", class_name="GPT2DoubleHeadsModelPolicy"),
    "transformers.models.gpt2.modeling_gpt2.GPT2ForQuestionAnswering":
        PolicyLocation(file_name="gpt2", class_name="GPT2ForQuestionAnsweringPolicy"),
    "transformers.models.gpt2.modeling_gpt2.GPT2ForTokenClassification":
        PolicyLocation(file_name="gpt2", class_name="GPT2ForTokenClassificationPolicy"),
    "transformers.models.gpt2.modeling_gpt2.GPT2ForSequenceClassification":
        PolicyLocation(file_name="gpt2", class_name="GPT2ForSequenceClassificationPolicy"),

    # ViT
    "transformers.models.vit.modeling_vit.ViTModel":
        PolicyLocation(file_name="vit", class_name="ViTModelPolicy"),
    "transformers.models.vit.modeling_vit.ViTForImageClassification":
        PolicyLocation(file_name="vit", class_name="ViTForImageClassificationPolicy"),
    "transformers.models.vit.modeling_vit.ViTForMaskedImageModeling":
        PolicyLocation(file_name="vit", class_name="ViTForMaskedImageModelingPolicy"),

    # OPT
    "transformers.models.opt.modeling_opt.OPTModel":
        PolicyLocation(file_name="opt", class_name="OPTModelPolicy"),
    "transformers.models.opt.modeling_opt.OPTForCausalLM":
        PolicyLocation(file_name="opt", class_name="OPTForCausalLMPolicy"),
    "transformers.models.opt.modeling_opt.OPTForSequenceClassification":
        PolicyLocation(file_name="opt", class_name="OPTForSequenceClassificationPolicy"),
    "transformers.models.opt.modeling_opt.OPTForQuestionAnswering":
        PolicyLocation(file_name="opt", class_name="OPTForQuestionAnsweringPolicy"),

    # Bloom
    "transformers.models.bloom.modeling_bloom.BloomModel":
        PolicyLocation(file_name="bloom", class_name="BloomModelPolicy"),
    "transformers.models.bloom.modeling_bloom.BloomForCausalLM":
        PolicyLocation(file_name="bloom", class_name="BloomForCausalLMPolicy"),
    "transformers.models.bloom.modeling_bloom.BloomForSequenceClassification":
        PolicyLocation(file_name="bloom", class_name="BloomForSequenceClassificationPolicy"),
    "transformers.models.bloom.modeling_bloom.BloomForTokenClassification":
        PolicyLocation(file_name="bloom", class_name="BloomForTokenClassificationPolicy"),
    "transformers.models.bloom.modeling_bloom.BloomForQuestionAnswering":
        PolicyLocation(file_name="bloom", class_name="BloomForQuestionAnsweringPolicy"),

    # Whisper
    "transformers.models.whisper.modeling_whisper.WhisperModel":
        PolicyLocation(file_name="whisper", class_name="WhisperModelPolicy"),
    "transformers.models.whisper.modeling_whisper.WhisperForConditionalGeneration":
        PolicyLocation(file_name="whisper", class_name="WhisperForConditionalGenerationPolicy"),
    "transformers.models.whisper.modeling_whisper.WhisperForAudioClassification":
        PolicyLocation(file_name="whisper", class_name="WhisperForAudioClassificationPolicy"),

    # Sam
    "transformers.models.sam.modeling_sam.SamModel":
        PolicyLocation(file_name="sam", class_name="SamModelPolicy"),

    # Blip2
    "transformers.models.blip_2.modeling_blip_2.Blip2Model":
        PolicyLocation(file_name="blip2", class_name="Blip2ModelPolicy"),
    "transformers.models.blip_2.modeling_blip_2.Blip2ForConditionalGeneration":
        PolicyLocation(file_name="blip2", class_name="Blip2ForConditionalGenerationPolicy"),
}
|
|
|
|
|
|
|
|
|
|
|
|
def import_policy(policy_location: PolicyLocation) -> Policy:
    """
    Dynamically import a Policy class based on the policy location.

    Args:
        policy_location (PolicyLocation): The file name and class name of the policy to load

    Return:
        The attribute named ``policy_location.class_name`` looked up on the module
        ``colossalai.shardformer.policies.<file_name>``. Note that this is the policy
        class itself, not an instance; callers instantiate it.

    Raises:
        ImportError: if the policy module cannot be imported
        AttributeError: if the module does not define the requested class
    """
    # Import lazily so that only the model library needed by this policy is loaded.
    module_name = f"colossalai.shardformer.policies.{policy_location.file_name}"
    module = importlib.import_module(module_name)
    return getattr(module, policy_location.class_name)
|
2023-06-13 06:44:40 +00:00
|
|
|
|
2023-06-07 08:09:40 +00:00
|
|
|
|
2023-06-19 05:53:17 +00:00
|
|
|
def _fullname(obj):
|
|
|
|
"""
|
|
|
|
Return the full name of an object, including the module name.
|
|
|
|
"""
|
|
|
|
klass = obj.__class__
|
|
|
|
module = klass.__module__
|
|
|
|
if module == 'builtins':
|
|
|
|
return klass.__qualname__ # avoid outputs like 'builtins.str'
|
|
|
|
return module + '.' + klass.__qualname__
|
2023-05-22 07:02:17 +00:00
|
|
|
|
2023-05-24 02:26:46 +00:00
|
|
|
|
2023-06-15 09:55:42 +00:00
|
|
|
def get_autopolicy(model: nn.Module) -> Policy:
    r"""
    Return the auto policy for the model

    Args:
        model (:class:`nn.Module`): The model to get the auto policy

    Return:
        :class:`Policy`: The auto policy for the model

    Raises:
        NotImplementedError: if the fully qualified class name of ``model`` has no
            entry in ``_POLICY_LIST``
    """
    # The registry is keyed by "<module>.<qualname>" of the model's class.
    full_name = _fullname(model)
    policy_location = _POLICY_LIST.get(full_name)

    if policy_location is None:
        raise NotImplementedError(
            f"Auto policy for {model.__class__.__qualname__} is not implemented.\n"
            f"Supported models are {list(_POLICY_LIST)}")

    # import_policy hands back the policy class; instantiate it for the caller.
    policy_cls = import_policy(policy_location)
    return policy_cls()
|