from .cuda_native import FusedScaleMaskSoftmax, LayerNorm, MultiHeadAttention try: from colossalai._C import fused_optim except: from colossalai.kernel.op_builder.fused_optim import FusedOptimBuilder fused_optim = FusedOptimBuilder().load() try: from colossalai._C import cpu_optim except ImportError: from colossalai.kernel.op_builder import CPUAdamBuilder cpu_optim = CPUAdamBuilder().load() try: from colossalai._C import multihead_attention except ImportError: from colossalai.kernel.op_builder import MultiHeadAttnBuilder multihead_attention = MultiHeadAttnBuilder().load() try: from colossalai._C import scaled_upper_triang_masked_softmax except ImportError: from colossalai.kernel.op_builder import ScaledSoftmaxBuilder scaled_upper_triang_masked_softmax = ScaledSoftmaxBuilder().load() try: from colossalai._C import moe except ImportError: from colossalai.kernel.op_builder import MOEBuilder moe = MOEBuilder().load() __all__ = [ "fused_optim", "cpu_optim", "multihead_attention", "moe", "LayerNorm", "FusedScaleMaskSoftmax", "MultiHeadAttention", "scaled_upper_triang_masked_softmax", ]