diff --git a/colossalai/kernel/triton/__init__.py b/colossalai/kernel/triton/__init__.py index 8d41dff13..82a922650 100644 --- a/colossalai/kernel/triton/__init__.py +++ b/colossalai/kernel/triton/__init__.py @@ -11,7 +11,6 @@ if HAS_TRITON: from .context_attn_unpad import context_attention_unpadded from .flash_decoding import flash_decoding_attention from .fused_rotary_embedding import fused_rotary_embedding - from .gptq_triton import gptq_fused_linear_triton from .kvcache_copy import copy_kv_to_blocked_cache from .no_pad_rotary_embedding import decoding_fused_rotary_embedding, rotary_embedding from .rms_layernorm import rms_layernorm @@ -24,7 +23,6 @@ if HAS_TRITON: "copy_kv_to_blocked_cache", "softmax", "rms_layernorm", - "gptq_fused_linear_triton", "rotary_embedding", "fused_rotary_embedding", "get_xine_cache",