mirror of https://github.com/hpcaitech/ColossalAI
remove duplicate import (#5100)
parent e53e729d8e
commit 68fcaa2225
@@ -413,8 +413,6 @@ def get_llama_flash_attention_forward():
         warnings.warn("using llamav1, llamav1 hasn't repeat_kv function")
         llama_version = 1
 
-    from colossalai.kernel.cuda_native import AttnMaskType, ColoAttention
-
     def forward(
         self: LlamaAttention,
         hidden_states: torch.Tensor,
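For context, a minimal sketch of how the surrounding function likely reads after this change. Only the lines visible in the hunk above are taken from the commit; the try/except structure, the llama_version default of 2, and the final return are assumptions about the surrounding code, not verbatim repository contents.

    import warnings

    import torch


    def get_llama_flash_attention_forward():
        from transformers.models.llama.modeling_llama import LlamaAttention

        # The single remaining import; the commit removes a second,
        # duplicate occurrence of this line further down in the function.
        from colossalai.kernel.cuda_native import AttnMaskType, ColoAttention

        llama_version = 2  # assumed default; the diff only shows the v1 fallback
        try:
            # repeat_kv exists only in the Llama-2-era modeling code,
            # so its absence is used to detect Llama v1 (assumed check).
            from transformers.models.llama.modeling_llama import repeat_kv
        except ImportError:
            warnings.warn("using llamav1, llamav1 hasn't repeat_kv function")
            llama_version = 1

        def forward(
            self: LlamaAttention,
            hidden_states: torch.Tensor,
            # ... remaining parameters elided in the diff ...
        ):
            ...

        return forward  # assumed: the wrapper hands back the patched forward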