pull/6071/head
wangbluo 2024-10-15 13:28:33 +08:00
parent fd92789af2
commit bc7eeade33
1 changed file with 0 additions and 1 deletion

@@ -857,7 +857,6 @@ def get_gpt2_flash_attention_forward(shard_config: Optional[ShardConfig] = None)
         dropout_p = self.attn_dropout.p if self.training else 0.0
         sp_mode = shard_config.sequence_parallelism_mode
-        shard_config.sequence_parallel_process_group
         if sp_mode == "ring_attn":
             attn_output = RingAttention.attention(
                 query,
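
The deleted line is a bare attribute access: it reads shard_config.sequence_parallel_process_group and discards the result, so removing it changes no behavior. A minimal sketch (with a hypothetical stand-in class, not ColossalAI's actual ShardConfig) illustrates the difference between the no-op form and a binding the surrounding code could actually use:

    from dataclasses import dataclass

    @dataclass
    class ShardConfig:  # hypothetical stand-in for colossalai's ShardConfig
        sequence_parallelism_mode: str = "ring_attn"
        sequence_parallel_process_group: object = None  # a torch.distributed group in practice

    cfg = ShardConfig()
    cfg.sequence_parallel_process_group              # no-op: value is evaluated, then dropped
    sp_group = cfg.sequence_parallel_process_group   # useful form: bind it before passing it on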