diff --git a/internlm/solver/optimizer/hybrid_zero_optim.py b/internlm/solver/optimizer/hybrid_zero_optim.py
index 8b63fa0..6f983f3 100644
--- a/internlm/solver/optimizer/hybrid_zero_optim.py
+++ b/internlm/solver/optimizer/hybrid_zero_optim.py
@@ -856,6 +856,9 @@ class HybridZeroOptimizer(BaseOptimizer):
         for handle in handles:
             handle.wait()
 
+        # Block the host until all queued CUDA work on the current device has completed.
+        torch.cuda.synchronize()
+
     ##################
     # FP16 Utilities #
     ##################