add zero broadcast_sync

2023-10-26 16:27:03 +08:00 · 2023-10-26 16:27:03 +08:00 · 15ff413362
parent 3c992a2101
commit 15ff413362
1 changed file with 3 additions and 0 deletions
--- a/internlm/solver/optimizer/hybrid_zero_optim.py
+++ b/internlm/solver/optimizer/hybrid_zero_optim.py
@@ -710,6 +710,9 @@ class HybridZeroOptimizer(BaseOptimizer):
        with torch.cuda.stream(self._comm_bcast_stream):
            self.broadcast_params()

+        if not self._overlap_sync_param:
+            torch.cuda.synchronize()
+
        timer("step").stop()

        # update gradients may not be needed here, because the sync_params function is used in initialization,