mirror of https://github.com/InternLM/InternLM
fix groups_norms computation in hybrid_zero_optim
parent
2ad5f512b5
commit
7ca5da27e8
|
@@ -574,6 +574,9 @@ class HybridZeroOptimizer(BaseOptimizer):
|
||||||
# compute norm for gradients in the before bucket
|
# compute norm for gradients in the before bucket
|
||||||
groups_norms = []
|
groups_norms = []
|
||||||
for group_id in range(self.num_param_groups):
|
for group_id in range(self.num_param_groups):
|
||||||
|
if self._is_moe_group(self.optim.param_groups[group_id]):
|
||||||
|
groups_norms.append([])
|
||||||
|
else:
|
||||||
groups_norms.append(self._compute_norm_with_stage(group_id=group_id))
|
groups_norms.append(self._compute_norm_with_stage(group_id=group_id))
|
||||||
|
|
||||||
# clear reduced grads
|
# clear reduced grads
|
||||||
|
|
Loading…
Reference in New Issue