refactor code for logging

pull/182/head
Wenwen Qu 2023-09-22 14:14:58 +08:00
parent 3607548265
commit 9e6e7986b6
2 changed files with 5 additions and 5 deletions


@@ -364,6 +364,11 @@ def launch(
             f"data parallel size: {gpc.data_parallel_size}, pipeline parallel size: {gpc.pipeline_parallel_size}, "
             f"tensor parallel size: {gpc.tensor_parallel_size}",
         )
+        logger.info(
+            f"Creating MoE with num_experts: {gpc.config.model.num_experts} | "
+            f"expert parallel size: {gpc.expert_parallel_size} | "
+            f"number of local experts: {gpc.config.model.num_experts//gpc.expert_parallel_size}"
+        )


 def launch_from_slurm(


@@ -69,11 +69,6 @@ class MoE(torch.nn.Module):
         self.num_experts = num_experts
         self.num_local_experts = num_experts // self.ep_size
-        if gpc.is_rank_for_log():
-            logger.info(  # pylint: disable=W1203
-                f"Creating MoE layer with num_experts: {num_experts} | num_local_experts:"
-                f"{self.num_local_experts} | expert_parallel_size: {self.ep_size}"
-            )
         assert noisy_gate_policy is None or noisy_gate_policy in ["None", "Jitter", "RSample"], (
             "Unsupported noisy_gate_policy: " + noisy_gate_policy
         )
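
The net effect of this commit is that the MoE summary is logged once at launch time instead of once per MoE layer at construction. A minimal standalone sketch of the quantities the new log line reports, with the gpc.* lookups from the diff replaced by plain variables (the values here are hypothetical, assuming num_experts divides evenly across expert-parallel ranks):

    # Hypothetical standalone sketch -- not the repository's code.
    num_experts = 8            # stands in for gpc.config.model.num_experts
    expert_parallel_size = 2   # stands in for gpc.expert_parallel_size

    # Each expert-parallel rank hosts an equal slice of the experts, so the
    # division must be exact (mirrors num_experts // self.ep_size in MoE).
    assert num_experts % expert_parallel_size == 0, (
        "num_experts must be divisible by the expert parallel size"
    )
    num_local_experts = num_experts // expert_parallel_size

    print(
        f"Creating MoE with num_experts: {num_experts} | "
        f"expert parallel size: {expert_parallel_size} | "
        f"number of local experts: {num_local_experts}"
    )

With these values the sketch prints "Creating MoE with num_experts: 8 | expert parallel size: 2 | number of local experts: 4", matching the format of the log line added to launch().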