Browse Source

[fix] fix test_shard_llama

pull/6083/head
duanjunwen 4 weeks ago
parent
commit
cc0dfddcbc
  1. 38
      colossalai/shardformer/policies/llama.py
  2. 1
      examples/language/llama/benchmark.py
  3. 4
      tests/test_pipeline/test_schedule/test_zerobubble_pp.py

38
colossalai/shardformer/policies/llama.py

@ -394,8 +394,8 @@ class LlamaForCausalLMPolicy(LlamaPolicy):
return held_layers
def get_shared_params(self) -> List[Dict[int, Tensor]]:
# if self.pipeline_stage_manager is not None and self.pipeline_stage_manager.use_zbv:
# return []
if self.pipeline_stage_manager is not None and self.pipeline_stage_manager.use_zbv:
return []
llama_model = self.model.model
if self.pipeline_stage_manager and self.pipeline_stage_manager.num_stages > 1:
if (
@ -403,20 +403,26 @@ class LlamaForCausalLMPolicy(LlamaPolicy):
and self.pipeline_stage_manager.num_stages > 1
):
# tie weights
if self.pipeline_stage_manager.use_zbv:
return [
{
0: llama_model.embed_tokens.weight,
0: self.model.lm_head.weight,
}
]
else:
return [
{
0: llama_model.embed_tokens.weight,
self.pipeline_stage_manager.num_stages - 1: self.model.lm_head.weight,
}
]
return [
{
0: llama_model.embed_tokens.weight,
self.pipeline_stage_manager.num_stages - 1: self.model.lm_head.weight,
}
]
# if self.pipeline_stage_manager.use_zbv:
# return [
# {
# 0: llama_model.embed_tokens.weight,
# 0: self.model.lm_head.weight,
# }
# ]
# else:
# return [
# {
# 0: llama_model.embed_tokens.weight,
# self.pipeline_stage_manager.num_stages - 1: self.model.lm_head.weight,
# }
# ]
return []

1
examples/language/llama/benchmark.py

@ -237,7 +237,6 @@ def main():
).get_v_schedule()
else:
scheduler_nodes = None
# print(f"{dist.get_rank()} {scheduler_nodes[]} ")
plugin = HybridParallelPlugin(
tp_size=args.tp,

4
tests/test_pipeline/test_schedule/test_zerobubble_pp.py

@ -923,9 +923,9 @@ def run_with_booster_moehybridplugin(config: Tuple[int, ...]):
@parameterize(
"config",
[
# (1, 2, 2, 1), # Pass
(1, 2, 2, 1), # Pass
# TODO: only supports pp + tp acceleration; will support fully-pp and no-tp hybrid in the future;
(0, 4, 1, 1),
# (0, 4, 1, 1),
# (1, 2, 1, 2),
# (1, 1, 2, 2),
],

Loading…
Cancel
Save