From ef9e7cc6221823a610e3a9b0c369745d7f1e1f71 Mon Sep 17 00:00:00 2001
From: yingtongxiong <974106207@qq.com>
Date: Mon, 9 Oct 2023 20:05:39 +0800
Subject: [PATCH] modify the config

---
 configs/7B_sft.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/configs/7B_sft.py b/configs/7B_sft.py
index dd4104a..4c55fee 100644
--- a/configs/7B_sft.py
+++ b/configs/7B_sft.py
@@ -154,8 +154,8 @@ pipeline parallel (dict):
 tensor parallel: tensor parallel size, usually the number of GPUs per node.
 """
 parallel = dict(
-    zero1=-1,
-    tensor=dict(size=2, mode='origin_tp'), # the mode should be 'origin_tp' or 'fstp'. if the mode is 'fstp', the sequence_parallel should be True
+    zero1=8,
+    tensor=dict(size=1, mode='origin_tp'), # the mode should be 'origin_tp' or 'fstp'. if the mode is 'fstp', the sequence_parallel should be True
     pipeline=dict(size=1, interleaved_overlap=True),
     sequence_parallel=False,
 )