From 07ee22dbd62ce0e2cbf757495458b2af3a5f0416 Mon Sep 17 00:00:00 2001
From: mwiacx <759046501@qq.com>
Date: Wed, 13 Sep 2023 17:03:30 +0800
Subject: [PATCH] revert 7b config

---
 configs/7B_sft.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/configs/7B_sft.py b/configs/7B_sft.py
index 0c37495..9a866dd 100644
--- a/configs/7B_sft.py
+++ b/configs/7B_sft.py
@@ -150,8 +150,8 @@ pipeline parallel (dict):
 tensor parallel: tensor parallel size, usually the number of GPUs per node.
 """
 parallel = dict(
-    zero1=-1,
-    pipeline=dict(size=2, interleaved_overlap=True),
+    zero1=8,
+    pipeline=dict(size=1, interleaved_overlap=True),
     sequence_parallel=False,
 )