revert 7b config

pull/306/head
mwiacx 2023-09-13 17:03:30 +08:00
parent 244290c16d
commit 07ee22dbd6
1 changed file with 2 additions and 2 deletions

View File

@@ -150,8 +150,8 @@ pipeline parallel (dict):
tensor parallel: tensor parallel size, usually the number of GPUs per node.
"""
parallel = dict(
- zero1=-1,
- pipeline=dict(size=2, interleaved_overlap=True),
+ zero1=8,
+ pipeline=dict(size=1, interleaved_overlap=True),
sequence_parallel=False,
)