diff --git a/configs/7B_sft.py b/configs/7B_sft.py index 14a10a3..c6c5d79 100644 --- a/configs/7B_sft.py +++ b/configs/7B_sft.py @@ -150,7 +150,6 @@ parallel = dict( tensor=1, pipeline=dict(size=1, interleaved_overlap=True), sequence_parallel=False, - expert=2, ) cudnn_deterministic = False @@ -163,4 +162,4 @@ monitor = dict( feishu_alert_address=None, # feishu webhook to send alert message light_monitor_address=None, # light_monitor address to send heartbeat ), -) +) \ No newline at end of file