# DISTPLAN in ["colossalai", "zero1", "zero2", "torch_ddp", "torch_zero"]
export DISTPLAN=${DISTPLAN:-"colossalai"}

# The following options are only valid when DISTPLAN="colossalai"
export GPUNUM=${GPUNUM:-1}
export TPDEGREE=${TPDEGREE:-1}
export PLACEMENT=${PLACEMENT:-"cpu"}
export USE_SHARD_INIT=${USE_SHARD_INIT:-False}
export BATCH_SIZE=${BATCH_SIZE:-16}
export MODEL_TYPE=${MODEL_TYPE:-"gpt2_medium"}
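# Example override of the colossalai-specific options above (hypothetical values,
# shown only as a sketch; "./run.sh" stands in for this script's actual path):
#   GPUNUM=4 TPDEGREE=2 PLACEMENT="cpu" USE_SHARD_INIT=True bash ./run.sh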
mkdir -p logs
torchrun --standalone --nproc_per_node=${GPUNUM} train_gpt_demo.py \
  --tp_degree=${TPDEGREE} \
  --model_type=${MODEL_TYPE} \
  --batch_size=${BATCH_SIZE} \
  --placement ${PLACEMENT} \
  --shardinit ${USE_SHARD_INIT} \
  --distplan ${DISTPLAN} \
  2>&1 | tee ./logs/${MODEL_TYPE}_${DISTPLAN}_gpu_${GPUNUM}_bs_${BATCH_SIZE}_tp_${TPDEGREE}.log
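# Example usage (a sketch, not part of the upstream script; "./run.sh" is a
# placeholder for this file's actual name): switch to a different distributed plan,
# e.g. ZeRO-2, by overriding the environment variable at invocation time:
#   DISTPLAN="zero2" bash ./run.sh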