# mirror of https://github.com/hpcaitech/ColossalAI
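# Benchmark sweep for Meta's OPT models: runs opt_benchmark.py under several
# Colossal-AI booster plugins, batch sizes, and GPU counts.
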
set -xe

pip install -r requirements.txt
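
# Defaults for a single run; the loops below override BS and GPUNUM.
# MEMCAP=0 presumably leaves GPU memory uncapped.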
export BS=32
export MEMCAP=0
export GPUNUM=1

# acceptable values include `125m`, `350m`, `1.3b`, `2.7b`, `6.7b`, `13b`, `30b`, `66b`
export MODEL="125m"

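# Full sweep: 3 batch sizes x 4 plugins x 2 GPU counts = 24 runs per model size.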
for BS in 8 32 128
do
for PLUGIN in "torch_ddp" "torch_ddp_fp16" "low_level_zero" "gemini"
do
for GPUNUM in 1 4
do

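# Hugging Face Hub id for the chosen OPT size, e.g. facebook/opt-125m.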
MODEL_PATH="facebook/opt-${MODEL}"
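# colossalai run is Colossal-AI's torchrun-style launcher: it spawns
# ${GPUNUM} worker processes that rendezvous on the given master port.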
colossalai run \
    --nproc_per_node ${GPUNUM} \
    --master_port 29505 \
    opt_benchmark.py \
    --model_name_or_path ${MODEL_PATH} \
    --mem_cap ${MEMCAP} \
    --plugin ${PLUGIN} \
    --batch_size ${BS}

done
done
done
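
# Usage sketch (assuming this file is saved as benchmark.sh alongside
# opt_benchmark.py and requirements.txt):
#   bash benchmark.sh 2>&1 | tee benchmark.log
# With `set -xe`, each expanded command is echoed and the sweep aborts on the
# first failing configuration.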