# Python dependencies in pip requirements-file format, one requirement per line.
# Most entries are pinned to an exact version (==); a few carry only range
# bounds or no version constraint at all, as noted on the lines below.
# NOTE(review): entry order is kept as-is; whether any package's build relies on
# an earlier entry already being installed is not visible here - confirm before
# reordering.
# torch: any release >=1.12.1 and strictly below 2.0.0.
torch<2.0.0, >=1.12.1
packaging==23.1
colossalai==0.3.2
autoflake==2.2.1
black==23.9.1
# NOTE(review): transformers is unconstrained, so the installed version can
# change between installs; consider pinning it like the entries above.
transformers
tensorboard==2.14.0
six==1.16.0
# NOTE(review): datasets is unconstrained as well; consider pinning.
datasets
ninja==1.11.1
# flash-attn: inclusive range 2.0.0 through 2.0.5.
flash-attn>=2.0.0,<=2.0.5
# NOTE(review): tqdm is unconstrained as well; consider pinning.
tqdm
sentencepiece==0.1.99
# protobuf: upper bound only (<=3.20.0); the reason for the cap is not recorded
# in this file - TODO confirm which dependency requires it.
protobuf<=3.20.0