# Source: ColossalAI/examples/language/roberta/configs/colossalai_ddp.py (5 lines, 128 B, Python)

from colossalai.zero.shard_utils import TensorShardStrategy
from colossalai.nn.optimizer import FusedAdam
# Module-level configuration value `clip_grad_norm`, fixed at 1.0.
# NOTE(review): presumably the maximum gradient norm used for gradient
# clipping by whatever loads this config file — confirm against the consumer.
clip_grad_norm = 1.0