# Configuration constants, one assignment per line.
# NOTE(review): the code that reads these values is not visible from this
# file; the per-setting notes below are inferred from the names only and
# should be confirmed against the consumer.

# presumably the number of tokens per input sequence -- TODO confirm
SEQ_LENGTH = 1024

# presumably the number of samples per batch -- TODO confirm whether this is
# per device or global
BATCH_SIZE = 4

# presumably the number of passes over the training data -- TODO confirm
NUM_EPOCHS = 4

# presumably the tensor-parallel degree -- TODO confirm
TPDEGREE = 2

# boolean switch; looks like it toggles sharded initialization -- TODO confirm
USE_SHARD_INIT = False

# placement target given as a string; the set of accepted values is defined
# by the consumer -- verify before changing
placement = 'cpu'