mirror of https://github.com/hpcaitech/ColossalAI
[shardformer] ChatGLM support layernorm sharding
parent
00f6ef159d
commit
f155ae89c4
|
@ -417,7 +417,7 @@ class SelfAttention(torch.nn.Module):
|
||||||
)
|
)
|
||||||
=======
|
=======
|
||||||
self.dense = nn.Linear(self.projection_size,
|
self.dense = nn.Linear(self.projection_size,
|
||||||
self.hidden_size,
|
config.hidden_size,
|
||||||
bias=config.add_bias_linear,
|
bias=config.add_bias_linear,
|
||||||
device=device,
|
device=device,
|
||||||
**_config_to_kwargs(config))
|
**_config_to_kwargs(config))
|
||||||
|
|
Loading…
Reference in New Issue