mirror of https://github.com/InternLM/InternLM
make seed in different tensor rank different (#405)
parent
8b65e2e3c4
commit
9aef11e89c
|
@@ -568,7 +568,8 @@ class ParallelContext(metaclass=SingletonMeta):
|
|||
# during model construction), this is because the random state will be different in different tensor parallel
|
||||
# device of the same data parallel group. The underlying reason is that the device of tp_rank = 0 will perform
|
||||
# additional random operations during the RowParallelLinear module building process.
|
||||
- set_mode(ParallelMode.DUMMY)
|
||||
+ # set_mode(ParallelMode.DUMMY)
|
||||
+ set_mode(ParallelMode.TENSOR)
|
||||
|
||||
seeds = get_seeds()
|
||||
seed_str = ", ".join([f"{k}: {v}" for k, v in seeds.items()])
|
||||
|
|
Loading…
Reference in New Issue