mirror of https://github.com/InternLM/InternLM
fix(utils): disable bench_net in gputest.py (#421)
parent
4b5bdedff2
commit
3ea94f2e2a
|
@@ -39,7 +39,9 @@ def empty_cache_and_diag(batch_count, interval=50):
|
||||||
with torch.no_grad():
|
with torch.no_grad():
|
||||||
timer_diagnosis()
|
timer_diagnosis()
|
||||||
bench_gpu()
|
bench_gpu()
|
||||||
bench_net()
|
# FIXME: Runtime benchmark diagnosis can easily cause the training process
|
||||||
|
# to exit due to NCCL errors.
|
||||||
|
# bench_net()
|
||||||
# do empty_cache after the bench
|
# do empty_cache after the bench
|
||||||
torch.cuda.empty_cache()
|
torch.cuda.empty_cache()
|
||||||
# do garbage collection
|
# do garbage collection
|
||||||
|
|
Loading…
Reference in New Issue