[profiler] Fixed bugs in CommProfiler and PcieProfiler (#377)

pull/394/head
HELSON 2022-03-10 17:54:55 +08:00 committed by Frank Lee
parent b5f43acee3
commit 8c18eb0998
2 changed files with 5 additions and 3 deletions

View File

@ -140,7 +140,7 @@ class CommProfiler(BaseProfiler):
kernel_name, code_location, vol = self.pending_metadata
self.profiler.__exit__(None, None, None)
if self.profiler.enabled:
if self.profiler.enabled and dist.get_world_size(group) > 1:
assert_flag = 0
current_comm_event = None
events = self.profiler.function_events

View File

@ -80,8 +80,10 @@ class PcieProfiler(BaseProfiler):
events = self.profiler.function_events
for event in events:
if event.name == "aten::_to_copy":
current_comm_event = PcieEvent(1, self.data_size * _get_numel(event.input_shapes[0]),
event.cuda_time_total)
t_shape = event.input_shapes[0]
if len(t_shape) == 0 or event.cuda_time_total == 0:
continue
current_comm_event = PcieEvent(1, self.data_size * _get_numel(t_shape), event.cuda_time_total)
self.total_count += current_comm_event.count
self.total_pcie_vol += current_comm_event.pcie_vol
self.total_cuda_time += current_comm_event.cuda_time