From 4644f8bc2c8fbcb6236ecb9132b6cacfd8e961da Mon Sep 17 00:00:00 2001 From: RandySheriffH <48490400+RandySheriffH@users.noreply.github.com> Date: Tue, 2 Nov 2021 14:31:39 -0700 Subject: [PATCH] refactor profiling logics (#9567) Co-authored-by: RandySheriffH --- onnxruntime/core/providers/cuda/cuda_profiler.cc | 11 +++++------ 1 file changed, 5 insertions(+), 6 deletions(-) diff --git a/onnxruntime/core/providers/cuda/cuda_profiler.cc b/onnxruntime/core/providers/cuda/cuda_profiler.cc index d7258313c0..de9cbcc09f 100644 --- a/onnxruntime/core/providers/cuda/cuda_profiler.cc +++ b/onnxruntime/core/providers/cuda/cuda_profiler.cc @@ -126,7 +126,7 @@ void CudaProfiler::EndProfiling(TimePoint start_time, Events& events) { {"block_y", std::to_string(stat.block_y_)}, {"block_z", std::to_string(stat.block_z_)}}; EventRecord event{ - KEVENT, -1, -1, stat.name_, DUR(profiling_start, stat.stop_), DUR(stat.start_, stat.stop_), {args.begin(), args.end()}}; + KEVENT, -1, -1, stat.name_, DUR(profiling_start, stat.start_), DUR(stat.start_, stat.stop_), {args.begin(), args.end()}}; auto ts = id_map[stat.correlation_id]; if (event_map.find(ts) == event_map.end()) { event_map.insert({ts, {event}}); @@ -140,15 +140,14 @@ void CudaProfiler::EndProfiling(TimePoint start_time, Events& events) { while (insert_iter != events.end() && insert_iter->ts < ts) { insert_iter++; } - if (insert_iter != events.end() && insert_iter != events.begin() && insert_iter->ts > ts) { - insert_iter--; - } if (insert_iter != events.end() && insert_iter->ts == ts) { for (auto& evt_iter : map_iter.second) { evt_iter.args["op_name"] = insert_iter->args["op_name"]; } + insert_iter = events.insert(insert_iter+1, map_iter.second.begin(), map_iter.second.end()); + } else { + insert_iter = events.insert(insert_iter, map_iter.second.begin(), map_iter.second.end()); } - insert_iter = events.insert(insert_iter, map_iter.second.begin(), map_iter.second.end()); while (insert_iter != events.end() && insert_iter->cat == EventCategory::KERNEL_EVENT) { insert_iter++; } @@ -212,4 +211,4 @@ void CudaProfiler::Clear() {} } // namespace profiling } // namespace onnxruntime -#endif \ No newline at end of file +#endif