From 9ca4b6f1177e7edc7ba50f78b0c5123be0476c18 Mon Sep 17 00:00:00 2001 From: "A. Unique TensorFlower" Date: Thu, 27 Feb 2020 13:16:10 -0800 Subject: [PATCH] We don't save event.name, in order to save memory. Therefore we need to fill in the event name (from the event type) when we flush out XEvents. PiperOrigin-RevId: 297670929 Change-Id: Ib1e611229cf56f8e1eab08249853ec881480d3b9 --- .../core/profiler/internal/gpu/device_tracer.cc | 14 ++++++++------ 1 file changed, 8 insertions(+), 6 deletions(-) diff --git a/tensorflow/core/profiler/internal/gpu/device_tracer.cc b/tensorflow/core/profiler/internal/gpu/device_tracer.cc index 9494c6fe233..6b59675481e 100644 --- a/tensorflow/core/profiler/internal/gpu/device_tracer.cc +++ b/tensorflow/core/profiler/internal/gpu/device_tracer.cc @@ -65,6 +65,9 @@ void CreateXEvent(const CuptiTracerEvent& event, XPlaneBuilder* plane, return; } std::string kernel_name = port::MaybeAbiDemangle(event.name.c_str()); + if (kernel_name.empty()) { + kernel_name = GetTraceEventTypeName(event.type); + } XEventMetadata* event_metadata = plane->GetOrCreateEventMetadata(kernel_name); XEventBuilder xevent = line->AddEvent(*event_metadata); xevent.SetTimestampNs(event.start_time_ns); @@ -95,12 +98,11 @@ void CreateXEvent(const CuptiTracerEvent& event, XPlaneBuilder* plane, xevent.AddStatValue(*plane->GetOrCreateStatMetadata( GetStatTypeStr(StatType::kKernelDetails)), kernel_details); - } - if (event.type == CuptiTracerEventType::MemcpyH2D || - event.type == CuptiTracerEventType::MemcpyD2H || - event.type == CuptiTracerEventType::MemcpyD2D || - event.type == CuptiTracerEventType::MemcpyP2P || - event.type == CuptiTracerEventType::MemcpyOther) { + } else if (event.type == CuptiTracerEventType::MemcpyH2D || + event.type == CuptiTracerEventType::MemcpyD2H || + event.type == CuptiTracerEventType::MemcpyD2D || + event.type == CuptiTracerEventType::MemcpyP2P || + event.type == CuptiTracerEventType::MemcpyOther) { const auto& memcpy_info = event.memcpy_info; std::string memcpy_details = 
absl::StrFormat("size:%u dest:%u async:%u", memcpy_info.num_bytes,