diff --git a/tensorflow/core/platform/default/device_tracer.cc b/tensorflow/core/platform/default/device_tracer.cc index 162b339c584..e4c286bf8f9 100644 --- a/tensorflow/core/platform/default/device_tracer.cc +++ b/tensorflow/core/platform/default/device_tracer.cc @@ -175,18 +175,15 @@ class CuptiCallbackHook { Status Enable(CudaEventRecorder* recorder) { TF_RETURN_IF_ERROR( ToStatus(cuptiSubscribe(&subscriber_, &CuptiCallback, recorder))); - for (auto cbid : - {CUPTI_DRIVER_TRACE_CBID_cuLaunchKernel, - CUPTI_DRIVER_TRACE_CBID_cuLaunchCooperativeKernelMultiDevice, - CUPTI_DRIVER_TRACE_CBID_cuLaunchCooperativeKernel, - CUPTI_DRIVER_TRACE_CBID_cuMemcpy, - CUPTI_DRIVER_TRACE_CBID_cuMemcpyAsync, - CUPTI_DRIVER_TRACE_CBID_cuMemcpyHtoD_v2, - CUPTI_DRIVER_TRACE_CBID_cuMemcpyHtoDAsync_v2, - CUPTI_DRIVER_TRACE_CBID_cuMemcpyDtoH_v2, - CUPTI_DRIVER_TRACE_CBID_cuMemcpyDtoHAsync_v2, - CUPTI_DRIVER_TRACE_CBID_cuMemcpyDtoD_v2, - CUPTI_DRIVER_TRACE_CBID_cuMemcpyDtoDAsync_v2}) { + for (auto cbid : {CUPTI_DRIVER_TRACE_CBID_cuLaunchKernel, + CUPTI_DRIVER_TRACE_CBID_cuMemcpy, + CUPTI_DRIVER_TRACE_CBID_cuMemcpyAsync, + CUPTI_DRIVER_TRACE_CBID_cuMemcpyHtoD_v2, + CUPTI_DRIVER_TRACE_CBID_cuMemcpyHtoDAsync_v2, + CUPTI_DRIVER_TRACE_CBID_cuMemcpyDtoH_v2, + CUPTI_DRIVER_TRACE_CBID_cuMemcpyDtoHAsync_v2, + CUPTI_DRIVER_TRACE_CBID_cuMemcpyDtoD_v2, + CUPTI_DRIVER_TRACE_CBID_cuMemcpyDtoDAsync_v2}) { TF_RETURN_IF_ERROR(ToStatus(cuptiEnableCallback( /*enable=*/1, subscriber_, CUPTI_CB_DOMAIN_DRIVER_API, cbid))); } @@ -244,11 +241,7 @@ class CuptiCallbackHook { const CUpti_CallbackData& cbdata, CudaEventRecorder* recorder) { switch (cbid) { - case CUPTI_DRIVER_TRACE_CBID_cuLaunchKernel: - TF_FALLTHROUGH_INTENDED; - case CUPTI_DRIVER_TRACE_CBID_cuLaunchCooperativeKernelMultiDevice: - TF_FALLTHROUGH_INTENDED; - case CUPTI_DRIVER_TRACE_CBID_cuLaunchCooperativeKernel: { + case CUPTI_DRIVER_TRACE_CBID_cuLaunchKernel: { DCHECK_NE(cbdata.symbolName, nullptr); auto params = static_cast(cbdata.functionParams);