From 97f7450efffcad4b5b96e27b7dd7e4a078ef15ce Mon Sep 17 00:00:00 2001
From: Alex Stark
Date: Tue, 3 Sep 2019 12:53:28 -0700
Subject: [PATCH] Add profiling label to multithreaded conv.

PiperOrigin-RevId: 266992949
---
 .../lite/kernels/internal/optimized/multithreaded_conv.h | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/tensorflow/lite/kernels/internal/optimized/multithreaded_conv.h b/tensorflow/lite/kernels/internal/optimized/multithreaded_conv.h
index c4796acb432..0119dfff7c5 100644
--- a/tensorflow/lite/kernels/internal/optimized/multithreaded_conv.h
+++ b/tensorflow/lite/kernels/internal/optimized/multithreaded_conv.h
@@ -139,6 +139,10 @@ inline void Conv(const Eigen::ThreadPoolDevice& device,
                  const float* bias_data, const RuntimeShape& output_shape,
                  float* output_data, const RuntimeShape& im2col_shape,
                  float* im2col_data) {
+  // Nest profiling under "Conv", to aggregate with other kernels.
+  gemmlowp::ScopedProfilingLabel label("Conv");
+  gemmlowp::ScopedProfilingLabel inner_label("Multithreaded EigenTensor");
+
   // im2col data should not be generated for the multi-thread supporting case.
   TFLITE_DCHECK(!im2col_data);
   (void)im2col_shape;