From 78f6d51b8d9a2f3542918f004a29a6fbba232a40 Mon Sep 17 00:00:00 2001
From: Adrian Kuegel
Date: Thu, 18 Jun 2020 05:26:02 -0700
Subject: [PATCH] Also set the unroll factor in the C++ integration code for tanh.

PiperOrigin-RevId: 317083225
Change-Id: I7c2c26d664c15cbc967188da4b3012161edbcf49
---
 tensorflow/core/kernels/mlir_generated_cwise_op_gpu_tanh.cu.cc | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tensorflow/core/kernels/mlir_generated_cwise_op_gpu_tanh.cu.cc b/tensorflow/core/kernels/mlir_generated_cwise_op_gpu_tanh.cu.cc
index 70de777239f..a122c5112e6 100644
--- a/tensorflow/core/kernels/mlir_generated_cwise_op_gpu_tanh.cu.cc
+++ b/tensorflow/core/kernels/mlir_generated_cwise_op_gpu_tanh.cu.cc
@@ -124,7 +124,7 @@ class MlirGeneratedTanhOp : public OpKernel {
     // This has to be aligned with the configuration that was used when building
     // the kernels. See the corresponding build rules in `cubin_headers/BUILD`.
     LaunchConfig config = GetLaunchConfiguration(
-        {256}, {}, {static_cast(inp.NumElements())});
+        {256}, {4}, {static_cast(inp.NumElements())});
     OP_REQUIRES_OK(
         ctx, stream->parent()->Launch(stream, config.threadDim, config.blockDim,
                                       *kernel, args));