From 40cd0a047d4d8d8277d3264556c9c3d0813639b8 Mon Sep 17 00:00:00 2001
From: "A. Unique TensorFlower"
Date: Tue, 8 Dec 2020 04:12:37 -0800
Subject: [PATCH] [MLIR][KernelGen] Fix performance discrepancy for `logical_not` kernel

Loads and stores are not successfully vectorized.
Disable loop unrolling to increase parallelism.

PiperOrigin-RevId: 346293461
Change-Id: Ibfc360360eacc66c570ea990580fccfedac8c1de
---
 tensorflow/core/kernels/mlir_generated/BUILD | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/tensorflow/core/kernels/mlir_generated/BUILD b/tensorflow/core/kernels/mlir_generated/BUILD
index 047782f5ff9..a5330021500 100644
--- a/tensorflow/core/kernels/mlir_generated/BUILD
+++ b/tensorflow/core/kernels/mlir_generated/BUILD
@@ -289,7 +289,7 @@ gen_kernel_library(
     generate_unranked = True,
     tile_size = "256",
     types = ["i1"],
-    unroll_factors = "4",
+    unroll_factors = "1",
 )
 
 gen_kernel_library(