Fix spatial dimension reference in conv padding legalization.

Padding legalization is run after the GpuConvRewriter pass, which in the case of backward input convolution will swap input spatial dimension numbers with output spatial dimension numbers. This was not taken into account in the GpuConvPaddingLegalization pass. PiperOrigin-RevId: 332421264 Change-Id: I3bcfd8fc63c9ec3f3b28b19921f0546f578ae7c6
2020-09-18 03:42:46 -07:00 · 2020-09-18 03:42:46 -07:00 · 3ab5dca2e6
commit 3ab5dca2e6
parent ba5f4249a2
3 changed files with 125 additions and 2 deletions
--- a/tensorflow/compiler/xla/service/gpu/BUILD
+++ b/tensorflow/compiler/xla/service/gpu/BUILD
@ -1035,6 +1035,24 @@ cc_library(
    ],
 )

+tf_cc_test(
+    name = "gpu_conv_padding_legalization_test",
+    srcs = ["gpu_conv_padding_legalization_test.cc"],
+    tags = tf_cuda_tests_tags(),
+    deps = [
+        ":gpu_conv_padding_legalization",
+        ":ir_emission_utils",
+        "//tensorflow/compiler/xla:shape_util",
+        "//tensorflow/compiler/xla:test",
+        "//tensorflow/compiler/xla:xla_data_proto_cc",
+        "//tensorflow/compiler/xla/service:hlo",
+        "//tensorflow/compiler/xla/service:hlo_matchers",
+        "//tensorflow/compiler/xla/tests:hlo_test_base",
+        "//tensorflow/compiler/xla/tests:xla_internal_test_main",  # fixdeps: keep
+        "//tensorflow/core:test",
+    ],
+)
+
 cc_library(
    name = "cudnn_pad_for_convolutions",
    srcs = ["cudnn_pad_for_convolutions.cc"],
--- a/tensorflow/compiler/xla/service/gpu/gpu_conv_padding_legalization.cc
+++ b/tensorflow/compiler/xla/service/gpu/gpu_conv_padding_legalization.cc
@ -313,7 +313,11 @@ bool GpuConvPaddingLegalization::CanonicalizeBackwardInputConvolution(
                            new_backward_conv_window.mutable_dimensions(i));
    }
    // Decreasing the padding by X *increases* the size of our output by X.
-    int64 dim = backward_conv_dnums.output_spatial_dimensions(i);
+    // Note that we have swapped input spatial dimensions with output spatial
+    // dimensions to be compatible with the cuDNN API, so
+    // input_spatial_dimensions(i) gives the i-th spatial dimension of the
+    // output.
+    int64 dim = backward_conv_dnums.input_spatial_dimensions(i);
    new_backward_conv_shape.set_dimensions(
        dim, new_backward_conv_shape.dimensions(dim) +
                 std::abs(padding_low - padding_high));
@ -353,7 +357,11 @@ bool GpuConvPaddingLegalization::CanonicalizeBackwardInputConvolution(
  for (size_t i = 0; i < backward_conv->window().dimensions_size(); ++i) {
    int64 padding_low = backward_conv->window().dimensions(i).padding_low();
    int64 padding_high = backward_conv->window().dimensions(i).padding_high();
-    int64 dim = backward_conv_dnums.output_spatial_dimensions(i);
+    // Note that we have swapped input spatial dimensions with output spatial
+    // dimensions to be compatible with the cuDNN API, so
+    // input_spatial_dimensions(i) gives the i-th spatial dimension of the
+    // output.
+    int64 dim = backward_conv_dnums.input_spatial_dimensions(i);
    if (padding_low > padding_high) {
      // If the amount of low padding (of the old backward convolution) is
      // larger, we internally pad the low end of the activations and slice
--- a/tensorflow/compiler/xla/service/gpu/gpu_conv_padding_legalization_test.cc
+++ b/tensorflow/compiler/xla/service/gpu/gpu_conv_padding_legalization_test.cc
@ -0,0 +1,97 @@
+/* Copyright 2020 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#include "tensorflow/compiler/xla/service/gpu/gpu_conv_padding_legalization.h"
+
+#include "tensorflow/compiler/xla/service/gpu/ir_emission_utils.h"
+#include "tensorflow/compiler/xla/service/hlo_instruction.h"
+#include "tensorflow/compiler/xla/service/hlo_matchers.h"
+#include "tensorflow/compiler/xla/service/hlo_module.h"
+#include "tensorflow/compiler/xla/service/hlo_opcode.h"
+#include "tensorflow/compiler/xla/shape_util.h"
+#include "tensorflow/compiler/xla/test.h"
+#include "tensorflow/compiler/xla/tests/hlo_test_base.h"
+#include "tensorflow/compiler/xla/xla_data.pb.h"
+#include "tensorflow/core/platform/test.h"
+
+namespace xla {
+namespace gpu {
+namespace {
+
+namespace op = xla::testing::opcode_matchers;
+using ::testing::_;
+
+using GpuConvPaddingLegalizationTest = HloTestBase;
+
+TEST_F(GpuConvPaddingLegalizationTest, BackwardInputConvolve) {
+  auto module = ParseAndReturnVerifiedModule(R"(
+  HloModule convolution_module
+ENTRY %convolution (operand f64[2,2,2,3]{3,2,1,0}) -> (f64[2,2,4,4]{3,2,1,0}, u8[0]) {
+  %operand = f64[2,2,2,3]{3,2,1,0} parameter(0)
+  %kernel = f64[2,3,2,3]{3,2,1,0} constant(
+  {
+    { /*i0=0*/
+    { /*i1=0*/
+      { 0.29629629629629628, 0.30246913580246915, 0.30864197530864196 },
+      { 0.31481481481481483, 0.32098765432098764, 0.3271604938271605 }
+    },
+    { /*i1=1*/
+      { 0.25925925925925924, 0.26543209876543211, 0.27160493827160492 },
+      { 0.27777777777777779, 0.2839506172839506, 0.29012345679012347 }
+    },
+    { /*i1=2*/
+      { 0.22222222222222221, 0.22839506172839505, 0.23456790123456789 },
+      { 0.24074074074074073, 0.24691358024691357, 0.25308641975308643 }
+    }
+    },
+    { /*i0=1*/
+    { /*i1=0*/
+      { 0.18518518518518517, 0.19135802469135801, 0.19753086419753085 },
+      { 0.20370370370370369, 0.20987654320987653, 0.21604938271604937 }
+    },
+    { /*i1=1*/
+      { 0.14814814814814814, 0.15432098765432098, 0.16049382716049382 },
+      { 0.16666666666666666, 0.1728395061728395, 0.17901234567901234 }
+    },
+    { /*i2=2*/
+      { 0.1111111111111111, 0.11728395061728394, 0.12345679012345678 },
+      { 0.12962962962962962, 0.13580246913580246, 0.1419753086419753 }
+    }
+    }
+  })
+  %reverse = f64[2,3,2,3]{3,2,1,0} reverse(%kernel), dimensions={0,1}
+  ROOT %custom-call = (f64[2,2,4,4]{3,2,1,0}, u8[0]{0}) custom-call(f64[2,2,2,3]{3,2,1,0} %operand, f64[2,3,2,3]{3,2,1,0} %reverse), window={size=2x3 stride=2x2 pad=0_0x0_1}, dim_labels=bf01_01io->b01f, custom_call_target="__cudnn$convBackwardInput", backend_config="{\"algorithm\":\"0\",\"tensor_ops_enabled\":false,\"conv_result_scale\":1,\"activation_mode\":\"0\",\"side_input_scale\":0}"
+}
+                                               )")
+                    .ValueOrDie();
+  ASSERT_TRUE(GpuConvPaddingLegalization().Run(module.get()).ValueOrDie());
+  auto root = module->entry_computation()->root_instruction();
+  EXPECT_THAT(root,
+              op::Tuple(op::Slice(op::GetTupleElement(
+                            op::CustomCall(kCudnnConvBackwardInputCallTarget, _,
+                                           op::Reverse(op::Constant())),
+                            0)),
+                        op::GetTupleElement()));
+  auto slice = root->operand(0);
+  Shape expected_slice_shape = ShapeUtil::MakeShape(F64, {2, 2, 4, 4});
+  EXPECT_TRUE(ShapeUtil::Equal(slice->shape(), expected_slice_shape));
+  auto conv = slice->operand(0);
+  Shape expected_conv_shape = ShapeUtil::MakeShape(F64, {2, 2, 4, 5});
+  EXPECT_TRUE(ShapeUtil::Equal(conv->shape(), expected_conv_shape));
+}
+
+}  // anonymous namespace
+}  // namespace gpu
+}  // namespace xla