Fix argument buffer reuse for BatchNormGrad.

When scale_after_normalization is set, the kernel must not alias the gamma input with the db output, because gamma is still needed.

PiperOrigin-RevId: 237970041
2019-03-12 01:30:41 -07:00 · 2019-03-12 01:30:41 -07:00 · 8c99eb5f8b
commit 8c99eb5f8b
parent 74b961829e
3 changed files with 7 additions and 3 deletions
--- a/tensorflow/core/kernels/batch_norm_op.cc
+++ b/tensorflow/core/kernels/batch_norm_op.cc
@@ -127,8 +127,12 @@ class BatchNormGradOp : public OpKernel {
    OP_REQUIRES_OK(context, context->forward_input_or_allocate_output(
                                {2}, 2, var.shape(), &dv));
    Tensor* db = nullptr;
-    OP_REQUIRES_OK(context, context->forward_input_or_allocate_output(
+    if (scale_after_normalization_) {
-                                {3}, 3, mean.shape(), &db));
+      OP_REQUIRES_OK(context, context->allocate_output(3, mean.shape(), &db));
+    } else {
+      OP_REQUIRES_OK(context, context->forward_input_or_allocate_output(
+                                  {3}, 3, mean.shape(), &db));
+    }
    Tensor* dg = nullptr;
    OP_REQUIRES_OK(context, context->allocate_output(4, gamma.shape(), &dg));
--- a/tensorflow/python/BUILD
+++ b/tensorflow/python/BUILD
@@ -3711,6 +3711,7 @@ cuda_py_test(
    ],
    shard_count = 4,
    tags = ["no_windows"],
+    xla_enable_strict_auto_jit = True,
 )
 cuda_py_test(
--- a/tensorflow/python/ops/nn_batchnorm_test.py
+++ b/tensorflow/python/ops/nn_batchnorm_test.py
@@ -206,7 +206,6 @@ class BatchNormalizationTest(test.TestCase):
                                  2)
  @test_util.run_deprecated_v1
-  @test_util.disable_xla("This test never passed for XLA")
  def testBatchNormGradImpl(self):
    x_shape = [7, 5, 4, 6]
    param_shape = [6]