Merge pull request #46410 from kaixih:rnn_update_api_tf2_pr
PiperOrigin-RevId: 352109370
Change-Id: I98bd1fad87b038c4e2e1fd1b5797560400ef5e0a
This commit is contained in: commit 2c4e6e357a
@@ -641,11 +641,7 @@ def standard_gru(inputs, init_h, kernel, recurrent_kernel, bias, mask,
 def gpu_gru(inputs, init_h, kernel, recurrent_kernel, bias, mask, time_major,
             go_backwards, sequence_lengths):
   """GRU with CuDNN implementation which is only available for GPU."""
-  if not time_major and mask is None:
-    inputs = array_ops.transpose(inputs, perm=(1, 0, 2))
-    seq_axis, batch_axis = (0, 1)
-  else:
-    seq_axis, batch_axis = (0, 1) if time_major else (1, 0)
+  seq_axis, batch_axis = (0, 1) if time_major else (1, 0)
   # For init_h, cuDNN expects one more dim of num_layers before or after batch
   # dim for time major or batch major inputs respectively
   init_h = array_ops.expand_dims(init_h, axis=seq_axis)
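Side note on the shape bookkeeping above: the new code no longer transposes batch-major inputs to time-major; it only swaps axis indices. A minimal runnable sketch of that convention, using the public tf API instead of the internal array_ops module, with an invented [8, 5, 16] shape:

import tensorflow as tf

# Batch-major inputs are [batch, time, feature]; time-major would be
# [time, batch, feature]. Only the indices change, never the data layout.
time_major = False
seq_axis, batch_axis = (0, 1) if time_major else (1, 0)

inputs = tf.zeros([8, 5, 16])   # hypothetical [batch, time, feature] input
init_h = tf.zeros([8, 32])      # [batch, units] initial state

# cuDNN expects an extra num_layers dim on the state: before the batch dim
# for time-major inputs, after it for batch-major inputs.
init_h = tf.expand_dims(init_h, axis=seq_axis)
print(seq_axis, batch_axis, init_h.shape)   # 1 0 (8, 1, 32)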
@@ -676,40 +672,35 @@ def gpu_gru(inputs, init_h, kernel, recurrent_kernel, bias, mask, time_major,
 
   if mask is not None:
     sequence_lengths = calculate_sequence_by_mask(mask, time_major)
-
-  if sequence_lengths is not None:
-    if go_backwards:
-      # Three reversals are required. E.g.,
-      # normal input = [1, 2, 3, 0, 0]  # where 0 need to be masked
-      # reversed_input_to_cudnn = [3, 2, 1, 0, 0]
-      # output_from_cudnn = [6, 5, 4, 0, 0]
-      # expected_output = [0, 0, 6, 5 ,4]
-      inputs = array_ops.reverse_sequence_v2(
-          inputs, sequence_lengths, seq_axis=seq_axis, batch_axis=batch_axis)
-    outputs, h, _, _, _ = gen_cudnn_rnn_ops.CudnnRNNV3(
-        input=inputs,
-        input_h=init_h,
-        input_c=0,
-        params=params,
-        is_training=True,
-        rnn_mode='gru',
-        sequence_lengths=sequence_lengths,
-        time_major=time_major)
-    if go_backwards:
-      outputs = array_ops.reverse_sequence_v2(
-          outputs, sequence_lengths, seq_axis=seq_axis, batch_axis=batch_axis)
-      outputs = array_ops.reverse(outputs, axis=[seq_axis])
   else:
-    if go_backwards:
-      # Reverse axis 0 since the input is already convert to time major.
-      inputs = array_ops.reverse(inputs, axis=[0])
-    outputs, h, _, _ = gen_cudnn_rnn_ops.CudnnRNN(
-        input=inputs, input_h=init_h, input_c=0, params=params,
-        is_training=True, rnn_mode='gru')
+    input_shape = math_ops.cast(array_ops.shape(inputs), dtypes.int32)
+    timesteps = input_shape[seq_axis]
+    batches = input_shape[batch_axis]
+    sequence_lengths = array_ops.fill([batches], timesteps)
+
+  if go_backwards:
+    # Three reversals are required. E.g.,
+    # normal input = [1, 2, 3, 0, 0]  # where 0 need to be masked
+    # reversed_input_to_cudnn = [3, 2, 1, 0, 0]
+    # output_from_cudnn = [6, 5, 4, 0, 0]
+    # expected_output = [0, 0, 6, 5 ,4]
+    inputs = array_ops.reverse_sequence_v2(
+        inputs, sequence_lengths, seq_axis=seq_axis, batch_axis=batch_axis)
+  outputs, h, _, _, _ = gen_cudnn_rnn_ops.CudnnRNNV3(
+      input=inputs,
+      input_h=init_h,
+      input_c=0,
+      params=params,
+      is_training=True,
+      rnn_mode='gru',
+      sequence_lengths=sequence_lengths,
+      time_major=time_major)
+  if go_backwards:
+    outputs = array_ops.reverse_sequence_v2(
+        outputs, sequence_lengths, seq_axis=seq_axis, batch_axis=batch_axis)
+    outputs = array_ops.reverse(outputs, axis=[seq_axis])
 
   last_output = outputs[-1]
-  if not time_major and mask is None:
-    outputs = array_ops.transpose(outputs, perm=[1, 0, 2])
   h = array_ops.squeeze(h, axis=seq_axis)
 
   # In the case of variable length input, the cudnn kernel will fill zeros for
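The "three reversals" comment is easiest to follow with concrete numbers. Below is a small self-contained sketch of the same trick, using the public tf.reverse_sequence and tf.reverse ops in place of the internal array_ops wrappers; the tensors are invented to match the comment's example:

import tensorflow as tf

x = tf.constant([[1, 2, 3, 0, 0]])   # one batch-major sequence, 0s are padding
lengths = tf.constant([3])

# 1) Reverse only the valid prefix before the cuDNN call: [3, 2, 1, 0, 0].
x_rev = tf.reverse_sequence(x, lengths, seq_axis=1, batch_axis=0)

# Pretend cuDNN returned [6, 5, 4, 0, 0] for the reversed input.
out = tf.constant([[6, 5, 4, 0, 0]])

# 2) Reverse the valid prefix of the output: [4, 5, 6, 0, 0].
out = tf.reverse_sequence(out, lengths, seq_axis=1, batch_axis=0)
# 3) Reverse the whole time axis so padding ends up in front: [0, 0, 6, 5, 4].
out = tf.reverse(out, axis=[1])
print(out.numpy())                   # [[0 0 6 5 4]]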
@@ -718,8 +709,7 @@ def gpu_gru(inputs, init_h, kernel, recurrent_kernel, bias, mask, time_major,
   # get the final effect output instead just 0s at the last timestep.
   # In order to mimic the default keras behavior, we copy the final h state as
   # the last_output, since it is numerically same as the output.
-  if mask is not None:
-    last_output = h
+  last_output = h
 
   return last_output, outputs, h, _runtime(_RUNTIME_GPU)
 
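Why the copy can now be unconditional: CudnnRNNV3 zero-fills output steps past each example's sequence length, while h already holds the last valid step, so h is the correct last_output in every case. A hedged sketch of the length computation, assuming calculate_sequence_by_mask simply counts the True entries per example (its body is not shown in this diff):

import tensorflow as tf

mask = tf.constant([[True, True, True, False, False],
                    [True, True, False, False, False]])
# Per-example valid lengths along the time axis.
sequence_lengths = tf.reduce_sum(tf.cast(mask, tf.int32), axis=1)
print(sequence_lengths.numpy())   # [3 2]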
@@ -1456,11 +1446,7 @@ def gpu_lstm(inputs, init_h, init_c, kernel, recurrent_kernel, bias, mask,
     runtime: Constant string tensor which indicate real runtime hardware. This
       value is for testing purpose and should not be used by user.
   """
-  if not time_major and mask is None:
-    inputs = array_ops.transpose(inputs, perm=(1, 0, 2))
-    seq_axis, batch_axis = (0, 1)
-  else:
-    seq_axis, batch_axis = (0, 1) if time_major else (1, 0)
+  seq_axis, batch_axis = (0, 1) if time_major else (1, 0)
   # For init_h and init_c, cuDNN expects one more dim of num_layers before or
   # after batch dim for time major or batch major inputs respectively
   init_h = array_ops.expand_dims(init_h, axis=seq_axis)
@@ -1493,43 +1479,35 @@ def gpu_lstm(inputs, init_h, init_c, kernel, recurrent_kernel, bias, mask,
 
   if mask is not None:
     sequence_lengths = calculate_sequence_by_mask(mask, time_major)
-
-  if sequence_lengths is not None:
-    if go_backwards:
-      # Three reversals are required. E.g.,
-      # normal input = [1, 2, 3, 0, 0]  # where 0 need to be masked
-      # reversed_input_to_cudnn = [3, 2, 1, 0, 0]
-      # output_from_cudnn = [6, 5, 4, 0, 0]
-      # expected_output = [0, 0, 6, 5 ,4]
-      inputs = array_ops.reverse_sequence_v2(
-          inputs, sequence_lengths, seq_axis=seq_axis, batch_axis=batch_axis)
-    outputs, h, c, _, _ = gen_cudnn_rnn_ops.CudnnRNNV3(
-        input=inputs,
-        input_h=init_h,
-        input_c=init_c,
-        params=params,
-        is_training=True,
-        rnn_mode='lstm',
-        sequence_lengths=sequence_lengths,
-        time_major=time_major)
-    if go_backwards:
-      outputs = array_ops.reverse_sequence_v2(
-          outputs, sequence_lengths, seq_axis=seq_axis, batch_axis=batch_axis)
-      outputs = array_ops.reverse(outputs, axis=[seq_axis])
   else:
-    # # Fill the array with shape [batch] with value of max timesteps.
-    # sequence_length = array_ops.fill([array_ops.shape(inputs)[1]],
-    #                                  array_ops.shape(inputs)[0])
-    if go_backwards:
-      # Reverse axis 0 since the input is already convert to time major.
-      inputs = array_ops.reverse(inputs, axis=[0])
-    outputs, h, c, _ = gen_cudnn_rnn_ops.CudnnRNN(
-        input=inputs, input_h=init_h, input_c=init_c, params=params,
-        is_training=True, rnn_mode='lstm')
+    input_shape = math_ops.cast(array_ops.shape(inputs), dtypes.int32)
+    timesteps = input_shape[seq_axis]
+    batches = input_shape[batch_axis]
+    sequence_lengths = array_ops.fill([batches], timesteps)
+
+  if go_backwards:
+    # Three reversals are required. E.g.,
+    # normal input = [1, 2, 3, 0, 0]  # where 0 need to be masked
+    # reversed_input_to_cudnn = [3, 2, 1, 0, 0]
+    # output_from_cudnn = [6, 5, 4, 0, 0]
+    # expected_output = [0, 0, 6, 5 ,4]
+    inputs = array_ops.reverse_sequence_v2(
+        inputs, sequence_lengths, seq_axis=seq_axis, batch_axis=batch_axis)
+  outputs, h, c, _, _ = gen_cudnn_rnn_ops.CudnnRNNV3(
+      input=inputs,
+      input_h=init_h,
+      input_c=init_c,
+      params=params,
+      is_training=True,
+      rnn_mode='lstm',
+      sequence_lengths=sequence_lengths,
+      time_major=time_major)
+  if go_backwards:
+    outputs = array_ops.reverse_sequence_v2(
+        outputs, sequence_lengths, seq_axis=seq_axis, batch_axis=batch_axis)
+    outputs = array_ops.reverse(outputs, axis=[seq_axis])
 
   last_output = outputs[-1]
-  if not time_major and mask is None:
-    outputs = array_ops.transpose(outputs, perm=[1, 0, 2])
   h = array_ops.squeeze(h, axis=seq_axis)
   c = array_ops.squeeze(c, axis=seq_axis)
 
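Same pattern in gpu_lstm as in gpu_gru above: the old commented-out fill becomes live code, so every unmasked example gets the full timestep count and CudnnRNNV3 can always be called with explicit lengths. A minimal sketch with the public tf API and an invented batch-major shape:

import tensorflow as tf

inputs = tf.zeros([8, 5, 16])         # hypothetical [batch, time, feature]
seq_axis, batch_axis = 1, 0
shape = tf.shape(inputs)              # int32 shape tensor
timesteps = shape[seq_axis]
batches = shape[batch_axis]
# One full-length entry per example: [5 5 5 5 5 5 5 5].
sequence_lengths = tf.fill([batches], timesteps)
print(sequence_lengths.numpy())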
@@ -1539,8 +1517,7 @@ def gpu_lstm(inputs, init_h, init_c, kernel, recurrent_kernel, bias, mask,
   # get the final effect output instead just 0s at the last timestep.
   # In order to mimic the default keras behavior, we copy the final h state as
   # the last_output, since it is numerically same as the output.
-  if mask is not None:
-    last_output = h
+  last_output = h
   return last_output, outputs, h, c, _runtime(_RUNTIME_GPU)
 