From 0a4adad2fc253acc60b58675de8422c065787dd7 Mon Sep 17 00:00:00 2001
From: Ken Franko <kfranko@google.com>
Date: Fri, 12 Jun 2020 15:11:18 -0700
Subject: [PATCH] Add tests for automatic outside compilation on TPUs with
 Keras models.

PiperOrigin-RevId: 316186023
Change-Id: Ib223b500ee0eb70e24d53171f34ca0acb6821579
---
 tensorflow/python/keras/tests/BUILD           |  40 ++-
 .../automatic_outside_compilation_test.py     | 277 ++++++++++++++++++
 2 files changed, 316 insertions(+), 1 deletion(-)
 create mode 100644 tensorflow/python/keras/tests/automatic_outside_compilation_test.py

diff --git a/tensorflow/python/keras/tests/BUILD b/tensorflow/python/keras/tests/BUILD
index 57f9e1d3df2..d270e6f638c 100644
--- a/tensorflow/python/keras/tests/BUILD
+++ b/tensorflow/python/keras/tests/BUILD
@@ -1,9 +1,12 @@
 # Description:
 #   Contains Keras test utils and integration tests.
 
-load("//tensorflow:tensorflow.bzl", "tf_py_test")
 load("//tensorflow:tensorflow.bzl", "cuda_py_test")
 
+# buildifier: disable=same-origin-load
+load("//tensorflow:tensorflow.bzl", "tf_py_test")
+load("//tensorflow/python/tpu:tpu.bzl", "tpu_py_test")
+
 package(
     default_visibility = [
         "//tensorflow/tools/pip_package:__pkg__",
@@ -42,6 +45,41 @@ tf_py_test(
     ],
 )
 
+tpu_py_test(
+    name = "automatic_outside_compilation_test",
+    srcs = [
+        "automatic_outside_compilation_test.py",
+    ],
+    disable_experimental = True,
+    python_version = "PY3",
+    tags = ["no_oss"],
+    deps = [
+        "//tensorflow/python:array_ops",
+        "//tensorflow/python:client_testlib",
+        "//tensorflow/python:config",
+        "//tensorflow/python:constant_op",
+        "//tensorflow/python:control_flow_ops",
+        "//tensorflow/python:dtypes",
+        "//tensorflow/python:errors",
+        "//tensorflow/python:framework_ops",
+        "//tensorflow/python:framework_test_lib",
+        "//tensorflow/python:function",
+        "//tensorflow/python:math_ops",
+        "//tensorflow/python:platform",
+        "//tensorflow/python:random_ops",
+        "//tensorflow/python:string_ops",
+        "//tensorflow/python:summary",
+        "//tensorflow/python:summary_ops_v2",
+        "//tensorflow/python:training_lib",
+        "//tensorflow/python:training_util",
+        "//tensorflow/python:variables",
+        "//tensorflow/python/eager:test",
+        "//tensorflow/python/keras",
+        "//tensorflow/python/keras/distribute:distribute_strategy_test_lib",
+        "//tensorflow/python/ops/losses",
+    ],
+)
+
 tf_py_test(
     name = "convert_to_constants_test",
     srcs = ["convert_to_constants_test.py"],
diff --git a/tensorflow/python/keras/tests/automatic_outside_compilation_test.py b/tensorflow/python/keras/tests/automatic_outside_compilation_test.py
new file mode 100644
index 00000000000..76e5ca98af9
--- /dev/null
+++ b/tensorflow/python/keras/tests/automatic_outside_compilation_test.py
@@ -0,0 +1,277 @@
+# Copyright 2020 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Tests for automatic outside compilation for TF 2.0/Keras."""
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import os
+
+import numpy as np
+
+from tensorflow.python.compat import v2_compat
+from tensorflow.python.data.ops import dataset_ops
+from tensorflow.python.distribute import tpu_strategy as tpu_strategy_lib
+from tensorflow.python.distribute.cluster_resolver import tpu_cluster_resolver
+from tensorflow.python.eager import context
+from tensorflow.python.eager import def_function
+from tensorflow.python.eager import remote
+from tensorflow.python.eager import test
+from tensorflow.python.keras import callbacks
+from tensorflow.python.keras import initializers
+from tensorflow.python.keras.distribute import distribute_strategy_test
+from tensorflow.python.keras.engine import base_layer
+from tensorflow.python.keras.engine import sequential as sequential_model_lib
+from tensorflow.python.keras.engine import training
+from tensorflow.python.keras.layers import convolutional as conv_layer_lib
+from tensorflow.python.keras.layers import core as layer_lib
+from tensorflow.python.keras.layers import pooling as pool_layer_lib
+from tensorflow.python.lib.io import file_io
+from tensorflow.python.ops import math_ops
+from tensorflow.python.ops import summary_ops_v2
+from tensorflow.python.platform import flags
+from tensorflow.python.summary import summary_iterator
+from tensorflow.python.tpu import tpu_strategy_util
+
+NUM_CLASSES = 4
+
+FLAGS = flags.FLAGS
+flags.DEFINE_string('tpu', '', 'Name of TPU to connect to.')
+flags.DEFINE_string('project', None, 'Name of GCP project with TPU.')
+flags.DEFINE_string('zone', None, 'Name of GCP zone with TPU.')
+
+
+def get_tpu_cluster_resolver():
+  resolver = tpu_cluster_resolver.TPUClusterResolver(
+      tpu=FLAGS.tpu,
+      zone=FLAGS.zone,
+      project=FLAGS.project,
+  )
+  return resolver
+
+
+def get_tpu_strategy():
+  resolver = get_tpu_cluster_resolver()
+  remote.connect_to_cluster(resolver)
+  tpu_strategy_util.initialize_tpu_system(resolver)
+  return tpu_strategy_lib.TPUStrategy(resolver)
+
+
+class LayerForScalarSummary(base_layer.Layer):
+  """A pass-through layer that only records scalar values to summary."""
+
+  def call(self, x):
+    summary_ops_v2.scalar('custom_scalar_summary', math_ops.reduce_sum(x))
+    return x
+
+
+class LayerForImageSummary(base_layer.Layer):
+  """A pass-through layer that only records image values to summary."""
+
+  def call(self, x):
+    summary_ops_v2.image('custom_image_summary', x)
+    return x
+
+
+class LayerForHistogramSummary(base_layer.Layer):
+  """A pass-through layer that records histogram values to summary."""
+
+  def call(self, x):
+    summary_ops_v2.histogram('custom_histogram_summary', x)
+    return x
+
+
+class CustomModel(training.Model):
+  """Custom model with summary ops in model call definition."""
+
+  def __init__(self, name=None):
+    super(CustomModel, self).__init__()
+    self._my_layers = [
+        layer_lib.Dense(
+            4096,
+            name='dense1',
+            kernel_initializer=initializers.glorot_normal(seed=0),
+            use_bias=False),
+        layer_lib.Dense(
+            4,
+            name='dense2',
+            kernel_initializer=initializers.glorot_normal(seed=0),
+            use_bias=False),
+    ]
+    self.histogram_summary_layer = LayerForHistogramSummary()
+    self.scalar_summary_layer = LayerForScalarSummary()
+
+  def call(self, x):
+    for layer in self._my_layers:
+      x = layer(x)
+    x = self.scalar_summary_layer(x)
+    return self.histogram_summary_layer(x)
+
+
+def get_image_dataset():
+  inputs = np.zeros((10, 28, 28, 3), dtype=np.float32)
+  targets = np.zeros((10, NUM_CLASSES), dtype=np.float32)
+  dataset = dataset_ops.Dataset.from_tensor_slices((inputs, targets))
+  dataset = dataset.repeat(100)
+  dataset = dataset.batch(10, drop_remainder=True)
+  return dataset
+
+
+def mnist_model(input_shape):
+  """Creates a MNIST model."""
+  model = sequential_model_lib.Sequential()
+
+  # Adding custom pass-through layer to visualize input images.
+  model.add(LayerForImageSummary())
+
+  model.add(
+      conv_layer_lib.Conv2D(
+          32, kernel_size=(3, 3), activation='relu', input_shape=input_shape))
+  model.add(conv_layer_lib.Conv2D(64, (3, 3), activation='relu'))
+  model.add(pool_layer_lib.MaxPooling2D(pool_size=(2, 2)))
+  model.add(layer_lib.Dropout(0.25))
+  model.add(layer_lib.Flatten())
+  model.add(layer_lib.Dense(128, activation='relu'))
+  model.add(layer_lib.Dropout(0.5))
+  model.add(layer_lib.Dense(NUM_CLASSES, activation='softmax'))
+
+  # Adding custom pass-through layer for summary recording.
+  model.add(LayerForHistogramSummary())
+  return model
+
+
+class AutoOutsideCompilationWithKerasTest(test.TestCase):
+
+  def setUp(self):
+    super(AutoOutsideCompilationWithKerasTest, self).setUp()
+    v2_compat.enable_v2_behavior()
+    context.context().soft_device_placement = True
+    self.summary_dir = self.get_temp_dir()
+
+  def testV2SummaryWithImageModel(self):
+    strategy = get_tpu_strategy()
+
+    with strategy.scope():
+      model = mnist_model((28, 28, 3))
+      model.compile('sgd', 'mse')
+
+      dataset = get_image_dataset()
+      tensorboard_callback = callbacks.TensorBoard(
+          self.summary_dir, update_freq=2)
+      model.fit(
+          dataset,
+          steps_per_epoch=10,
+          epochs=1,
+          callbacks=[tensorboard_callback])
+
+      event_files = file_io.get_matching_files_v2(
+          os.path.join(self.summary_dir, 'train', 'event*'))
+      events_count_dictionary = {
+          ('sequential/layer_for_histogram_summary'
+           '/custom_histogram_summary'): 0,
+          'sequential/layer_for_image_summary/custom_image_summary/image/0': 0
+      }
+
+      for event_file in event_files:
+        for e in summary_iterator.summary_iterator(event_file):
+          for v in e.summary.value:
+            if v.tag in events_count_dictionary:
+              events_count_dictionary[v.tag] += 1
+
+      # Since total of 10 steps are ran and summary ops should be invoked
+      # every 2 batches, we should see total of 5 event logs.
+      self.assertEqual(
+          events_count_dictionary[
+              ('sequential/layer_for_histogram_summary/'
+               'custom_histogram_summary')],
+          5)
+      self.assertEqual(
+          events_count_dictionary[
+              ('sequential/layer_for_image_summary/'
+               'custom_image_summary/image/0')],
+          5)
+
+  def testV2SummaryWithKerasFit(self):
+    strategy = get_tpu_strategy()
+
+    with strategy.scope():
+      model = CustomModel()
+      model.compile('sgd', 'mse')
+
+      dataset = distribute_strategy_test.get_dataset(strategy)
+      tensorboard_callback = callbacks.TensorBoard(
+          self.summary_dir, update_freq=2)
+      model.fit(
+          dataset,
+          steps_per_epoch=10,
+          epochs=1,
+          callbacks=[tensorboard_callback])
+
+      event_files = file_io.get_matching_files_v2(
+          os.path.join(self.summary_dir, 'train', 'event*'))
+      events_count_dictionary = {
+          'custom_model/layer_for_scalar_summary/custom_scalar_summary': 0,
+          'custom_model/layer_for_histogram_summary/custom_histogram_summary': 0
+      }
+
+      for event_file in event_files:
+        for e in summary_iterator.summary_iterator(event_file):
+          for v in e.summary.value:
+            if v.tag in events_count_dictionary:
+              events_count_dictionary[v.tag] += 1
+
+      # Since total of 10 steps are ran and summary ops should be invoked
+      # every 2 batches, we should see total of 5 event logs.
+      self.assertEqual(
+          events_count_dictionary[('custom_model/layer_for_histogram_summary/'
+                                   'custom_histogram_summary')],
+          5)
+      self.assertEqual(
+          events_count_dictionary[
+              'custom_model/layer_for_scalar_summary/custom_scalar_summary'], 5)
+
+  def testSummaryWithCustomTrainingLoop(self):
+    strategy = get_tpu_strategy()
+
+    with strategy.scope():
+      model = distribute_strategy_test.get_model()
+      model.compile('sgd', 'mse')
+      writer = summary_ops_v2.create_file_writer_v2(self.summary_dir)
+
+      @def_function.function
+      def custom_function(dataset):
+
+        def _custom_step(features, labels):
+          del labels
+          logits = model(features)
+          with summary_ops_v2.always_record_summaries(), writer.as_default():
+            summary_ops_v2.scalar(
+                'logits', logits, step=model.optimizer.iterations)
+          return logits
+
+        iterator = iter(dataset)
+        output = strategy.unwrap(
+            strategy.run(_custom_step, args=(next(iterator))))
+        return output
+
+      dataset = strategy.experimental_distribute_dataset(
+          distribute_strategy_test.get_dataset(strategy))
+
+      custom_function(dataset)
+
+
+if __name__ == '__main__':
+  test.main()