Splitting out the memory usage tests into their own test file as that was making the test suite for MultiDeviceIterator too big and timing out.

PiperOrigin-RevId: 235242183
2019-02-22 12:53:41 -08:00 · 2019-02-22 12:53:41 -08:00 · 61aced4825
commit 61aced4825
parent eb741cedf3
3 changed files with 123 additions and 71 deletions
--- a/tensorflow/python/data/kernel_tests/BUILD
+++ b/tensorflow/python/data/kernel_tests/BUILD
@ -444,6 +444,21 @@ cuda_py_test(
    ],
 )

+cuda_py_test(
+    name = "memory_cleanup_test",
+    size = "medium",
+    srcs = ["memory_cleanup_test.py"],
+    additional_deps = [
+        ":test_base",
+        "@absl_py//absl/testing:parameterized",
+        "//tensorflow/core:protos_all_py",
+        "//tensorflow/python/data/ops:dataset_ops",
+        "//tensorflow/python/data/ops:multi_device_iterator_ops",
+        "//tensorflow/python:client_testlib",
+        "//tensorflow/python:framework_test_lib",
+    ],
+)
+
 cuda_py_test(
    name = "optional_test",
    size = "small",
--- a/tensorflow/python/data/kernel_tests/memory_cleanup_test.py
+++ b/tensorflow/python/data/kernel_tests/memory_cleanup_test.py
@ -0,0 +1,108 @@
+# Copyright 2018 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Verify that memory usage is minimal in eager mode."""
+
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import time
+import six
+
+from tensorflow.core.protobuf import config_pb2
+from tensorflow.python.data.kernel_tests import test_base
+from tensorflow.python.data.ops import dataset_ops
+from tensorflow.python.data.ops import multi_device_iterator_ops
+from tensorflow.python.eager import context
+from tensorflow.python.framework import ops
+from tensorflow.python.framework import test_util
+from tensorflow.python.platform import test
+from tensorflow.python.platform import tf_logging as logging
+
+
+# memory_profiler might not be available in the OSS version of TensorFlow.
+try:
+  import memory_profiler  # pylint:disable=g-import-not-at-top
+except ImportError:
+  memory_profiler = None
+
+
+@test_util.run_all_in_graph_and_eager_modes
+class MemoryCleanupTest(test_base.DatasetTestBase):
+
+  def assertNotIncreasingMemory(self,
+                                f,
+                                num_iters=100000,
+                                increase_threshold_absolute_mb=10):
+    """Assert memory usage doesn't increase beyond given threshold for f."""
+    with context.eager_mode():
+      # Warm up.
+      f()
+      # Wait for background threads to start up and take over memory.
+      # FIXME: The nature of this test leaves few other options. Maybe there
+      # is a better way to do this.
+      time.sleep(4)
+      initial = memory_profiler.memory_usage(-1)[0]
+      for _ in six.moves.range(num_iters):
+        f()
+      increase = memory_profiler.memory_usage(-1)[0] - initial
+      logging.info("Memory increase observed: %f MB" % increase)
+      assert increase < increase_threshold_absolute_mb, (
+          "Increase is too high. Initial memory usage: %f MB. Increase: %f MB. "
+          "Maximum allowed increase: %f") % (initial, increase,
+                                             increase_threshold_absolute_mb)
+
+  @test_util.run_v1_only("b/121264236")
+  def testEagerMemoryUsageWithReset(self):
+    if not context.executing_eagerly():
+      self.skipTest("Only eager mode test")
+    if memory_profiler is None:
+      self.skipTest("memory_profiler required to run this test")
+
+    dataset = dataset_ops.Dataset.range(10)
+    multi_device_iterator = multi_device_iterator_ops.MultiDeviceIterator(
+        dataset, ["/cpu:1", "/cpu:2"])
+
+    def f():
+      self.evaluate(multi_device_iterator.get_next())
+      multi_device_iterator._eager_reset()
+
+    self.assertNotIncreasingMemory(
+        f, num_iters=100, increase_threshold_absolute_mb=50)
+
+  @test_util.run_v1_only("b/121264236")
+  def testEagerMemoryUsageWithRecreation(self):
+    if not context.executing_eagerly():
+      self.skipTest("Only eager mode test")
+    if memory_profiler is None:
+      self.skipTest("memory_profiler required to run this test")
+
+    dataset = dataset_ops.Dataset.range(10)
+
+    def f():
+      multi_device_iterator = multi_device_iterator_ops.MultiDeviceIterator(
+          dataset, ["/cpu:1", "/cpu:2"])
+      self.evaluate(multi_device_iterator.get_next())
+      del multi_device_iterator
+
+    # TODO(b/123316347): Reduce threshold once bug is fixed.
+    self.assertNotIncreasingMemory(
+        f, num_iters=100, increase_threshold_absolute_mb=500)
+
+
+if __name__ == "__main__":
+  ops.enable_eager_execution(
+      config=config_pb2.ConfigProto(device_count={"CPU": 3, "GPU": 1}))
+  test.main()
--- a/tensorflow/python/data/kernel_tests/multi_device_iterator_test.py
+++ b/tensorflow/python/data/kernel_tests/multi_device_iterator_test.py
@ -18,9 +18,7 @@ from __future__ import absolute_import
 from __future__ import division
 from __future__ import print_function

-import time
 from absl.testing import parameterized
-import six

 from tensorflow.core.protobuf import config_pb2
 from tensorflow.python.data.experimental.ops import optimization
@ -34,44 +32,12 @@ from tensorflow.python.framework import ops
 from tensorflow.python.framework import test_util
 from tensorflow.python.ops import array_ops
 from tensorflow.python.platform import test
-from tensorflow.python.platform import tf_logging as logging
-
-
-# memory_profiler might not be available in the OSS version of TensorFlow.
-try:
-  import memory_profiler  # pylint:disable=g-import-not-at-top
-except ImportError:
-  memory_profiler = None


@test_util.run_all_in_graph_and_eager_modes
 class MultiDeviceIteratorTest(test_base.DatasetTestBase,
                              parameterized.TestCase):

-  def assertNotIncreasingMemory(self,
-                                f,
-                                num_iters=100000,
-                                increase_threshold_absolute_mb=10):
-    """Assert memory usage doesn't increase beyond given threshold for f."""
-
-    with context.eager_mode():
-      # Warm up.
-      f()
-
-      # Wait for background threads to start up and take over memory.
-      # FIXME: The nature of this test leaves few other options. Maybe there
-      # is a better way to do this.
-      time.sleep(4)
-      initial = memory_profiler.memory_usage(-1)[0]
-      for _ in six.moves.range(num_iters):
-        f()
-      increase = memory_profiler.memory_usage(-1)[0] - initial
-      logging.info("Memory increase observed: %f MB" % increase)
-      assert increase < increase_threshold_absolute_mb, (
-          "Increase is too high. Initial memory usage: %f MB. Increase: %f MB. "
-          "Maximum allowed increase: %f") % (initial, increase,
-                                             increase_threshold_absolute_mb)
-
  @parameterized.parameters(0, 1, 42,)
  @test_util.run_v1_only("b/121264236")
  def testInitOnly(self, num_inits):
@ -102,43 +68,6 @@ class MultiDeviceIteratorTest(test_base.DatasetTestBase,
        self.evaluate(elem_on_1)
        self.evaluate(elem_on_2)

-  @test_util.run_v1_only("b/121264236")
-  def testEagerMemoryUsageWithReset(self):
-    if not context.executing_eagerly():
-      self.skipTest("Only eager mode test")
-    if memory_profiler is None:
-      self.skipTest("memory_profiler required to run this test")
-
-    dataset = dataset_ops.Dataset.range(10)
-    multi_device_iterator = multi_device_iterator_ops.MultiDeviceIterator(
-        dataset, ["/cpu:1", "/cpu:2"])
-
-    def f():
-      self.evaluate(multi_device_iterator.get_next())
-      multi_device_iterator._eager_reset()
-
-    self.assertNotIncreasingMemory(
-        f, num_iters=100, increase_threshold_absolute_mb=50)
-
-  @test_util.run_v1_only("b/121264236")
-  def testEagerMemoryUsageWithRecreation(self):
-    if not context.executing_eagerly():
-      self.skipTest("Only eager mode test")
-    if memory_profiler is None:
-      self.skipTest("memory_profiler required to run this test")
-
-    dataset = dataset_ops.Dataset.range(10)
-
-    def f():
-      multi_device_iterator = multi_device_iterator_ops.MultiDeviceIterator(
-          dataset, ["/cpu:1", "/cpu:2"])
-      self.evaluate(multi_device_iterator.get_next())
-      del multi_device_iterator
-
-    # TODO(b/123316347): Reduce threshold once bug is fixed.
-    self.assertNotIncreasingMemory(
-        f, num_iters=100, increase_threshold_absolute_mb=500)
-
  @test_util.run_v1_only("b/121264236")
  def testOneOnSameDevice(self):
    with ops.device("/cpu:0"):