The ftrl optimizer creates large constants when initializing its slot variables. Change it to build the initial value as a tensor instead, reducing peak memory usage when the optimizer is applied to large variables.
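A minimal sketch of the before/after patterns, written against the public tf.compat.v1 API rather than the internal modules this commit touches; the shape and fill value are hypothetical:

import tensorflow.compat.v1 as tf

initial_accumulator_value = 0.1
shape = [25000, 25000]  # ~2.5 GB of float32; a "large variable"

# Before: a dense constant the full size of the variable is materialized
# just to seed the slot, so slot creation alone costs the variable's
# entire footprint in peak memory.
val = tf.constant(initial_accumulator_value, dtype=tf.float32, shape=shape)

# After: only a small ones-times-scalar computation is described here;
# the filled tensor is produced when the slot's initializer actually
# runs, and the temporary can be released once the slot is assigned.
def accum_initializer(shape, dtype=tf.float32, partition_info=None):
  del partition_info  # unused; kept to match the initializer signature
  return tf.ones(shape=shape, dtype=dtype) * initial_accumulator_value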

PiperOrigin-RevId: 358201046
Change-Id: I839a629d3ee98f75fe9069255984807745082532
A. Unique TensorFlower 2021-02-18 09:52:05 -08:00 committed by TensorFlower Gardener
parent bc2f30e9c8
commit 28e6dc5177
2 changed files with 11 additions and 5 deletions

tensorflow/python/training/BUILD

@@ -294,7 +294,8 @@ py_library(
     deps = [
         ":optimizer",
         ":training_ops",
-        "//tensorflow/python:constant_op",
+        "//tensorflow/python:array_ops",
+        "//tensorflow/python:dtypes",
         "//tensorflow/python:framework_ops",
         "//tensorflow/python:math_ops",
         "//tensorflow/python/util:tf_export",

tensorflow/python/training/ftrl.py

@@ -17,8 +17,9 @@ from __future__ import absolute_import
 from __future__ import division
 from __future__ import print_function
 
-from tensorflow.python.framework import constant_op
+from tensorflow.python.framework import dtypes
 from tensorflow.python.framework import ops
+from tensorflow.python.ops import array_ops
 from tensorflow.python.ops import math_ops
 from tensorflow.python.training import optimizer
 from tensorflow.python.training import training_ops
@@ -134,10 +135,14 @@ class FtrlOptimizer(optimizer.Optimizer):
 
   def _create_slots(self, var_list):
     # Create the "accum" and "linear" slots.
+    def _accum_initializer(shape, dtype=dtypes.float32, partition_info=None):
+      del partition_info
+      return array_ops.ones(
+          shape=shape, dtype=dtype) * self._initial_accumulator_value
     for v in var_list:
-      val = constant_op.constant(
-          self._initial_accumulator_value, dtype=v.dtype, shape=v.get_shape())
-      self._get_or_make_slot(v, val, "accum", self._accum_name or self._name)
+      self._get_or_make_slot_with_initializer(
+          v, _accum_initializer, v.shape, v.dtype, "accum",
+          self._accum_name or self._name)
       self._zeros_slot(v, "linear", self._linear_name or self._name)
 
   def _prepare(self):
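For context, a hedged usage sketch assuming TF1 graph mode; the variable shape and hyperparameters are illustrative. minimize() is where _create_slots runs, so it is where the old code paid the constant's memory cost:

import tensorflow.compat.v1 as tf

tf.disable_v2_behavior()

weights = tf.get_variable("weights", shape=[50000, 4096], dtype=tf.float32)
loss = tf.reduce_sum(tf.square(weights))
opt = tf.train.FtrlOptimizer(learning_rate=0.01, initial_accumulator_value=0.1)
# minimize() triggers _create_slots: the "accum" slot is now filled by
# _accum_initializer when variables are initialized, instead of by a
# constant materialized at graph-construction time.
train_op = opt.minimize(loss)

with tf.Session() as sess:
  sess.run(tf.global_variables_initializer())
  sess.run(train_op)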