Refactoring for internal use.

PiperOrigin-RevId: 238065622
2019-03-12 11:58:27 -07:00 · 2019-03-12 11:58:27 -07:00 · 92875ced0f
commit 92875ced0f
parent ab9b930f75
5 changed files with 187 additions and 36 deletions
--- a/tensorflow/core/grappler/costs/BUILD
+++ b/tensorflow/core/grappler/costs/BUILD
@ -165,6 +165,7 @@ tf_cc_test(

 cc_library(
    name = "cost_estimator",
+    srcs = ["cost_estimator.cc"],
    hdrs = ["cost_estimator.h"],
    visibility = ["//visibility:public"],
    deps = [
@ -173,6 +174,16 @@ cc_library(
    ],
 )

+tf_cc_test(
+    name = "cost_estimator_test",
+    srcs = ["cost_estimator_test.cc"],  # tests CombineCosts and MultiplyCosts
+    deps = [
+        ":cost_estimator",
+        "//tensorflow/core:test",
+        "//tensorflow/core:test_main",
+    ],
+)
+
 cc_library(
    name = "virtual_placer",
    srcs = ["virtual_placer.cc"],
--- a/tensorflow/core/grappler/costs/cost_estimator.cc
+++ b/tensorflow/core/grappler/costs/cost_estimator.cc
@ -0,0 +1,81 @@
+/* Copyright 2017 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#include "tensorflow/core/grappler/costs/cost_estimator.h"
+
+namespace tensorflow {
+namespace grappler {
+
+Costs CombineCosts(const Costs& left, const Costs& right) {
+  CHECK_NE(left.max_memory, kMemoryUnknown);  // left's memory must be known
+  CHECK_NE(left.max_per_op_buffers, kMemoryUnknown);
+  CHECK_NE(left.max_per_op_streaming, kMemoryUnknown);
+
+  Costs result = left;  // start from left, then fold in right's fields
+  result.execution_time += right.execution_time;
+  result.compute_time += right.compute_time;
+  result.memory_time += right.memory_time;
+  result.intermediate_memory_time += right.intermediate_memory_time;
+  result.intermediate_memory_read_time += right.intermediate_memory_read_time;
+  result.intermediate_memory_write_time += right.intermediate_memory_write_time;
+
+  if (right.max_per_op_buffers != kMemoryUnknown) {  // else keep left's
+    result.max_per_op_buffers =
+        std::max(left.max_per_op_buffers, right.max_per_op_buffers);
+  }
+  if (right.max_per_op_streaming != kMemoryUnknown) {  // else keep left's
+    result.max_per_op_streaming =
+        std::max(left.max_per_op_streaming, right.max_per_op_streaming);
+  }
+
+  result.num_ops_total += right.num_ops_total;
+  if (right.inaccurate) {  // result is inaccurate if either side is
+    result.inaccurate = true;
+  }
+  result.num_ops_with_unknown_shapes += right.num_ops_with_unknown_shapes;
+  if (right.max_memory != kMemoryUnknown) {  // an unknown right adds nothing
+    result.max_memory += right.max_memory;
+  }
+
+  return result;
+}
+
+// Multiplies Costs by a scalar.
+// Like applying CombineCosts "multiplier" times, except that the num_ops
+// fields are not multiplied. A multiplier of 0 yields Costs::ZeroCosts().
+Costs MultiplyCosts(const Costs& costs, int multiplier) {
+  CHECK_GE(multiplier, 0);  // negative multipliers are rejected
+  if (multiplier == 0) {
+    return Costs::ZeroCosts();
+  }
+  if (multiplier == 1) {
+    return costs;
+  }
+
+  Costs result = costs;  // fields not scaled below are copied unchanged
+  result.execution_time *= multiplier;
+  result.compute_time *= multiplier;
+  result.memory_time *= multiplier;
+  result.intermediate_memory_time *= multiplier;
+  result.intermediate_memory_read_time *= multiplier;
+  result.intermediate_memory_write_time *= multiplier;
+  if (result.max_memory != kMemoryUnknown) {  // leave kMemoryUnknown as is
+    result.max_memory *= multiplier;
+  }
+  return result;
+}
+
+}  // end namespace grappler
+}  // end namespace tensorflow
--- a/tensorflow/core/grappler/costs/cost_estimator.h
+++ b/tensorflow/core/grappler/costs/cost_estimator.h
@ -16,9 +16,6 @@ limitations under the License.
 #ifndef TENSORFLOW_CORE_GRAPPLER_COSTS_COST_ESTIMATOR_H_
 #define TENSORFLOW_CORE_GRAPPLER_COSTS_COST_ESTIMATOR_H_

-#include <chrono>
-#include <cmath>
-#include <unordered_map>
 #include "tensorflow/core/lib/core/status.h"
 #include "tensorflow/core/protobuf/config.pb.h"

@ -204,6 +201,12 @@ Costs Costs::ZeroCosts() {
  return costs;
 }

+Costs CombineCosts(const Costs& left, const Costs& right);
+
+// Multiplies Costs by a scalar: like applying CombineCosts "multiplier"
+// times, except that the fields regarding num_ops are not multiplied.
+Costs MultiplyCosts(const Costs& costs, int multiplier);
+
 // Given a GrapperItem and an optimized implementation of the corresponding
 // TensorFlow graph, the CostEstimator attempts to predicts the actual cost of
 // running the graph.
--- a/tensorflow/core/grappler/costs/cost_estimator_test.cc
+++ b/tensorflow/core/grappler/costs/cost_estimator_test.cc
@ -0,0 +1,88 @@
+/* Copyright 2017 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#include "tensorflow/core/grappler/costs/cost_estimator.h"
+
+#include "tensorflow/core/platform/test.h"
+
+namespace tensorflow {
+namespace grappler {
+namespace {
+
+TEST(CostEstimatorTest, CombineCosts) {
+  Costs c = Costs::ZeroCosts();
+  c.execution_time = Costs::NanoSeconds(1);
+  c.compute_time = Costs::NanoSeconds(2);
+  c.memory_time = Costs::NanoSeconds(3);
+  c.intermediate_memory_time = Costs::NanoSeconds(4);
+  c.intermediate_memory_read_time = Costs::NanoSeconds(5);
+  c.intermediate_memory_write_time = Costs::NanoSeconds(6);
+  c.max_memory = 1;
+  c.max_per_op_buffers = 2;
+  c.max_per_op_streaming = 3;
+  c.num_ops_total = 1;
+  c.inaccurate = false;
+  c.num_ops_with_unknown_shapes = 0;
+
+  Costs sum = CombineCosts(c, c);  // combine c with itself
+
+  EXPECT_EQ(sum.execution_time, Costs::NanoSeconds(2));  // times are summed
+  EXPECT_EQ(sum.compute_time, Costs::NanoSeconds(4));
+  EXPECT_EQ(sum.memory_time, Costs::NanoSeconds(6));
+  EXPECT_EQ(sum.intermediate_memory_time, Costs::NanoSeconds(8));
+  EXPECT_EQ(sum.intermediate_memory_read_time, Costs::NanoSeconds(10));
+  EXPECT_EQ(sum.intermediate_memory_write_time, Costs::NanoSeconds(12));
+  EXPECT_EQ(sum.max_memory, 2);  // summed
+  EXPECT_EQ(sum.max_per_op_buffers, 2);  // max of both sides, not a sum
+  EXPECT_EQ(sum.max_per_op_streaming, 3);  // max of both sides, not a sum
+  EXPECT_EQ(sum.num_ops_total, 2);  // op counts are summed
+  EXPECT_FALSE(sum.inaccurate);
+  EXPECT_EQ(sum.num_ops_with_unknown_shapes, 0);
+}
+
+TEST(CostEstimatorTest, MultiplyCosts) {
+  Costs c = Costs::ZeroCosts();
+  c.execution_time = Costs::NanoSeconds(1);
+  c.compute_time = Costs::NanoSeconds(2);
+  c.memory_time = Costs::NanoSeconds(3);
+  c.intermediate_memory_time = Costs::NanoSeconds(4);
+  c.intermediate_memory_read_time = Costs::NanoSeconds(5);
+  c.intermediate_memory_write_time = Costs::NanoSeconds(6);
+  c.max_memory = 1;
+  c.max_per_op_buffers = 2;
+  c.max_per_op_streaming = 3;
+  c.num_ops_total = 1;
+  c.inaccurate = false;
+  c.num_ops_with_unknown_shapes = 0;
+
+  Costs product = MultiplyCosts(c, 10);
+
+  EXPECT_EQ(product.execution_time, Costs::NanoSeconds(10));  // times are x10
+  EXPECT_EQ(product.compute_time, Costs::NanoSeconds(20));
+  EXPECT_EQ(product.memory_time, Costs::NanoSeconds(30));
+  EXPECT_EQ(product.intermediate_memory_time, Costs::NanoSeconds(40));
+  EXPECT_EQ(product.intermediate_memory_read_time, Costs::NanoSeconds(50));
+  EXPECT_EQ(product.intermediate_memory_write_time, Costs::NanoSeconds(60));
+  EXPECT_EQ(product.max_memory, 10);  // scaled by the multiplier
+  EXPECT_EQ(product.max_per_op_buffers, 2);  // not scaled
+  EXPECT_EQ(product.max_per_op_streaming, 3);  // not scaled
+  EXPECT_EQ(product.num_ops_total, 1);  // op counts are not scaled
+  EXPECT_FALSE(product.inaccurate);
+  EXPECT_EQ(product.num_ops_with_unknown_shapes, 0);
+}
+
+}  // namespace
+}  // namespace grappler
+}  // namespace tensorflow
--- a/tensorflow/core/grappler/costs/virtual_scheduler.cc
+++ b/tensorflow/core/grappler/costs/virtual_scheduler.cc
@ -34,41 +34,9 @@ limitations under the License.

 namespace tensorflow {
 namespace grappler {
+
 namespace {

-Costs CombineCosts(const Costs& left, const Costs& right) {
-  CHECK_NE(left.max_memory, kMemoryUnknown);
-  CHECK_NE(left.max_per_op_buffers, kMemoryUnknown);
-  CHECK_NE(left.max_per_op_streaming, kMemoryUnknown);
-
-  Costs result = left;
-  result.execution_time += right.execution_time;
-  result.compute_time += right.compute_time;
-  result.memory_time += right.memory_time;
-  result.intermediate_memory_time += right.intermediate_memory_time;
-
-  result.num_ops_total += right.num_ops_total;
-  if (right.inaccurate) result.inaccurate = true;
-  result.num_ops_with_unknown_shapes += right.num_ops_with_unknown_shapes;
-
-  if (right.max_memory != kMemoryUnknown) {
-    result.max_memory += right.max_memory;
-  }
-  if (right.max_per_op_buffers != kMemoryUnknown) {
-    result.max_per_op_buffers =
-        std::max(left.max_per_op_buffers, right.max_per_op_buffers);
-  }
-  if (right.max_per_op_streaming != kMemoryUnknown) {
-    result.max_per_op_streaming =
-        std::max(left.max_per_op_streaming, right.max_per_op_streaming);
-  }
-  VLOG(4) << "costs execution_time=" << result.execution_time.count()
-          << " max_memory=" << result.max_memory
-          << " max_per_op_buffers=" << result.max_per_op_buffers
-          << " max_per_op_streaming=" << result.max_per_op_streaming;
-  return result;
-}
-
 // Key to the cached _Recv ops map, and its hash and predicate structures.
 struct RecvNodeDescriptor {
  const NodeDef* node;