diff --git a/.mention-bot b/.mention-bot new file mode 100644 index 00000000000..6210b1f4d53 --- /dev/null +++ b/.mention-bot @@ -0,0 +1,11 @@ +{ + "maxReviewers": 2, + "numFilesToCheck": 10, // Number of files to check against, default is 5 + "userBlacklist": ["tensorflower-gardener"], // users in this list will never be mentioned by mention-bot + "requiredOrgs": ["tensorflow"], // mention-bot will only mention user who are a member of one of these organizations + "skipAlreadyAssignedPR": true, // mention-bot will ignore already assigned PR's + "skipAlreadyMentionedPR": true, // mention-bot will ignore if there is already existing an exact mention + "skipTitle": "Branch", // mention-bot will ignore PR that includes text in the title, + "delayed": true, // mention-bot will wait to comment until specified time in `delayedUntil` value + "delayedUntil": "10m", +} diff --git a/README.md b/README.md index 1372f209b93..0ed9e78fc98 100644 --- a/README.md +++ b/README.md @@ -33,10 +33,10 @@ and discussion.** People who are a little more adventurous can also try our nightly binaries: -* Linux CPU-only: [Python 2](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=cpu-slave/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc1-cp27-none-linux_x86_64.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=cpu-slave)) / [Python 3.4](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=cpu-slave/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc1-cp34-cp34m-linux_x86_64.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=cpu-slave/)) / [Python 3.5](https://ci.tensorflow.org/view/Nightly/job/nightly-python35-linux-cpu/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc1-cp35-cp35m-linux_x86_64.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-python35-linux-cpu/)) -* Linux GPU: [Python 2](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-linux-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=gpu-linux/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc1-cp27-none-linux_x86_64.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-linux-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=gpu-linux/)) / [Python 3.4](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-linux-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=gpu-linux/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc1-cp34-cp34m-linux_x86_64.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-linux-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=gpu-linux/)) / [Python 3.5](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-linux-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3.5,label=gpu-linux/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc1-cp35-cp35m-linux_x86_64.whl) ([build 
history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-linux-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3.5,label=gpu-linux/)) -* Mac CPU-only: [Python 2](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=mac1-slave/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc1-py2-none-any.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=mac1-slave/)) / [Python 3](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=mac1-slave/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc1-py3-none-any.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=mac1-slave/)) -* Mac GPU: [Python 2](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-mac-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=gpu-mac/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc1-py2-none-any.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-mac-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=gpu-mac/)) / [Python 3](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-mac-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=gpu-mac/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc1-py3-none-any.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-mac-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=gpu-mac/)) +* Linux CPU-only: [Python 2](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=cpu-slave/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc2-cp27-none-linux_x86_64.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=cpu-slave)) / [Python 3.4](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=cpu-slave/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc2-cp34-cp34m-linux_x86_64.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=cpu-slave/)) / [Python 3.5](https://ci.tensorflow.org/view/Nightly/job/nightly-python35-linux-cpu/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc2-cp35-cp35m-linux_x86_64.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-python35-linux-cpu/)) +* Linux GPU: [Python 2](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-linux-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=gpu-linux/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc2-cp27-none-linux_x86_64.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-linux-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=gpu-linux/)) / [Python 
3.4](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-linux-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=gpu-linux/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc2-cp34-cp34m-linux_x86_64.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-linux-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=gpu-linux/)) / [Python 3.5](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-linux-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3.5,label=gpu-linux/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc2-cp35-cp35m-linux_x86_64.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-linux-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3.5,label=gpu-linux/)) +* Mac CPU-only: [Python 2](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=mac1-slave/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc2-py2-none-any.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=mac1-slave/)) / [Python 3](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=mac1-slave/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc2-py3-none-any.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-cpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=mac1-slave/)) +* Mac GPU: [Python 2](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-mac-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=gpu-mac/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc2-py2-none-any.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-mac-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=gpu-mac/)) / [Python 3](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-mac-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=gpu-mac/lastSuccessfulBuild/artifact/pip_test/whl/tensorflow-0.11.0rc2-py3-none-any.whl) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-mac-gpu/TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=PIP,TF_BUILD_PYTHON_VERSION=PYTHON3,label=gpu-mac/)) * [Android](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-android/TF_BUILD_CONTAINER_TYPE=ANDROID,TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=NO_PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=android-slave/lastSuccessfulBuild/artifact/bazel-out/local_linux/bin/tensorflow/examples/android/tensorflow_demo.apk) ([build history](https://ci.tensorflow.org/view/Nightly/job/nightly-matrix-android/TF_BUILD_CONTAINER_TYPE=ANDROID,TF_BUILD_IS_OPT=OPT,TF_BUILD_IS_PIP=NO_PIP,TF_BUILD_PYTHON_VERSION=PYTHON2,label=android-slave/)) #### *Try your first TensorFlow program* diff --git a/RELEASE.md b/RELEASE.md index 7d0a68654cf..af256fae93f 100644 --- a/RELEASE.md +++ b/RELEASE.md @@ -10,6 +10,7 @@ BUS_ANY was used. ## Major Features and Improvements +* CUDA 8 support. * cuDNN 5 support. * HDFS Support. * Adds Fused LSTM support via cuDNN 5 in `tensorflow/contrib/cudnn_rnn`. 
diff --git a/WORKSPACE b/WORKSPACE index eee6c603144..f96dbef86e6 100644 --- a/WORKSPACE +++ b/WORKSPACE @@ -153,8 +153,8 @@ new_http_archive( new_http_archive( name = "iron_iconset_svg", build_file = "bower.BUILD", - url = "https://github.com/polymerelements/iron-iconset-svg/archive/v1.0.10.tar.gz", - strip_prefix = "iron-iconset-svg-1.0.10", + url = "https://github.com/polymerelements/iron-iconset-svg/archive/v1.1.0.tar.gz", + strip_prefix = "iron-iconset-svg-1.1.0", ) new_http_archive( @@ -188,8 +188,8 @@ new_http_archive( new_http_archive( name = "iron_overlay_behavior", build_file = "bower.BUILD", - url = "https://github.com/polymerelements/iron-overlay-behavior/archive/v1.9.0.tar.gz", - strip_prefix = "iron-overlay-behavior-1.9.0", + url = "https://github.com/polymerelements/iron-overlay-behavior/archive/v1.10.1.tar.gz", + strip_prefix = "iron-overlay-behavior-1.10.1", ) new_http_archive( @@ -206,6 +206,13 @@ new_http_archive( strip_prefix = "iron-resizable-behavior-1.0.3", ) +new_http_archive( + name = "iron_scroll_target_behavior", + build_file = "bower.BUILD", + url = "https://github.com/polymerelements/iron-scroll-target-behavior/archive/v1.0.3.tar.gz", + strip_prefix = "iron-scroll-target-behavior-1.0.3", +) + new_http_archive( name = "iron_selector", build_file = "bower.BUILD", @@ -291,8 +298,8 @@ new_http_archive( new_http_archive( name = "paper_icon_button", build_file = "bower.BUILD", - url = "https://github.com/polymerelements/paper-icon-button/archive/v1.1.2.tar.gz", - strip_prefix = "paper-icon-button-1.1.2", + url = "https://github.com/polymerelements/paper-icon-button/archive/v1.1.3.tar.gz", + strip_prefix = "paper-icon-button-1.1.3", ) new_http_archive( diff --git a/bower.BUILD b/bower.BUILD index 9d961529d10..e8401f88f45 100644 --- a/bower.BUILD +++ b/bower.BUILD @@ -209,6 +209,7 @@ filegroup( name = "iron_overlay_behavior", srcs = [ "index.html", + "iron-focusables-helper.html", "iron-overlay-backdrop.html", "iron-overlay-behavior.html", "iron-overlay-manager.html", @@ -232,6 +233,14 @@ filegroup( ], ) +filegroup( + name = "iron_scroll_target_behavior", + srcs = [ + "index.html", + "iron-scroll-target-behavior.html", + ], +) + filegroup( name = "iron_selector", srcs = [ diff --git a/eigen.BUILD b/eigen.BUILD index 8a699f6aa84..8ce28ac0766 100644 --- a/eigen.BUILD +++ b/eigen.BUILD @@ -62,8 +62,6 @@ cc_library( # This define (mostly) guarantees we don't link any problematic # code. We use it, but we do not rely on it, as evidenced above. "EIGEN_MPL2_ONLY", - # TODO(jart): Use EIGEN_USE_NONBLOCKING_THREAD_POOL but first add an - # eigen_initialize.cc file and alwayslink=1. 
    ],
    includes = ["."],
    visibility = ["//visibility:public"],
diff --git a/tensorflow/BUILD b/tensorflow/BUILD
index 5b9517a0e55..7cee39046ef 100644
--- a/tensorflow/BUILD
+++ b/tensorflow/BUILD
@@ -105,6 +105,7 @@ filegroup(
         "//tensorflow/contrib/framework:all_files",
         "//tensorflow/contrib/graph_editor:all_files",
         "//tensorflow/contrib/grid_rnn:all_files",
+        "//tensorflow/contrib/integrate:all_files",
         "//tensorflow/contrib/layers:all_files",
         "//tensorflow/contrib/layers/kernels:all_files",
         "//tensorflow/contrib/learn:all_files",
@@ -148,7 +149,6 @@ filegroup(
         "//tensorflow/examples/image_retraining:all_files",
         "//tensorflow/examples/label_image:all_files",
         "//tensorflow/examples/learn:all_files",
-        "//tensorflow/examples/skflow:all_files",
         "//tensorflow/examples/tutorials/estimators:all_files",
         "//tensorflow/examples/tutorials/mnist:all_files",
         "//tensorflow/examples/tutorials/word2vec:all_files",
diff --git a/tensorflow/cc/BUILD b/tensorflow/cc/BUILD
index c7c54240ed0..39d519a707c 100644
--- a/tensorflow/cc/BUILD
+++ b/tensorflow/cc/BUILD
@@ -264,6 +264,36 @@ tf_cc_test(
     ],
 )
 
+cc_library(
+    name = "nn_grad",
+    srcs = ["gradients/nn_grad.cc"],
+    deps = [
+        ":cc_ops",
+        ":grad_op_registry",
+        ":ops",
+        ":scope",
+        "//tensorflow/core:core_cpu",
+        "//tensorflow/core:framework",
+    ],
+)
+
+tf_cc_test(
+    name = "gradients_nn_grad_test",
+    srcs = ["gradients/nn_grad_test.cc"],
+    deps = [
+        ":cc_ops",
+        ":grad_op_registry",
+        ":grad_testutil",
+        ":gradient_checker",
+        ":nn_grad",
+        ":testutil",
+        "//tensorflow/core:lib_internal",
+        "//tensorflow/core:test",
+        "//tensorflow/core:test_main",
+        "//tensorflow/core:testlib",
+    ],
+)
+
 tf_gen_op_wrappers_cc(
     name = "cc_ops",
     op_lib_names = [
@@ -411,6 +441,7 @@ cc_library(
     srcs = ["training/queue_runner.cc"],
     hdrs = ["training/queue_runner.h"],
     deps = [
+        ":coordinator",
        "//tensorflow/core:core_cpu",
        "//tensorflow/core:framework",
        "//tensorflow/core:lib",
@@ -425,6 +456,7 @@ tf_cc_test(
     name = "queue_runner_test",
     srcs = ["training/queue_runner_test.cc"],
     deps = [
+        ":coordinator",
        ":cc_ops",
        ":queue_runner",
        ":scope",
@@ -439,3 +471,37 @@ tf_cc_test(
         "//tensorflow/core:testlib",
     ],
 )
+
+cc_library(
+    name = "coordinator",
+    srcs = ["training/coordinator.cc"],
+    hdrs = ["training/coordinator.h"],
+    deps = [
+        "//tensorflow/core:core_cpu",
+        "//tensorflow/core:framework",
+        "//tensorflow/core:lib",
+        "//tensorflow/core:lib_internal",
+        "//tensorflow/core:protos_all_cc",
+        "//tensorflow/core:tensorflow",
+    ],
+)
+
+tf_cc_test(
+    name = "coordinator_test",
+    srcs = ["training/coordinator_test.cc"],
+    deps = [
+        ":cc_ops",
+        ":coordinator",
+        ":queue_runner",
+        ":scope",
+        "//tensorflow/core:core_cpu",
+        "//tensorflow/core:framework",
+        "//tensorflow/core:lib",
+        "//tensorflow/core:lib_internal",
+        "//tensorflow/core:protos_all_cc",
+        "//tensorflow/core:tensorflow",
+        "//tensorflow/core:test",
+        "//tensorflow/core:test_main",
+        "//tensorflow/core:testlib",
+    ],
+)
diff --git a/tensorflow/cc/framework/gradient_checker.cc b/tensorflow/cc/framework/gradient_checker.cc
index a729bdd24d3..57b955454e8 100644
--- a/tensorflow/cc/framework/gradient_checker.cc
+++ b/tensorflow/cc/framework/gradient_checker.cc
@@ -110,20 +110,15 @@ Status ComputeNumericJacobianTranspose(const Scope& scope, const ops::Output& x,
   return Status::OK();
 }
 
-}  // namespace
-
 template <typename T>
-Status ComputeGradientError(const Scope& scope, const ops::Output& x,
-                            const TensorShape& x_shape, const ops::Output& y,
-                            const TensorShape& y_shape, T* max_error) {
+Status ComputeGradientErrorInternal(const Scope& scope, const ops::Output& x,
+                                    const TensorShape& x_shape,
+                                    const ops::Output& y,
+                                    const TensorShape& y_shape, Tensor* x_data,
+                                    T* max_error) {
   const int64 x_size = x_shape.num_elements();
   const int64 y_size = y_shape.num_elements();
 
-  // Initialize 'x_data' to random values.
-  Tensor x_data(x.type(), x_shape);
-  auto x_data_flat = x_data.flat<T>();
-  x_data_flat.setRandom();
-
   // Initialize theoretical Jacobian to zeros.
   Tensor jacobian_t(x.type(), {x_size, y_size});
   auto jacobian_t_flat = jacobian_t.flat<T>();
@@ -131,7 +126,7 @@ Status ComputeGradientError(const Scope& scope, const ops::Output& x,
 
   // Compute theoretical Jacobian.
   TF_RETURN_IF_ERROR(ComputeTheoreticalJacobianTranspose<T>(
-      scope, x, x_shape, x_data, y, y_shape, &jacobian_t));
+      scope, x, x_shape, *x_data, y, y_shape, &jacobian_t));
 
   // Initialize numeric Jacobian to zeros.
   Tensor jacobian_n(x.type(), {x_size, y_size});
@@ -140,7 +135,7 @@ Status ComputeGradientError(const Scope& scope, const ops::Output& x,
 
   // Compute numeric Jacobian.
   TF_RETURN_IF_ERROR(ComputeNumericJacobianTranspose<T>(
-      scope, x, x_shape, y, y_shape, 1e-3, &x_data, &jacobian_n));
+      scope, x, x_shape, y, y_shape, 1e-3, x_data, &jacobian_n));
 
   // Compute the maximum error between theoretical and numeric Jacobians.
   *max_error = 0.0;
@@ -154,10 +149,39 @@ Status ComputeGradientError(const Scope& scope, const ops::Output& x,
   return Status::OK();
 }
 
+}  // namespace
+
+template <typename T>
+Status ComputeGradientError(const Scope& scope, const ops::Output& x,
+                            const TensorShape& x_shape, const ops::Output& y,
+                            const TensorShape& y_shape, T* max_error) {
+  // Initialize 'x_data' to random values.
+  Tensor x_data(x.type(), x_shape);
+  auto x_data_flat = x_data.flat<T>();
+  x_data_flat.setRandom();
+  // Compute gradient error.
+  return ComputeGradientErrorInternal(scope, x, x_shape, y, y_shape, &x_data,
+                                      max_error);
+}
+
+template <typename T>
+Status ComputeGradientError(const Scope& scope, const ops::Output& x,
+                            const Tensor& x_init_value, const ops::Output& y,
+                            const TensorShape& y_shape, T* max_error) {
+  // Initialize 'x_data' from 'x_init_value'.
+  Tensor x_data(x_init_value);
+  // Compute gradient error.
+  return ComputeGradientErrorInternal(scope, x, x_data.shape(), y, y_shape,
+                                      &x_data, max_error);
+}
+
 #define INSTANTIATE_GRAD_ERR_TYPE(T) \
   template Status ComputeGradientError<T>( \
       const Scope& scope, const ops::Output& x, const TensorShape& x_shape, \
-      const ops::Output& y, const TensorShape& y_shape, T* max_error)
+      const ops::Output& y, const TensorShape& y_shape, T* max_error); \
+  template Status ComputeGradientError<T>( \
+      const Scope& scope, const ops::Output& x, const Tensor& x_init_value, \
+      const ops::Output& y, const TensorShape& y_shape, T* max_error);
 
 INSTANTIATE_GRAD_ERR_TYPE(float);
 INSTANTIATE_GRAD_ERR_TYPE(double);
diff --git a/tensorflow/cc/framework/gradient_checker.h b/tensorflow/cc/framework/gradient_checker.h
index 57e2154b68a..80876afe5c7 100644
--- a/tensorflow/cc/framework/gradient_checker.h
+++ b/tensorflow/cc/framework/gradient_checker.h
@@ -30,6 +30,12 @@ Status ComputeGradientError(const Scope& scope, const ops::Output& x,
                             const TensorShape& x_shape, const ops::Output& y,
                             const TensorShape& y_shape, T* max_error);
 
+// Overload of ComputeGradientError which takes an initial value for 'x'.
+template <typename T>
+Status ComputeGradientError(const Scope& scope, const ops::Output& x,
+                            const Tensor& x_init_value, const ops::Output& y,
+                            const TensorShape& y_shape, T* max_error);
+
 }  // namespace tensorflow
 
 #endif  // THIRD_PARTY_TENSORFLOW_CC_FRAMEWORK_GRADIENT_CHECKER_H_
diff --git a/tensorflow/cc/gradients/nn_grad.cc b/tensorflow/cc/gradients/nn_grad.cc
new file mode 100644
index 00000000000..657585e36fc
--- /dev/null
+++ b/tensorflow/cc/gradients/nn_grad.cc
@@ -0,0 +1,77 @@
+/* Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#include "tensorflow/cc/ops/nn_ops.h"
+#include "tensorflow/cc/ops/standard_ops.h"
+
+#include "tensorflow/cc/framework/grad_op_registry.h"
+
+namespace tensorflow {
+namespace ops {
+namespace {
+
+Status SoftmaxGrad(const Scope& scope, const Operation& op,
+                   const std::vector<Output>& grad_inputs,
+                   std::vector<Output>* grad_outputs) {
+  // Softmax gradient function.
+  // p = softmax(x) maps from [batch, n] to [batch, m]
+  // dp/dx = [dp0/dx0   ... dp0/dxn-1  ]
+  //         [  ...           ...      ]
+  //         [dpm-1/dx0 ... dpm-1/dxn-1]
+  // dL/dx = dp/dx * dL/dy
+  //
+  // Using alternative formula:
+  // dL/dx = dL/dy * y - sum(dL/dy * y) * y
+  //       = (dL/dy - sum(dL/dy * y)) * y
+  auto y = op.output(0);
+  auto dyy = Mul(scope, grad_inputs[0], y);
+  auto sum = Reshape(scope, Sum(scope, dyy, {1}), {-1, 1});
+  auto sub = Sub(scope, grad_inputs[0], sum);
+  auto dx = Mul(scope, sub, y);
+  grad_outputs->push_back(dx);
+  return scope.status();
+}
+REGISTER_GRADIENT_OP("Softmax", SoftmaxGrad);
+
+Status ReluGradHelper(const Scope& scope, const Operation& op,
+                      const std::vector<Output>& grad_inputs,
+                      std::vector<Output>* grad_outputs) {
+  auto dx = ReluGrad(scope, grad_inputs[0], op.input(0));
+  grad_outputs->push_back(dx);
+  return scope.status();
+}
+REGISTER_GRADIENT_OP("Relu", ReluGradHelper);
+
+Status Relu6GradHelper(const Scope& scope, const Operation& op,
+                       const std::vector<Output>& grad_inputs,
+                       std::vector<Output>* grad_outputs) {
+  auto dx = Relu6Grad(scope, grad_inputs[0], op.input(0));
+  grad_outputs->push_back(dx);
+  return scope.status();
+}
+REGISTER_GRADIENT_OP("Relu6", Relu6GradHelper);
+
+Status EluGradHelper(const Scope& scope, const Operation& op,
+                     const std::vector<Output>& grad_inputs,
+                     std::vector<Output>* grad_outputs) {
+  auto dx = EluGrad(scope, grad_inputs[0], op.output(0));
+  grad_outputs->push_back(dx);
+  return scope.status();
+}
+REGISTER_GRADIENT_OP("Elu", EluGradHelper);
+
+}  // anonymous namespace
+}  // namespace ops
+}  // namespace tensorflow
diff --git a/tensorflow/cc/gradients/nn_grad_test.cc b/tensorflow/cc/gradients/nn_grad_test.cc
new file mode 100644
index 00000000000..ef0a2f9626b
--- /dev/null
+++ b/tensorflow/cc/gradients/nn_grad_test.cc
@@ -0,0 +1,91 @@
+/* Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
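The rewritten softmax gradient used by SoftmaxGrad above, dL/dx = (dL/dy - sum(dL/dy * y)) * y, can be checked against a finite difference with a small standalone C++ sketch (the names and values below are illustrative, not part of the patch):

#include <cmath>
#include <cstdio>
#include <vector>

// Softmax of one row.
static std::vector<double> Softmax(const std::vector<double>& x) {
  double z = 0.0;
  std::vector<double> y(x.size());
  for (double v : x) z += std::exp(v);
  for (size_t i = 0; i < x.size(); ++i) y[i] = std::exp(x[i]) / z;
  return y;
}

int main() {
  // Loss L(x) = sum_i w[i] * softmax(x)[i], so the upstream gradient dL/dy = w.
  std::vector<double> x = {0.1, -0.4, 0.7}, w = {1.0, -0.5, 0.25};
  std::vector<double> y = Softmax(x);

  // s = sum(dL/dy * y), the scalar in the rewritten formula.
  double s = 0.0;
  for (size_t i = 0; i < y.size(); ++i) s += w[i] * y[i];

  const double eps = 1e-6;
  for (size_t i = 0; i < x.size(); ++i) {
    // Analytic: dL/dx = (dL/dy - sum(dL/dy * y)) * y.
    double analytic = (w[i] - s) * y[i];
    // Central finite difference of L along x[i].
    std::vector<double> xp = x, xm = x;
    xp[i] += eps;
    xm[i] -= eps;
    std::vector<double> yp = Softmax(xp), ym = Softmax(xm);
    double lp = 0.0, lm = 0.0;
    for (size_t j = 0; j < x.size(); ++j) {
      lp += w[j] * yp[j];
      lm += w[j] * ym[j];
    }
    double numeric = (lp - lm) / (2 * eps);
    std::printf("dL/dx[%zu]: analytic=%.6f numeric=%.6f\n", i, analytic,
                numeric);
  }
  return 0;
}

The two columns agree to several decimal places, which is exactly the comparison the gradient checker automates.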
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#include "tensorflow/cc/framework/grad_op_registry.h"
+#include "tensorflow/cc/framework/gradient_checker.h"
+#include "tensorflow/cc/framework/testutil.h"
+#include "tensorflow/cc/gradients/grad_testutil.h"
+#include "tensorflow/cc/ops/standard_ops.h"
+#include "tensorflow/core/framework/tensor_testutil.h"
+#include "tensorflow/core/lib/core/status_test_util.h"
+#include "tensorflow/core/lib/random/random.h"
+
+namespace tensorflow {
+using namespace ops;  // NOLINT(build/namespaces)
+
+namespace {
+
+class NNGradTest : public ::testing::Test {
+ protected:
+  NNGradTest() : scope_(Scope::NewRootScope()) {}
+
+  void RunTest(const Output& x, const TensorShape& x_shape, const Output& y,
+               const TensorShape& y_shape) {
+    float max_error;
+    TF_ASSERT_OK(ComputeGradientError<float>(scope_, x, x_shape, y, y_shape,
+                                             &max_error));
+    EXPECT_LT(max_error, 1e-4);
+  }
+
+  void RunTest(const Output& x, const Tensor& x_init_value, const Output& y,
+               const TensorShape& y_shape) {
+    float max_error;
+    TF_ASSERT_OK(ComputeGradientError<float>(scope_, x, x_init_value, y,
+                                             y_shape, &max_error));
+    EXPECT_LT(max_error, 1e-4);
+  }
+
+  Scope scope_;
+};
+
+TEST_F(NNGradTest, SoftmaxGrad) {
+  TensorShape shape({32, 10});
+  auto x = Placeholder(scope_, DT_FLOAT, Placeholder::Shape(shape));
+  auto y = Softmax(scope_, x);
+  RunTest(x, shape, y, shape);
+}
+
+TEST_F(NNGradTest, ReluGrad) {
+  TensorShape shape({5, 2});
+  auto x = Placeholder(scope_, DT_FLOAT, Placeholder::Shape(shape));
+  auto y = Relu(scope_, x);
+  // Avoid input values where ReLU gradient is not well defined (around zero).
+  Tensor x_init_value = test::AsTensor<float>(
+      {-0.9, -0.7, -0.5, -0.3, -0.1, 0.1, 0.3, 0.5, 0.7, 0.9}, {5, 2});
+  RunTest(x, x_init_value, y, shape);
+}
+
+TEST_F(NNGradTest, Relu6Grad) {
+  TensorShape shape({5, 2});
+  auto x = Placeholder(scope_, DT_FLOAT, Placeholder::Shape(shape));
+  auto y = Relu6(scope_, x);
+  // Avoid input values where ReLU gradient is not well defined (around zero
+  // and six).
+  Tensor x_init_value = test::AsTensor<float>(
+      {-0.9, -0.7, -0.5, -0.3, -0.1, 6.1, 6.3, 6.5, 6.7, 6.9}, {5, 2});
+  RunTest(x, x_init_value, y, shape);
+}
+
+TEST_F(NNGradTest, EluGrad) {
+  TensorShape shape({5, 2});
+  auto x = Placeholder(scope_, DT_FLOAT, Placeholder::Shape(shape));
+  auto y = Elu(scope_, x);
+  Tensor x_init_value = test::AsTensor<float>(
+      {-0.9, -0.7, -0.5, -0.3, -0.1, 0.1, 0.3, 0.5, 0.7, 0.9}, {5, 2});
+  RunTest(x, x_init_value, y, shape);
+}
+
+}  // namespace
+}  // namespace tensorflow
diff --git a/tensorflow/cc/training/coordinator.cc b/tensorflow/cc/training/coordinator.cc
new file mode 100644
index 00000000000..254538d7785
--- /dev/null
+++ b/tensorflow/cc/training/coordinator.cc
@@ -0,0 +1,90 @@
+/* Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
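The x_init_value choices in the tests above keep inputs away from 0 (and from 6 for Relu6) because a finite-difference estimate that straddles a kink averages the two one-sided slopes and disagrees with the analytic gradient. A standalone illustration (values are arbitrary):

#include <algorithm>
#include <cstdio>

static double Relu(double x) { return std::max(0.0, x); }

int main() {
  const double eps = 1e-3;
  // A central difference straddling the kink at 0 averages the one-sided
  // slopes (0 and 1) and reports ~0.5, while the analytic gradient is 0 or 1.
  double at_kink = (Relu(eps) - Relu(-eps)) / (2 * eps);
  // Away from the kink the numeric and analytic values agree.
  double away = (Relu(0.5 + eps) - Relu(0.5 - eps)) / (2 * eps);
  std::printf("numeric at 0: %.3f, numeric at 0.5: %.3f\n", at_kink, away);
  return 0;
}

This is why the new ComputeGradientError overload that accepts x_init_value exists: it lets tests pin the evaluation points instead of relying on random initialization.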
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#include "tensorflow/cc/training/coordinator.h"
+
+namespace tensorflow {
+
+Coordinator::Coordinator() : Coordinator(std::vector<error::Code>()) {}
+
+Coordinator::Coordinator(const std::vector<error::Code>& clean_stop_errors)
+    : should_stop_(false) {
+  if (clean_stop_errors.empty()) {
+    clean_stop_errors_.insert(error::OUT_OF_RANGE);
+  } else {
+    for (const auto& code : clean_stop_errors) {
+      clean_stop_errors_.insert(static_cast<int>(code));
+    }
+  }
+}
+
+Coordinator::~Coordinator() {
+  RequestStop();
+  Join();
+}
+
+Status Coordinator::RegisterRunner(std::unique_ptr<RunnerInterface> runner) {
+  runners_.push_back(std::move(runner));
+  return Status::OK();
+}
+
+Status Coordinator::RequestStop() {
+  mutex_lock l(mu_);
+  if (should_stop_) {
+    return Status(error::FAILED_PRECONDITION,
+                  "The coordinator has already been stopped.");
+  }
+  should_stop_ = true;
+  wait_for_stop_.notify_all();
+  return Status::OK();
+}
+
+bool Coordinator::ShouldStop() {
+  mutex_lock l(mu_);
+  return should_stop_;
+}
+
+Status Coordinator::Join() {
+  // TODO(yuefengz): deal with unexpected calls to Join().
+  // TODO(yuefengz): deal with stragglers.
+  for (const auto& t : runners_) {
+    ReportStatus(t->Join());
+  }
+  runners_.clear();
+  return status_;
+}
+
+void Coordinator::ReportStatus(const Status& status) {
+  mutex_lock l(status_lock_);
+  if (status.ok() || !status_.ok() ||
+      clean_stop_errors_.count(static_cast<int>(status.code())) > 0) {
+    return;
+  }
+  status_ = status;
+}
+
+Status Coordinator::GetStatus() {
+  mutex_lock l(status_lock_);
+  return status_;
+}
+
+void Coordinator::WaitForStop() {
+  mutex_lock l(mu_);
+  while (!should_stop_) {
+    wait_for_stop_.wait(l);
+  }
+}
+
+}  // namespace tensorflow
diff --git a/tensorflow/cc/training/coordinator.h b/tensorflow/cc/training/coordinator.h
new file mode 100644
index 00000000000..987d243fbd0
--- /dev/null
+++ b/tensorflow/cc/training/coordinator.h
@@ -0,0 +1,109 @@
+/* Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#ifndef THIRD_PARTY_TENSORFLOW_CC_TRAINING_COORDINATOR_H_
+#define THIRD_PARTY_TENSORFLOW_CC_TRAINING_COORDINATOR_H_
+
+#include <memory>
+#include <unordered_set>
+#include <vector>
+
+#include "tensorflow/core/lib/core/error_codes.pb.h"
+#include "tensorflow/core/lib/core/status.h"
+#include "tensorflow/core/platform/macros.h"
+#include "tensorflow/core/platform/mutex.h"
+
+namespace tensorflow {
+
+// The abstract interface for runners, which must implement the Join function.
+class RunnerInterface {
+ public:
+  virtual ~RunnerInterface() {}
+  virtual Status Join() = 0;
+};
+
+// The Coordinator class manages the termination of a collection of
+// QueueRunners. Without a coordinator, QueueRunners have to be joined in a
+// specific order; otherwise QueueRunner::Join() could sometimes hang. The key
+// entry point is Coordinator::RequestStop(), which notifies all running
+// threads under the coordinator to stop; it may be called from any thread or
+// client.
+// Usage, in the client:
+//   Coordinator coord;
+//   std::unique_ptr<QueueRunner> qr;
+//   TF_CHECK_OK(QueueRunner::New(queue_runner_def, &coord, &qr));
+//   TF_CHECK_OK(qr->Start(session));
+//   coord.RegisterRunner(std::move(qr));
+//   // do some work
+//   TF_CHECK_OK(coord.Join());
+// In each thread of the QueueRunner, the coordinator is used as:
+//   void Run() {
+//     while (!coord->ShouldStop()) {
+//       // do some work
+//       if (error) {
+//         coord->RequestStop();
+//         coord->ReportStatus(error_status);
+//       }
+//     }
+//   }
+class Coordinator {
+ public:
+  Coordinator();
+
+  // Constructor with a list of error codes which are not treated as errors in
+  // status reporting.
+  Coordinator(const std::vector<error::Code>& clean_stop_errors);
+
+  // The destructor calls RequestStop() and Join().
+  ~Coordinator();
+
+  // Registers a runner, i.e. a unit of running threads, usually a QueueRunner.
+  // It takes ownership of the runner to avoid lifecycle problems. Note that
+  // the coordinator does not start these threads; they are expected to be
+  // running when they are registered here.
+  Status RegisterRunner(std::unique_ptr<RunnerInterface> runner);
+
+  // Requests all running threads to stop.
+  Status RequestStop();
+
+  // Returns true if RequestStop() has been called.
+  bool ShouldStop();
+
+  // Joins all threads; returns OK or the first reported status that is not a
+  // clean-stop error.
+  Status Join();
+
+  // Reports a status to the coordinator. This is usually called by threads.
+  void ReportStatus(const Status& status);
+
+  // Returns the latest status.
+  Status GetStatus();
+
+  // Returns immediately if the coordinator is stopped, or blocks until
+  // RequestStop() is called.
+  void WaitForStop();
+
+ private:
+  std::vector<std::unique_ptr<RunnerInterface>> runners_;
+  std::unordered_set<int> clean_stop_errors_;
+  mutex mu_;
+  bool should_stop_ GUARDED_BY(mu_);
+  mutex status_lock_;
+  Status status_;
+  condition_variable wait_for_stop_;
+  TF_DISALLOW_COPY_AND_ASSIGN(Coordinator);
+};
+
+}  // namespace tensorflow
+
+#endif  // THIRD_PARTY_TENSORFLOW_CC_TRAINING_COORDINATOR_H_
diff --git a/tensorflow/cc/training/coordinator_test.cc b/tensorflow/cc/training/coordinator_test.cc
new file mode 100644
index 00000000000..3bdce5f07f9
--- /dev/null
+++ b/tensorflow/cc/training/coordinator_test.cc
@@ -0,0 +1,183 @@
+/* Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
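To make the ownership contract of the header above concrete, here is a minimal sketch using an invented NoopRunner (illustrative only; it assumes the TensorFlow cc headers are available on the include path):

#include <memory>

#include "tensorflow/cc/training/coordinator.h"

namespace tensorflow {

// A trivial runner; a real implementation would own threads and join them.
class NoopRunner : public RunnerInterface {
 public:
  Status Join() override { return Status::OK(); }
};

void Example() {
  Coordinator coord;
  // The coordinator takes ownership and joins the runner in Join().
  coord.RegisterRunner(std::unique_ptr<RunnerInterface>(new NoopRunner));
  coord.RequestStop();        // any thread may request the stop
  TF_CHECK_OK(coord.Join());  // returns the first non-clean-stop error, if any
}

}  // namespace tensorflow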
+==============================================================================*/
+
+#include "tensorflow/cc/training/coordinator.h"
+
+#include "tensorflow/cc/training/queue_runner.h"
+#include "tensorflow/core/lib/core/blocking_counter.h"
+#include "tensorflow/core/lib/core/error_codes.pb.h"
+#include "tensorflow/core/lib/core/notification.h"
+#include "tensorflow/core/lib/core/status_test_util.h"
+#include "tensorflow/core/platform/env.h"
+#include "tensorflow/core/platform/test.h"
+#include "tensorflow/core/public/session.h"
+
+namespace tensorflow {
+namespace {
+
+using error::Code;
+
+void WaitForStopThread(Coordinator* coord, bool* stopped, Notification* done) {
+  coord->WaitForStop();
+  *stopped = true;
+  done->Notify();
+}
+
+TEST(CoordinatorTest, TestStopAndWaitOnStop) {
+  Coordinator coord;
+  EXPECT_EQ(coord.ShouldStop(), false);
+
+  bool stopped = false;
+  Notification done;
+  Env::Default()->SchedClosure(
+      std::bind(&WaitForStopThread, &coord, &stopped, &done));
+  Env::Default()->SleepForMicroseconds(10000000);
+  EXPECT_EQ(stopped, false);
+
+  coord.RequestStop();
+  done.WaitForNotification();
+  EXPECT_EQ(stopped, true);
+  EXPECT_EQ(coord.ShouldStop(), true);
+}
+
+class MockQueueRunner : public RunnerInterface {
+ public:
+  MockQueueRunner(Coordinator* coord) {
+    coord_ = coord;
+    join_counter_ = nullptr;
+    thread_pool_.reset(new thread::ThreadPool(Env::Default(), "test-pool", 10));
+  }
+
+  MockQueueRunner(Coordinator* coord, int* join_counter)
+      : MockQueueRunner(coord) {
+    join_counter_ = join_counter;
+  }
+
+  void StartCounting(std::atomic<int>* counter, int until) {
+    thread_pool_->Schedule(
+        std::bind(&MockQueueRunner::CountThread, this, counter, until));
+  }
+
+  void StartSettingStatus(const Status& status, BlockingCounter* counter) {
+    thread_pool_->Schedule(
+        std::bind(&MockQueueRunner::SetStatusThread, this, status, counter));
+  }
+
+  Status Join() {
+    if (join_counter_ != nullptr) {
+      (*join_counter_)++;
+    }
+    thread_pool_.reset();
+    return status_;
+  }
+
+  Status GetStatus() { return status_; }
+
+  void SetStatus(const Status& status) { status_ = status; }
+
+ private:
+  void CountThread(std::atomic<int>* counter, int until) {
+    while (!coord_->ShouldStop() && counter->load() < until) {
+      (*counter)++;
+      Env::Default()->SleepForMicroseconds(100000);
+    }
+    coord_->RequestStop();
+  }
+  void SetStatusThread(const Status& status, BlockingCounter* counter) {
+    Env::Default()->SleepForMicroseconds(100000);
+    SetStatus(status);
+    counter->DecrementCount();
+  }
+  std::unique_ptr<thread::ThreadPool> thread_pool_;
+  Status status_;
+  Coordinator* coord_;
+  int* join_counter_;
+};
+
+TEST(CoordinatorTest, TestRealStop) {
+  std::atomic<int> counter(0);
+  Coordinator coord;
+
+  std::unique_ptr<MockQueueRunner> qr1(new MockQueueRunner(&coord));
+  qr1->StartCounting(&counter, 100);
+  coord.RegisterRunner(std::move(qr1));
+
+  std::unique_ptr<MockQueueRunner> qr2(new MockQueueRunner(&coord));
+  qr2->StartCounting(&counter, 100);
+  coord.RegisterRunner(std::move(qr2));
+
+  // Wait until the counting has started.
+  while (counter.load() == 0)
+    ;
+  coord.RequestStop();
+
+  int temp_counter = counter.load();
+  Env::Default()->SleepForMicroseconds(10000000);
+  EXPECT_EQ(temp_counter, counter.load());
+  TF_EXPECT_OK(coord.Join());
+}
+
+TEST(CoordinatorTest, TestRequestStop) {
+  Coordinator coord;
+  std::atomic<int> counter(0);
+  std::unique_ptr<MockQueueRunner> qr;
+  for (int i = 0; i < 10; i++) {
+    qr.reset(new MockQueueRunner(&coord));
+    qr->StartCounting(&counter, 10);
+    coord.RegisterRunner(std::move(qr));
+  }
+
+  coord.WaitForStop();
+  EXPECT_EQ(coord.ShouldStop(), true);
+  EXPECT_EQ(counter.load(), 10);
+  TF_EXPECT_OK(coord.Join());
+}
+
+TEST(CoordinatorTest, TestJoin) {
+  Coordinator coord;
+  int join_counter = 0;
+  std::unique_ptr<MockQueueRunner> qr1(
+      new MockQueueRunner(&coord, &join_counter));
+  coord.RegisterRunner(std::move(qr1));
+  std::unique_ptr<MockQueueRunner> qr2(
+      new MockQueueRunner(&coord, &join_counter));
+  coord.RegisterRunner(std::move(qr2));
+
+  TF_EXPECT_OK(coord.Join());
+  EXPECT_EQ(join_counter, 2);
+}
+
+TEST(CoordinatorTest, StatusReporting) {
+  Coordinator coord({Code::CANCELLED, Code::OUT_OF_RANGE});
+  BlockingCounter counter(3);
+
+  std::unique_ptr<MockQueueRunner> qr1(new MockQueueRunner(&coord));
+  qr1->StartSettingStatus(Status(Code::CANCELLED, ""), &counter);
+  coord.RegisterRunner(std::move(qr1));
+
+  std::unique_ptr<MockQueueRunner> qr2(new MockQueueRunner(&coord));
+  qr2->StartSettingStatus(Status(Code::INVALID_ARGUMENT, ""), &counter);
+  coord.RegisterRunner(std::move(qr2));
+
+  std::unique_ptr<MockQueueRunner> qr3(new MockQueueRunner(&coord));
+  qr3->StartSettingStatus(Status(Code::OUT_OF_RANGE, ""), &counter);
+  coord.RegisterRunner(std::move(qr3));
+
+  counter.Wait();
+  EXPECT_EQ(coord.Join().code(), Code::INVALID_ARGUMENT);
+}
+
+}  // namespace
+}  // namespace tensorflow
diff --git a/tensorflow/cc/training/queue_runner.cc b/tensorflow/cc/training/queue_runner.cc
index ed1d0a5da0c..bc48a41ff5d 100644
--- a/tensorflow/cc/training/queue_runner.cc
+++ b/tensorflow/cc/training/queue_runner.cc
@@ -25,6 +25,14 @@ Status QueueRunner::New(const QueueRunnerDef& queue_runner_def,
   return (*result)->Init(queue_runner_def);
 }
 
+Status QueueRunner::New(const QueueRunnerDef& queue_runner_def,
+                        Coordinator* coord,
+                        std::unique_ptr<QueueRunner>* result) {
+  result->reset(new QueueRunner());
+  (*result)->coord_ = coord;
+  return (*result)->Init(queue_runner_def);
+}
+
 Status QueueRunner::Init(const QueueRunnerDef& queue_runner_def) {
   queue_name_ = queue_runner_def.queue_name();
   enqueue_op_names_.clear();
@@ -46,8 +54,8 @@ Status QueueRunner::Init(const QueueRunnerDef& queue_runner_def) {
   }
 
   thread_pool_.reset(new thread::ThreadPool(
-      Env::Default(), SanitizeThreadSuffix(queue_name_), runs_));
-  should_stop_ = false;
+      Env::Default(), SanitizeThreadSuffix(queue_name_), runs_ + 1));
+
   return Status::OK();
 }
 
@@ -57,63 +65,108 @@ QueueRunner::~QueueRunner() {
   Join();
 }
 
-Status QueueRunner::Start(Session* sess) {
+Status QueueRunner::Start(Session* sess) { return Start(sess, 0); }
+
+Status QueueRunner::Start(Session* sess, int wait_for) {
+  counter_.reset(new BlockingCounter(runs_));
   for (const string& enqueue_op : enqueue_op_names_) {
     thread_pool_->Schedule(
         std::bind(&QueueRunner::Run, this, sess, enqueue_op));
   }
+  if (coord_) {
+    thread_pool_->Schedule(std::bind(&QueueRunner::Stop, this, sess));
+  }
+  // Wait for up to 'wait_for' milliseconds.
+  if (wait_for > 0) {
+    if (!counter_->WaitFor(std::chrono::milliseconds(wait_for))) {
+      return Status(error::DEADLINE_EXCEEDED,
+                    "Queues not fed before the timeout");
+    }
+    // Check the status of the queue runner as well as the result of the
+    // enqueue operations.
+    mutex_lock l(mu_);
+    if (!enqueue_status_.ok()) {
+      return enqueue_status_;
+    } else {
+      return status_;
+    }
+  }
   return Status::OK();
 }
 
-Status QueueRunner::Stop(Session* sess) {
-  should_stop_ = true;
+void QueueRunner::Stop(Session* sess) {
   if (cancel_op_name_.empty()) {
-    return Status::OK();
+    return;
   } else {
-    return sess->Run({}, {}, {cancel_op_name_}, nullptr);
+    CHECK(coord_ != nullptr);
+    coord_->WaitForStop();
+    UpdateStatus(sess->Run({}, {}, {cancel_op_name_}, nullptr));
   }
 }
 
 Status QueueRunner::Join() {
   thread_pool_.reset();
+  mutex_lock l(mu_);
   return status_;
 }
 
+void QueueRunner::UpdateStatus(const Status& status) {
+  {
+    mutex_lock l(mu_);
+    if (!status_.ok() || status.ok() ||
+        queue_closed_exception_types_.count(static_cast<int>(status.code())) >
+            0) {
+      return;
+    }
+    status_ = status;
+  }
+  if (coord_) {
+    coord_->ReportStatus(status);
+  }
+}
+
 void QueueRunner::Run(Session* sess, const string& enqueue_op) {
   bool decremented = false;
-  while (!should_stop_.load()) {
+  bool first_iteration = true;
+  while (true) {
+    if (coord_ && coord_->ShouldStop()) {
+      break;
+    }
     auto status = sess->Run({}, {}, {enqueue_op}, nullptr);
+    if (first_iteration) {
+      if (!status.ok()) {
+        mutex_lock l(mu_);
+        enqueue_status_ = status;
+      }
+      counter_->DecrementCount();
+      first_iteration = false;
+    }
     if (status.ok()) {
       continue;
     } else if (queue_closed_exception_types_.count(
                    static_cast<int>(status.code())) > 0) {
-      mutex_lock l(mu_);
-      runs_--;
-      decremented = true;
-      should_stop_ = true;
-
-      // If all enqueue ops have finished, run the close op.
-      if (runs_ == 0 && !close_op_name_.empty()) {
-        auto s = sess->Run({}, {}, {close_op_name_}, nullptr);
-        if (!s.ok() && status_.ok() &&
-            queue_closed_exception_types_.count(static_cast<int>(s.code())) ==
-                0) {
-          status_ = s;
-        }
-      }
-    } else {
       {
         mutex_lock l(mu_);
-        should_stop_ = true;
-        // Only record the first failure status.
-        if (status_.ok()) {
-          status_ = status;
-        }
+        runs_--;
+        decremented = true;
       }
-      // Stop the queue runner immediately to propagate the error to
-      // subsequent queues.
-      Stop(sess);
+
+      // If all enqueue ops have finished, run the close op.
+      if (runs_ == 0) {
+        if (!close_op_name_.empty()) {
+          auto s = sess->Run({}, {}, {close_op_name_}, nullptr);
+          UpdateStatus(s);
+        }
+        break;
+      }
+    } else {
+      UpdateStatus(status);
+      if (coord_) {
+        coord_->RequestStop();
+      }
+      break;
     }
+    first_iteration = false;
   }
 
   if (!decremented) {
diff --git a/tensorflow/cc/training/queue_runner.h b/tensorflow/cc/training/queue_runner.h
index 9374fe36050..01dd7459512 100644
--- a/tensorflow/cc/training/queue_runner.h
+++ b/tensorflow/cc/training/queue_runner.h
@@ -21,6 +21,8 @@ limitations under the License.
 
 #include <unordered_set>
 #include <vector>
+#include "tensorflow/cc/training/coordinator.h"
+#include "tensorflow/core/lib/core/blocking_counter.h"
 #include "tensorflow/core/lib/core/error_codes.pb.h"
 #include "tensorflow/core/lib/core/status.h"
 #include "tensorflow/core/lib/core/threadpool.h"
@@ -32,7 +34,7 @@ namespace tensorflow {
 
 // QueueRunner class imitates the behavior of the python version of QueueRunner
 // which creates a thread for each enqueue op, runs close op on completion.
-class QueueRunner {
+class QueueRunner : public RunnerInterface {
  public:
   // Creates a new QueueRunner from proto.
   // TODO(yuefengz): we may want to initialize from queues and ops in the
@@ -40,24 +42,29 @@ class QueueRunner {
   static Status New(const QueueRunnerDef& queue_runner_def,
                     std::unique_ptr<QueueRunner>* result);
 
+  // Creates a new QueueRunner with a coordinator; see coordinator.h for usage.
+  static Status New(const QueueRunnerDef& queue_runner_def, Coordinator* coord,
+                    std::unique_ptr<QueueRunner>* result);
+
   // The destructor would join all the threads.
   ~QueueRunner();
 
   // Starts the queue runner with the given session.
   Status Start(Session* sess);
 
-  // Requests to stop and runs the cancel op.
-  Status Stop(Session* sess);
+  // Starts the queue runner with the given session, and waits for up to the
+  // specified time (in milliseconds) for the queues to start to fill up.
+  Status Start(Session* sess, int wait_for);
 
   // Joins all the threads. Returns okay if all threads run successfully;
   // otherwise returns the first captured failure status.
-  Status Join();
+  Status Join() final;
 
   // Returns the latest status.
   Status GetStatus();
 
  private:
-  QueueRunner() {}
+  QueueRunner() : coord_(nullptr) {}
 
   // Initializes the instance with the QueueRunnerDef proto.
   Status Init(const QueueRunnerDef& queue_runner_def);
@@ -65,6 +72,14 @@ class QueueRunner {
   // The Run function for each thread.
   void Run(Session* sess, const string& enqueue_op);
 
+  // Requests to stop and runs the cancel op. It is called in a separate thread
+  // when a coordinator is set.
+  void Stop(Session* sess);
+
+  // Updates the internal status; it only keeps OK or the first unexpected
+  // error status.
+  void UpdateStatus(const Status& status);
+
   string queue_name_;
   std::vector<string> enqueue_op_names_;
   string close_op_name_;
@@ -73,12 +88,15 @@ class QueueRunner {
   std::unordered_set<int> queue_closed_exception_types_;
 
   std::unique_ptr<thread::ThreadPool> thread_pool_;
-  std::atomic<bool> should_stop_;
   condition_variable wait_to_close_;
   mutex mu_;
   // TODO(yuefengz): implement c++ coordinator.
   int runs_ = 0;
-  Status status_;
+  Status status_ GUARDED_BY(mu_);
+  Status enqueue_status_ GUARDED_BY(mu_);
+  std::unique_ptr<BlockingCounter> counter_;
+
+  Coordinator* coord_;
 };
 
 }  // namespace tensorflow
diff --git a/tensorflow/cc/training/queue_runner_test.cc b/tensorflow/cc/training/queue_runner_test.cc
index 0d06c620566..73ea5a307f9 100644
--- a/tensorflow/cc/training/queue_runner_test.cc
+++ b/tensorflow/cc/training/queue_runner_test.cc
@@ -20,6 +20,7 @@ limitations under the License.
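Taken together with coordinator.h, the intended client flow for these overloads looks roughly like the following. This is a hypothetical fragment: queue_runner_def and session are assumed to already exist, the 100 ms timeout is arbitrary, and it mirrors the TestCoordinatorStop test further below.

// Hypothetical usage fragment; 'queue_runner_def' and 'session' are assumed.
Coordinator coord;
std::unique_ptr<QueueRunner> qr;
TF_CHECK_OK(QueueRunner::New(queue_runner_def, &coord, &qr));
// Start(sess, wait_for) blocks for up to 'wait_for' ms until every enqueue
// thread has completed its first run; 0 means do not wait.
TF_CHECK_OK(qr->Start(session.get(), 100));
coord.RegisterRunner(std::move(qr));  // the coordinator now owns the runner
// ... run training steps ...
TF_CHECK_OK(coord.RequestStop());
TF_CHECK_OK(coord.Join());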
#include "tensorflow/cc/framework/scope.h" #include "tensorflow/cc/ops/standard_ops.h" +#include "tensorflow/cc/training/coordinator.h" #include "tensorflow/core/framework/graph.pb.h" #include "tensorflow/core/framework/tensor.h" #include "tensorflow/core/framework/tensor_shape.h" @@ -111,7 +112,7 @@ TEST(QueueRunnerTest, BasicTest) { auto session = BuildSessionAndInitVariable(graph_def); QueueRunnerDef queue_runner_def = BuildQueueRunnerDef( - kQueueName, {kCountUpToOpName, kCountUpToOpName}, kSquareOpName, "", {}); + kQueueName, {kCountUpToOpName}, kSquareOpName, "", {}); std::unique_ptr qr; TF_EXPECT_OK(QueueRunner::New(queue_runner_def, &qr)); @@ -164,7 +165,8 @@ GraphDef BuildDoubleQueueGraph() { auto close0 = QueueClose(root.WithOpName(kCloseOp0), q0); auto cancel0 = QueueClose(root.WithOpName(kCancelOp0), q0, QueueClose::CancelPendingEnqueues(true)); - auto q1 = FIFOQueue(root.WithOpName(kQueueName1), {DataType::DT_INT32}); + auto q1 = FIFOQueue(root.WithOpName(kQueueName1), {DataType::DT_INT32}, + FIFOQueue::Capacity(3)); auto dequeue0 = QueueDequeue(root.WithOpName(kDequeueOp0), q0, {DataType::DT_INT32}); auto enqueue1 = QueueEnqueue(root.WithOpName(kEnqueueOp1), q1, {dequeue0[0]}); @@ -252,34 +254,34 @@ TEST(QueueRunnerTest, SessionCloseCancelPendingEnqueue) { EXPECT_EQ(join_succeeded, true); } -TEST(QueueRunnerTest, Stop) { - auto graph_def = BuildDoubleQueueGraph(); +TEST(QueueRunnerTest, EmptyEnqueueOps) { + QueueRunnerDef queue_runner_def = + BuildQueueRunnerDef(kQueueName, {}, kCountUpToOpName, "", {}); + std::unique_ptr qr; + EXPECT_EQ(QueueRunner::New(queue_runner_def, &qr).code(), + Code::INVALID_ARGUMENT); +} + +TEST(QueueRunnerTest, StartTimeout) { + GraphDef graph_def = BuildDoubleQueueGraph(); SessionOptions options; std::unique_ptr session(NewSession(options)); TF_CHECK_OK(session->Create(graph_def)); - QueueRunnerDef queue_runner_def = - BuildQueueRunnerDef(kQueueName1, {kEnqueueOp1}, kCloseOp1, kCancelOp1, - {Code::OUT_OF_RANGE, Code::CANCELLED}); + QueueRunnerDef queue_runner_def = BuildQueueRunnerDef( + kQueueName1, {kEnqueueOp1}, kCloseOp1, kCancelOp1, {}); + std::unique_ptr qr; TF_EXPECT_OK(QueueRunner::New(queue_runner_def, &qr)); - TF_CHECK_OK(qr->Start(session.get())); - - TF_EXPECT_OK(qr->Stop(session.get())); - - TF_EXPECT_OK(session->Run({}, {}, {kEnqueueOp0}, nullptr)); - - EXPECT_EQ(session->Run({}, {kDequeueOp1}, {}, nullptr).code(), - Code::OUT_OF_RANGE); - - // qr is already stopped - TF_EXPECT_OK(qr->Join()); + // This will timeout since queue0 is not fed and queue1 is fetching data from + // queue0. 
+  EXPECT_EQ(qr->Start(session.get(), 1).code(), Code::DEADLINE_EXCEEDED);
+
+  session->Close();
 }
 
-TEST(QueueRunnerTest, StopTwoQueues) {
+TEST(QueueRunnerTest, TestCoordinatorStop) {
   auto graph_def = BuildDoubleQueueGraph();
-
   SessionOptions options;
   std::unique_ptr<Session> session(NewSession(options));
   TF_CHECK_OK(session->Create(graph_def));
@@ -290,31 +292,24 @@ TEST(QueueRunnerTest, StopTwoQueues) {
   QueueRunnerDef queue_runner1 =
       BuildQueueRunnerDef(kQueueName1, {kEnqueueOp1}, kCloseOp1, kCancelOp1,
                           {Code::OUT_OF_RANGE, Code::CANCELLED});
+
+  Coordinator coord;
   std::unique_ptr<QueueRunner> qr0;
-  TF_EXPECT_OK(QueueRunner::New(queue_runner0, &qr0));
+  TF_EXPECT_OK(QueueRunner::New(queue_runner0, &coord, &qr0));
   TF_CHECK_OK(qr0->Start(session.get()));
   std::unique_ptr<QueueRunner> qr1;
-  TF_EXPECT_OK(QueueRunner::New(queue_runner1, &qr1));
+  TF_EXPECT_OK(QueueRunner::New(queue_runner1, &coord, &qr1));
   TF_CHECK_OK(qr1->Start(session.get()));
 
+  coord.RegisterRunner(std::move(qr0));
+  coord.RegisterRunner(std::move(qr1));
+
   std::vector<Tensor> dq;
   TF_EXPECT_OK(session->Run({}, {kDequeueOp1}, {}, &dq));
   EXPECT_EQ(*dq[0].scalar<int>().data(), 10);
 
-  TF_EXPECT_OK(qr0->Stop(session.get()));
-  TF_EXPECT_OK(qr1->Stop(session.get()));
-
-  TF_EXPECT_OK(qr0->Join());
-  TF_EXPECT_OK(qr1->Join());
-}
-
-TEST(QueueRunnerTest, EmptyEnqueueOps) {
-  QueueRunnerDef queue_runner_def =
-      BuildQueueRunnerDef(kQueueName, {}, kCountUpToOpName, "", {});
-
-  std::unique_ptr<QueueRunner> qr;
-  EXPECT_EQ(QueueRunner::New(queue_runner_def, &qr).code(),
-            Code::INVALID_ARGUMENT);
+  TF_EXPECT_OK(coord.RequestStop());
+  TF_EXPECT_OK(coord.Join());
 }
 
 }  // namespace
diff --git a/tensorflow/contrib/BUILD b/tensorflow/contrib/BUILD
index be325ba2f19..704de2605ec 100644
--- a/tensorflow/contrib/BUILD
+++ b/tensorflow/contrib/BUILD
@@ -23,6 +23,7 @@ py_library(
         "//tensorflow/contrib/framework:framework_py",
         "//tensorflow/contrib/graph_editor:graph_editor_py",
         "//tensorflow/contrib/grid_rnn:grid_rnn_py",
+        "//tensorflow/contrib/integrate:integrate_py",
        "//tensorflow/contrib/layers:layers_py",
        "//tensorflow/contrib/learn",
        "//tensorflow/contrib/linear_optimizer:sdca_ops_py",
diff --git a/tensorflow/contrib/__init__.py b/tensorflow/contrib/__init__.py
index dfeacba6d4d..0ded847cfaf 100644
--- a/tensorflow/contrib/__init__.py
+++ b/tensorflow/contrib/__init__.py
@@ -28,6 +28,7 @@ from tensorflow.contrib import factorization
 from tensorflow.contrib import framework
 from tensorflow.contrib import graph_editor
 from tensorflow.contrib import grid_rnn
+from tensorflow.contrib import integrate
 from tensorflow.contrib import layers
 from tensorflow.contrib import learn
 from tensorflow.contrib import linear_optimizer
diff --git a/tensorflow/contrib/bayesflow/examples/reinforce_simple/reinforce_simple_example.py b/tensorflow/contrib/bayesflow/examples/reinforce_simple/reinforce_simple_example.py
index d9ff84a466c..85f75f74033 100644
--- a/tensorflow/contrib/bayesflow/examples/reinforce_simple/reinforce_simple_example.py
+++ b/tensorflow/contrib/bayesflow/examples/reinforce_simple/reinforce_simple_example.py
@@ -76,7 +76,7 @@ def build_split_apply_merge_model():
 
   # REINFORCE forward step
   route_selection = st.StochasticTensor(
-      distributions.Categorical, logits=logits)
+      distributions.Categorical(logits=logits))
 
   # Accessing route_selection as a Tensor below forces a sample of
   # the Categorical distribution based on its logits.
diff --git a/tensorflow/contrib/bayesflow/python/kernel_tests/stochastic_gradient_estimators_test.py b/tensorflow/contrib/bayesflow/python/kernel_tests/stochastic_gradient_estimators_test.py index e1edbc908c5..2a2b4218303 100644 --- a/tensorflow/contrib/bayesflow/python/kernel_tests/stochastic_gradient_estimators_test.py +++ b/tensorflow/contrib/bayesflow/python/kernel_tests/stochastic_gradient_estimators_test.py @@ -22,6 +22,7 @@ import tensorflow as tf st = tf.contrib.bayesflow.stochastic_tensor sge = tf.contrib.bayesflow.stochastic_gradient_estimators +dists = tf.contrib.distributions class StochasticGradientEstimatorsTest(tf.test.TestCase): @@ -31,7 +32,7 @@ class StochasticGradientEstimatorsTest(tf.test.TestCase): self._final_loss = tf.constant(3.2) def _testScoreFunction(self, loss_fn, expected): - x = st.BernoulliTensor(p=self._p, loss_fn=loss_fn) + x = st.StochasticTensor(dists.Bernoulli(p=self._p), loss_fn=loss_fn) sf = x.loss(self._final_loss) with self.test_session() as sess: sess.run(tf.initialize_all_variables()) @@ -62,8 +63,8 @@ class StochasticGradientEstimatorsTest(tf.test.TestCase): def testScoreFunctionWithMeanBaseline(self): ema_decay = 0.8 num_steps = 6 - x = st.BernoulliTensor( - p=self._p, + x = st.StochasticTensor( + dists.Bernoulli(p=self._p), loss_fn=sge.get_score_function_with_baseline( sge.get_mean_baseline(ema_decay))) sf = x.loss(self._final_loss) @@ -98,12 +99,12 @@ class StochasticGradientEstimatorsTest(tf.test.TestCase): def testScoreFunctionWithMeanBaselineHasUniqueVarScope(self): ema_decay = 0.8 - x = st.BernoulliTensor( - p=self._p, + x = st.StochasticTensor( + dists.Bernoulli(p=self._p), loss_fn=sge.get_score_function_with_baseline( sge.get_mean_baseline(ema_decay))) - y = st.BernoulliTensor( - p=self._p, + y = st.StochasticTensor( + dists.Bernoulli(p=self._p), loss_fn=sge.get_score_function_with_baseline( sge.get_mean_baseline(ema_decay))) sf_x = x.loss(self._final_loss) diff --git a/tensorflow/contrib/bayesflow/python/kernel_tests/stochastic_graph_test.py b/tensorflow/contrib/bayesflow/python/kernel_tests/stochastic_graph_test.py index eae678f365b..de5c5c82b82 100644 --- a/tensorflow/contrib/bayesflow/python/kernel_tests/stochastic_graph_test.py +++ b/tensorflow/contrib/bayesflow/python/kernel_tests/stochastic_graph_test.py @@ -39,9 +39,9 @@ class TestSurrogateLosses(tf.test.TestCase): mu = [0.0, 0.1, 0.2] sigma = tf.constant([1.1, 1.2, 1.3]) with st.value_type(st.SampleAndReshapeValue()): - prior = st.StochasticTensor(distributions.Normal, mu=mu, sigma=sigma) + prior = st.StochasticTensor(distributions.Normal(mu=mu, sigma=sigma)) likelihood = st.StochasticTensor( - distributions.Normal, mu=prior, sigma=sigma) + distributions.Normal(mu=prior, sigma=sigma)) self.assertTrue(prior.distribution.is_reparameterized) self.assertTrue(likelihood.distribution.is_reparameterized) @@ -77,10 +77,9 @@ class TestSurrogateLosses(tf.test.TestCase): mu = tf.constant([0.0, 0.1, 0.2]) sigma = tf.constant([1.1, 1.2, 1.3]) with st.value_type(st.SampleAndReshapeValue()): - prior = st.StochasticTensor(NormalNotParam, mu=mu, sigma=sigma) - likelihood = st.StochasticTensor( - NormalNotParam, mu=prior, sigma=sigma) - prior_2 = st.StochasticTensor(NormalNotParam, mu=mu, sigma=sigma) + prior = st.StochasticTensor(NormalNotParam(mu=mu, sigma=sigma)) + likelihood = st.StochasticTensor(NormalNotParam(mu=prior, sigma=sigma)) + prior_2 = st.StochasticTensor(NormalNotParam(mu=mu, sigma=sigma)) loss = tf.square(tf.identity(likelihood) - mu) part_loss = tf.square(tf.identity(prior) - mu) 
@@ -155,9 +154,7 @@ class TestSurrogateLosses(tf.test.TestCase): mu = tf.constant([0.0, 0.1, 0.2]) sigma = tf.constant([1.1, 1.2, 1.3]) with st.value_type(st.SampleAndReshapeValue()): - dt = st.StochasticTensor(NormalNotParam, - mu=mu, - sigma=sigma, + dt = st.StochasticTensor(NormalNotParam(mu=mu, sigma=sigma), loss_fn=None) self.assertEqual(None, dt.loss(tf.constant([2.0]))) @@ -166,8 +163,8 @@ class TestSurrogateLosses(tf.test.TestCase): mu = tf.constant([0.0, 0.1, 0.2]) sigma = tf.constant([1.1, 1.2, 1.3]) with st.value_type(st.SampleAndReshapeValue()): - dt1 = st.StochasticTensor(NormalNotParam, mu=mu, sigma=sigma) - dt2 = st.StochasticTensor(NormalNotParam, mu=mu, sigma=sigma) + dt1 = st.StochasticTensor(NormalNotParam(mu=mu, sigma=sigma)) + dt2 = st.StochasticTensor(NormalNotParam(mu=mu, sigma=sigma)) loss = tf.square(tf.identity(dt1)) + 10. + dt2 sl_all = sg.surrogate_loss([loss]) @@ -186,8 +183,8 @@ class TestSurrogateLosses(tf.test.TestCase): class StochasticDependenciesMapTest(tf.test.TestCase): def testBuildsMapOfUpstreamNodes(self): - dt1 = st.StochasticTensor(distributions.Normal, mu=0., sigma=1.) - dt2 = st.StochasticTensor(distributions.Normal, mu=0., sigma=1.) + dt1 = st.StochasticTensor(distributions.Normal(mu=0., sigma=1.)) + dt2 = st.StochasticTensor(distributions.Normal(mu=0., sigma=1.)) out1 = dt1.value() + 1. out2 = dt2.value() + 2. x = out1 + out2 @@ -197,11 +194,11 @@ class StochasticDependenciesMapTest(tf.test.TestCase): self.assertEqual(dep_map[dt2], set([x, y])) def testHandlesStackedStochasticNodes(self): - dt1 = st.StochasticTensor(distributions.Normal, mu=0., sigma=1.) + dt1 = st.StochasticTensor(distributions.Normal(mu=0., sigma=1.)) out1 = dt1.value() + 1. - dt2 = st.StochasticTensor(distributions.Normal, mu=out1, sigma=1.) + dt2 = st.StochasticTensor(distributions.Normal(mu=out1, sigma=1.)) x = dt2.value() + 2. - dt3 = st.StochasticTensor(distributions.Normal, mu=0., sigma=1.) + dt3 = st.StochasticTensor(distributions.Normal(mu=0., sigma=1.)) y = dt3.value() * 3. dep_map = sg._stochastic_dependencies_map([x, y]) self.assertEqual(dep_map[dt1], set([x])) @@ -209,10 +206,10 @@ class StochasticDependenciesMapTest(tf.test.TestCase): self.assertEqual(dep_map[dt3], set([y])) def testTraversesControlInputs(self): - dt1 = st.StochasticTensor(distributions.Normal, mu=0., sigma=1.) + dt1 = st.StochasticTensor(distributions.Normal(mu=0., sigma=1.)) logits = dt1.value() * 3. - dt2 = st.StochasticTensor(distributions.Bernoulli, logits=logits) - dt3 = st.StochasticTensor(distributions.Normal, mu=0., sigma=1.) + dt2 = st.StochasticTensor(distributions.Bernoulli(logits=logits)) + dt3 = st.StochasticTensor(distributions.Normal(mu=0., sigma=1.)) x = dt3.value() y = tf.ones((2, 2)) * 4. z = tf.ones((2, 2)) * 3. 
diff --git a/tensorflow/contrib/bayesflow/python/kernel_tests/stochastic_tensor_test.py b/tensorflow/contrib/bayesflow/python/kernel_tests/stochastic_tensor_test.py index 95c6d39a617..b7bd2adfe8a 100644 --- a/tensorflow/contrib/bayesflow/python/kernel_tests/stochastic_tensor_test.py +++ b/tensorflow/contrib/bayesflow/python/kernel_tests/stochastic_tensor_test.py @@ -35,19 +35,19 @@ class StochasticTensorTest(tf.test.TestCase): sigma2 = tf.constant([0.1, 0.2, 0.3]) prior_default = st.StochasticTensor( - distributions.Normal, mu=mu, sigma=sigma) + distributions.Normal(mu=mu, sigma=sigma)) self.assertTrue( isinstance(prior_default.value_type, st.SampleAndReshapeValue)) prior_0 = st.StochasticTensor( - distributions.Normal, mu=mu, sigma=sigma, + distributions.Normal(mu=mu, sigma=sigma), dist_value_type=st.SampleAndReshapeValue()) self.assertTrue(isinstance(prior_0.value_type, st.SampleAndReshapeValue)) with st.value_type(st.SampleAndReshapeValue()): - prior = st.StochasticTensor(distributions.Normal, mu=mu, sigma=sigma) + prior = st.StochasticTensor(distributions.Normal(mu=mu, sigma=sigma)) self.assertTrue(isinstance(prior.value_type, st.SampleAndReshapeValue)) likelihood = st.StochasticTensor( - distributions.Normal, mu=prior, sigma=sigma2) + distributions.Normal(mu=prior, sigma=sigma2)) self.assertTrue( isinstance(likelihood.value_type, st.SampleAndReshapeValue)) @@ -77,7 +77,7 @@ class StochasticTensorTest(tf.test.TestCase): sigma = tf.constant([1.1, 1.2, 1.3]) with st.value_type(st.MeanValue()): - prior = st.StochasticTensor(distributions.Normal, mu=mu, sigma=sigma) + prior = st.StochasticTensor(distributions.Normal(mu=mu, sigma=sigma)) self.assertTrue(isinstance(prior.value_type, st.MeanValue)) prior_mean = prior.mean() @@ -94,7 +94,8 @@ class StochasticTensorTest(tf.test.TestCase): with st.value_type(st.SampleAndReshapeValue()): prior_single = st.StochasticTensor( - distributions.Normal, mu=mu, sigma=sigma) + distributions.Normal( + mu=mu, sigma=sigma)) prior_single_value = prior_single.value() self.assertEqual(prior_single_value.get_shape(), (2, 3)) @@ -104,7 +105,7 @@ class StochasticTensorTest(tf.test.TestCase): with st.value_type(st.SampleAndReshapeValue(n=2)): prior_double = st.StochasticTensor( - distributions.Normal, mu=mu, sigma=sigma) + distributions.Normal(mu=mu, sigma=sigma)) prior_double_value = prior_double.value() self.assertEqual(prior_double_value.get_shape(), (4, 3)) @@ -119,7 +120,7 @@ class StochasticTensorTest(tf.test.TestCase): with st.value_type(st.SampleValue()): prior_single = st.StochasticTensor( - distributions.Normal, mu=mu, sigma=sigma) + distributions.Normal(mu=mu, sigma=sigma)) self.assertTrue(isinstance(prior_single.value_type, st.SampleValue)) prior_single_value = prior_single.value() @@ -130,7 +131,7 @@ class StochasticTensorTest(tf.test.TestCase): with st.value_type(st.SampleValue(n=2)): prior_double = st.StochasticTensor( - distributions.Normal, mu=mu, sigma=sigma) + distributions.Normal(mu=mu, sigma=sigma)) prior_double_value = prior_double.value() self.assertEqual(prior_double_value.get_shape(), (2, 2, 3)) @@ -143,9 +144,9 @@ class StochasticTensorTest(tf.test.TestCase): mu = [0.0, -1.0, 1.0] sigma = tf.constant([1.1, 1.2, 1.3]) with st.value_type(st.MeanValue()): - prior = st.StochasticTensor(distributions.Normal, mu=mu, sigma=sigma) + prior = st.StochasticTensor(distributions.Normal(mu=mu, sigma=sigma)) entropy = prior.entropy() - deep_entropy = prior.entropy() + deep_entropy = prior.distribution.entropy() expected_deep_entropy = 
distributions.Normal( mu=mu, sigma=sigma).entropy() entropies = sess.run([entropy, deep_entropy, expected_deep_entropy]) @@ -159,17 +160,15 @@ class StochasticTensorTest(tf.test.TestCase): # With default with st.value_type(st.MeanValue(stop_gradient=True)): - dt = st.StochasticTensor(distributions.Normal, mu=mu, sigma=sigma) + dt = st.StochasticTensor(distributions.Normal(mu=mu, sigma=sigma)) loss = dt.loss([tf.constant(2.0)]) self.assertTrue(loss is not None) - self.assertAllClose(dt.distribution.log_prob(mu).eval() * 2.0, - loss.eval()) + self.assertAllClose( + dt.distribution.log_prob(mu).eval() * 2.0, loss.eval()) # With passed-in loss_fn. dt = st.StochasticTensor( - distributions.Normal, - mu=mu, - sigma=sigma, + distributions.Normal(mu=mu, sigma=sigma), dist_value_type=st.MeanValue(stop_gradient=True), loss_fn=sge.get_score_function_with_constant_baseline( baseline=tf.constant(8.0))) @@ -204,7 +203,7 @@ class ObservedStochasticTensorTest(tf.test.TestCase): sigma = tf.constant([1.1, 1.2, 1.3]) obs = tf.zeros((2, 3)) z = st.ObservedStochasticTensor( - distributions.Normal, mu=mu, sigma=sigma, value=obs) + distributions.Normal(mu=mu, sigma=sigma), value=obs) [obs_val, z_val] = sess.run([obs, z.value()]) self.assertAllEqual(obs_val, z_val) @@ -216,13 +215,13 @@ class ObservedStochasticTensorTest(tf.test.TestCase): sigma = tf.placeholder(tf.float32) obs = tf.placeholder(tf.float32) z = st.ObservedStochasticTensor( - distributions.Normal, mu=mu, sigma=sigma, value=obs) + distributions.Normal(mu=mu, sigma=sigma), value=obs) mu2 = tf.placeholder(tf.float32, shape=[None]) sigma2 = tf.placeholder(tf.float32, shape=[None]) obs2 = tf.placeholder(tf.float32, shape=[None, None]) z2 = st.ObservedStochasticTensor( - distributions.Normal, mu=mu2, sigma=sigma2, value=obs2) + distributions.Normal(mu=mu2, sigma=sigma2), value=obs2) coll = tf.get_collection(st.STOCHASTIC_TENSOR_COLLECTION) self.assertEqual(coll, [z, z2]) @@ -230,27 +229,19 @@ class ObservedStochasticTensorTest(tf.test.TestCase): def testConstructionErrors(self): mu = [0., 0.] sigma = [1., 1.] 
- self.assertRaises(ValueError, st.ObservedStochasticTensor, - distributions.Normal, mu=mu, sigma=sigma, - value=tf.zeros((3,))) - self.assertRaises(ValueError, st.ObservedStochasticTensor, - distributions.Normal, mu=mu, sigma=sigma, - value=tf.zeros((3, 1))) - self.assertRaises(ValueError, st.ObservedStochasticTensor, - distributions.Normal, mu=mu, sigma=sigma, - value=tf.zeros((1, 2), dtype=tf.int32)) - - -class AutomaticDistributionImportTest(tf.test.TestCase): - - def testImportNormal(self): - self.assertTrue(hasattr(st, "NormalTensor")) - self.assertTrue(callable(st.NormalTensor)) - norm = st.NormalTensor(mu=0.0, sigma=1.0) - self.assertEqual(type(norm).__name__, "NormalTensor") - self.assertTrue(isinstance(norm, st.NormalTensor)) - self.assertTrue(isinstance(norm, st.StochasticTensor)) - - -if __name__ == "__main__": - tf.test.main() + self.assertRaises( + ValueError, + st.ObservedStochasticTensor, + distributions.Normal(mu=mu, sigma=sigma), + value=tf.zeros((3,))) + self.assertRaises( + ValueError, + st.ObservedStochasticTensor, + distributions.Normal(mu=mu, sigma=sigma), + value=tf.zeros((3, 1))) + self.assertRaises( + ValueError, + st.ObservedStochasticTensor, + distributions.Normal(mu=mu, sigma=sigma), + value=tf.zeros( + (1, 2), dtype=tf.int32)) diff --git a/tensorflow/contrib/bayesflow/python/kernel_tests/variational_inference_test.py b/tensorflow/contrib/bayesflow/python/kernel_tests/variational_inference_test.py index 336bf981de7..cad42067217 100644 --- a/tensorflow/contrib/bayesflow/python/kernel_tests/variational_inference_test.py +++ b/tensorflow/contrib/bayesflow/python/kernel_tests/variational_inference_test.py @@ -44,7 +44,7 @@ def mini_vae(): x = [[-6., 3., 6.], [-8., 4., 8.]] prior = distributions.Normal(mu=0., sigma=1.) variational = st.StochasticTensor( - distributions.Normal, mu=inference_net(x, 1), sigma=1.) + distributions.Normal(mu=inference_net(x, 1), sigma=1.)) vi.register_prior(variational, prior) px = distributions.Normal(mu=generative_net(variational, 3), sigma=1.) log_likelihood = tf.reduce_sum(px.log_prob(x), 1) @@ -101,7 +101,7 @@ class VariationalInferenceTest(tf.test.TestCase): prior = distributions.Bernoulli(0.5) variational = st.StochasticTensor( - NormalNoEntropy, mu=inference_net(x, 1), sigma=1.) + NormalNoEntropy(mu=inference_net(x, 1), sigma=1.)) vi.register_prior(variational, prior) px = distributions.Normal(mu=generative_net(variational, 3), sigma=1.) 
log_likelihood = tf.reduce_sum(px.log_prob(x), 1) diff --git a/tensorflow/contrib/bayesflow/python/ops/stochastic_tensor.py b/tensorflow/contrib/bayesflow/python/ops/stochastic_tensor.py index 06661059ffd..eaee3344e5d 100644 --- a/tensorflow/contrib/bayesflow/python/ops/stochastic_tensor.py +++ b/tensorflow/contrib/bayesflow/python/ops/stochastic_tensor.py @@ -44,7 +44,6 @@ from __future__ import print_function import abc import collections import contextlib -import inspect import threading import six @@ -79,10 +78,6 @@ class BaseStochasticTensor(object): def graph(self): pass - @abc.abstractproperty - def input_dict(self): - pass - @abc.abstractmethod def value(self, name=None): pass @@ -120,6 +115,7 @@ class BaseStochasticTensor(object): # pylint: disable=protected-access ops.register_tensor_conversion_function( BaseStochasticTensor, BaseStochasticTensor._tensor_conversion_function) + # pylint: enable=protected-access @@ -223,8 +219,8 @@ class SampleAndReshapeValue(_StochasticValueType): st_value = st.value() assertEqual(st_value.get_shape(), (4, 3)) - dt_value_val = sess.run([st_value])[0] # or e.g. run([tf.identity(st)])[0] - assertEqual(dt_value_val.shape, (4, 3)) + st_value_val = sess.run([st_value])[0] # or e.g. run([tf.identity(st)])[0] + assertEqual(st_value_val.shape, (4, 3)) ``` """ @@ -312,17 +308,16 @@ class StochasticTensor(BaseStochasticTensor): """StochasticTensor is a BaseStochasticTensor backed by a distribution.""" def __init__(self, - dist_cls, - name=None, + dist, + name="StochasticTensor", dist_value_type=None, - loss_fn=sge.score_function, - **dist_args): + loss_fn=sge.score_function): """Construct a `StochasticTensor`. - `StochasticTensor` will instantiate a distribution from `dist_cls` and - `dist_args` and its `value` method will return the same value each time - it is called. What `value` is returned is controlled by the - `dist_value_type` (defaults to `SampleAndReshapeValue`). + `StochasticTensor` is backed by the `dist` distribution and its `value` + method will return the same value each time it is called. What `value` is + returned is controlled by the `dist_value_type` (defaults to + `SampleAndReshapeValue`). Some distributions' sample functions are not differentiable (e.g. a sample from a discrete distribution like a Bernoulli) and so to differentiate @@ -338,28 +333,25 @@ class StochasticTensor(BaseStochasticTensor): `MeanValueType` or if `loss_fn=None`. Args: - dist_cls: a `Distribution` class. + dist: an instance of `Distribution`. name: a name for this `StochasticTensor` and its ops. dist_value_type: a `_StochasticValueType`, which will determine what the `value` of this `StochasticTensor` will be. If not provided, the value type set with the `value_type` context manager will be used. - loss_fn: callable that takes `(st, st.value(), influenced_loss)`, where + loss_fn: callable that takes + `(st, st.value(), influenced_loss)`, where `st` is this `StochasticTensor`, and returns a `Tensor` loss. By default, `loss_fn` is the `score_function`, or more precisely, the integral of the score function, such that when the gradient is taken, the score function results. See the `stochastic_gradient_estimators` module for additional loss functions and baselines. - **dist_args: keyword arguments to be passed through to `dist_cls` on - construction. Raises: - TypeError: if `dist_cls` is not a `Distribution`. + TypeError: if `dist` is not an instance of `Distribution`. TypeError: if `loss_fn` is not `callable`. 
""" - if not issubclass(dist_cls, distributions.Distribution): - raise TypeError("dist_cls must be a subclass of Distribution") - self._dist_cls = dist_cls - self._dist_args = dist_args + if not isinstance(dist, distributions.Distribution): + raise TypeError("dist must be an instance of Distribution") if dist_value_type is None: try: self._value_type = get_current_value_type() @@ -371,24 +363,17 @@ class StochasticTensor(BaseStochasticTensor): with value_type(dist_value_type): self._value_type = get_current_value_type() - self._value_type.declare_inputs(self, dist_args) - if loss_fn is not None and not callable(loss_fn): raise TypeError("loss_fn must be callable") self._loss_fn = loss_fn - with ops.name_scope(name, "StochasticTensor", - dist_args.values()) as scope: + with ops.name_scope(name) as scope: self._name = scope - self._dist = dist_cls(**dist_args) + self._dist = dist self._value = self._create_value() super(StochasticTensor, self).__init__() - @property - def input_dict(self): - return self._dist_args - @property def value_type(self): return self._value_type @@ -397,9 +382,6 @@ class StochasticTensor(BaseStochasticTensor): def distribution(self): return self._dist - def clone(self, name=None, **dist_args): - return StochasticTensor(self._dist_cls, name=name, **dist_args) - def _create_value(self): """Create the value Tensor based on the value type, store as self._value.""" @@ -494,33 +476,28 @@ class ObservedStochasticTensor(StochasticTensor): """A StochasticTensor with an observed value.""" # pylint: disable=super-init-not-called - def __init__(self, dist_cls, value, name=None, **dist_args): + def __init__(self, dist, value, name=None): """Construct an `ObservedStochasticTensor`. - `ObservedStochasticTensor` will instantiate a distribution from `dist_cls` - and `dist_args` but use the provided value instead of sampling from the - distribution. The provided value argument must be appropriately shaped - to have come from the constructed distribution. + `ObservedStochasticTensor` is backed by distribution `dist` and uses the + provided value instead of using the current value type to draw a value from + the distribution. The provided value argument must be appropriately shaped + to have come from the distribution. Args: - dist_cls: a `Distribution` class. + dist: an instance of `Distribution`. value: a Tensor containing the observed value name: a name for this `ObservedStochasticTensor` and its ops. - **dist_args: keyword arguments to be passed through to `dist_cls` on - construction. Raises: - TypeError: if `dist_cls` is not a `Distribution`. + TypeError: if `dist` is not an instance of `Distribution`. ValueError: if `value` is not compatible with the distribution. """ - if not issubclass(dist_cls, distributions.Distribution): - raise TypeError("dist_cls must be a subclass of Distribution") - self._dist_cls = dist_cls - self._dist_args = dist_args - with ops.name_scope(name, "ObservedStochasticTensor", - list(dist_args.values()) + [value]) as scope: + if not isinstance(dist, distributions.Distribution): + raise TypeError("dist must be an instance of Distribution") + with ops.name_scope(name, "ObservedStochasticTensor", [value]) as scope: self._name = scope - self._dist = dist_cls(**dist_args) + self._dist = dist dist_shape = self._dist.get_batch_shape().concatenate( self._dist.get_event_shape()) value = ops.convert_to_tensor(value) @@ -538,7 +515,7 @@ class ObservedStochasticTensor(StochasticTensor): "sample from the distribution %s." 
% (value_shape, dist_shape)) if value.dtype != self._dist.dtype: raise ValueError("Type of observed value (%s) does not match type of " - "distribuiton (%s)." % (value.dtype, self._dist.dtype)) + "distribution (%s)." % (value.dtype, self._dist.dtype)) self._value = array_ops.identity(value) # pylint: disable=non-parent-init-called BaseStochasticTensor.__init__(self) @@ -557,39 +534,3 @@ __all__ = [ "value_type", "get_current_value_type", ] - -_globals = globals() -# pylint: disable=redefined-builtin -__doc__ += "\n\n## Automatically Generated StochasticTensors\n\n" -# pylint: enable=redefined-builtin -for _name in sorted(dir(distributions)): - _candidate = getattr(distributions, _name) - if (inspect.isclass(_candidate) - and _candidate != distributions.Distribution - and issubclass(_candidate, distributions.Distribution)): - _local_name = "%sTensor" % _name - - class _WrapperTensor(StochasticTensor): - _my_candidate = _candidate - - def __init__(self, name=None, dist_value_type=None, - loss_fn=sge.score_function, **dist_args): - StochasticTensor.__init__( - self, - dist_cls=self._my_candidate, - name=name, - dist_value_type=dist_value_type, - loss_fn=loss_fn, **dist_args) - - _WrapperTensor.__name__ = _local_name - _WrapperTensor.__doc__ = ( - "`%s` is a `StochasticTensor` backed by the distribution `%s`.""" - % (_local_name, _name)) - _globals[_local_name] = _WrapperTensor - del _WrapperTensor - del _candidate - - __all__.append(_local_name) - __doc__ += "@@%s\n" % _local_name - - del _local_name diff --git a/tensorflow/contrib/bayesflow/python/ops/stochastic_variables.py b/tensorflow/contrib/bayesflow/python/ops/stochastic_variables.py index 72c2e0d8ec1..7baf1366bcd 100644 --- a/tensorflow/contrib/bayesflow/python/ops/stochastic_variables.py +++ b/tensorflow/contrib/bayesflow/python/ops/stochastic_variables.py @@ -126,7 +126,7 @@ def get_stochastic_variable(getter, dist_kwargs = dist_kwargs or {} dist_kwargs.update(params) - sample = st.StochasticTensor(dist_cls, **dist_kwargs) + sample = st.StochasticTensor(dist_cls(**dist_kwargs)) if prior is not None: if callable(prior): diff --git a/tensorflow/contrib/cmake/external/gif.cmake b/tensorflow/contrib/cmake/external/gif.cmake index da20561b880..231159ed0a5 100644 --- a/tensorflow/contrib/cmake/external/gif.cmake +++ b/tensorflow/contrib/cmake/external/gif.cmake @@ -1,7 +1,7 @@ include (ExternalProject) set(gif_INCLUDE_DIR ${CMAKE_CURRENT_BINARY_DIR}/external/gif_archive/giflib-5.1.4/) -set(gif_URL http://ufpr.dl.sourceforge.net/project/giflib/giflib-5.1.4.tar.gz) +set(gif_URL http://cdimage.debian.org/mirror/xbmc.org/build-deps/sources/giflib-5.1.4.tar.gz) set(gif_HASH SHA256=34a7377ba834397db019e8eb122e551a49c98f49df75ec3fcc92b9a794a4f6d1) set(gif_INSTALL ${CMAKE_BINARY_DIR}/gif/install) set(gif_BUILD ${CMAKE_BINARY_DIR}/gif/src/gif) diff --git a/tensorflow/contrib/cmake/setup.py b/tensorflow/contrib/cmake/setup.py index 1edc173a8f5..78cb546f852 100644 --- a/tensorflow/contrib/cmake/setup.py +++ b/tensorflow/contrib/cmake/setup.py @@ -26,7 +26,7 @@ from setuptools import find_packages, setup, Command from setuptools.command.install import install as InstallCommandBase from setuptools.dist import Distribution -_VERSION = '0.11.0rc1-cmake-experimental' +_VERSION = '0.11.0rc2-cmake-experimental' REQUIRED_PACKAGES = [ 'numpy >= 1.11.0', diff --git a/tensorflow/contrib/distributions/__init__.py b/tensorflow/contrib/distributions/__init__.py index 36bc4072382..8111118462a 100644 --- a/tensorflow/contrib/distributions/__init__.py +++ 
b/tensorflow/contrib/distributions/__init__.py @@ -57,7 +57,6 @@ initialized with parameters that define the distributions. @@MultivariateNormalCholesky @@MultivariateNormalDiagPlusVDVT @@MultivariateNormalDiagWithSoftplusStDev -@@matrix_diag_transform ### Other multivariate distributions @@ -67,6 +66,10 @@ initialized with parameters that define the distributions. @@WishartCholesky @@WishartFull +### Multivariate Utilities + +@@matrix_diag_transform + ## Transformed distributions @@TransformedDistribution @@ -86,7 +89,7 @@ representing the posterior or posterior predictive. @@normal_conjugates_known_sigma_posterior @@normal_conjugates_known_sigma_predictive -## Kullback Leibler Divergence +## Kullback-Leibler Divergence @@kl @@RegisterKL diff --git a/tensorflow/contrib/distributions/python/kernel_tests/distribution_util_test.py b/tensorflow/contrib/distributions/python/kernel_tests/distribution_util_test.py index b5d041c8c76..66b43662fd5 100644 --- a/tensorflow/contrib/distributions/python/kernel_tests/distribution_util_test.py +++ b/tensorflow/contrib/distributions/python/kernel_tests/distribution_util_test.py @@ -25,7 +25,7 @@ import tensorflow as tf from tensorflow.contrib.distributions.python.ops import distribution_util -class DistributionUtilTest(tf.test.TestCase): +class AssertCloseTest(tf.test.TestCase): def testAssertCloseIntegerDtype(self): x = [1, 5, 10, 15, 20] @@ -110,6 +110,9 @@ class DistributionUtilTest(tf.test.TestCase): distribution_util.assert_integer_form(w)]): tf.identity(w).eval() + +class GetLogitsAndProbTest(tf.test.TestCase): + def testGetLogitsAndProbImproperArguments(self): with self.test_session(): with self.assertRaises(ValueError): @@ -229,6 +232,9 @@ class DistributionUtilTest(tf.test.TestCase): p=p4, multidimensional=True, validate_args=False) prob.eval() + +class LogCombinationsTest(tf.test.TestCase): + def testLogCombinationsBinomial(self): n = [2, 5, 12, 15] k = [1, 2, 4, 11] @@ -252,6 +258,9 @@ class DistributionUtilTest(tf.test.TestCase): log_binom = distribution_util.log_combinations(n, counts) self.assertEqual([2, 2], log_binom.get_shape()) + +class RotateTransposeTest(tf.test.TestCase): + def _np_rotate_transpose(self, x, shift): if not isinstance(x, np.ndarray): x = np.array(x) @@ -283,7 +292,10 @@ class DistributionUtilTest(tf.test.TestCase): sess.run(distribution_util.rotate_transpose(x, shift), feed_dict={x: x_value, shift: shift_value})) - def testChooseVector(self): + +class PickVectorTest(tf.test.TestCase): + + def testCorrectlyPicksVector(self): with self.test_session(): x = np.arange(10, 12) y = np.arange(15, 18) @@ -301,5 +313,51 @@ class DistributionUtilTest(tf.test.TestCase): tf.constant(False), x, y)) # No eval. 
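# Illustrative sketch (not part of the patch): what the new
# `fill_lower_triangular` utility computes, matching the docstring example and
# the tests added below. Assumes this release's contrib layout:
import tensorflow as tf
from tensorflow.contrib.distributions.python.ops import distribution_util

x = tf.constant([1., 2., 3., 4., 5., 6.])  # d = 6 entries => n = 3
tril = distribution_util.fill_lower_triangular(x)
with tf.Session() as sess:
  print(sess.run(tril))
# => [[1. 0. 0.]
#     [2. 3. 0.]
#     [4. 5. 6.]]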
+class FillLowerTriangularTest(tf.test.TestCase): + + def testCorrectlyMakes1x1LowerTril(self): + with self.test_session(): + x = np.array([[1.], [2], [3]]) + expected = np.array([[[1.]], [[2]], [[3]]]) + actual = distribution_util.fill_lower_triangular(x) + self.assertAllEqual(expected.shape, actual.get_shape()) + self.assertAllEqual(expected, actual.eval()) + + def testCorrectlyMakesNoBatchLowerTril(self): + with self.test_session(): + x = tf.convert_to_tensor(np.arange(9, dtype=np.float32)) + expected = np.array( + [[0., 0., 0.], + [1., 2., 0.], + [3., 4., 5.]]) + actual = distribution_util.fill_lower_triangular(x) + self.assertAllEqual(expected.shape, actual.get_shape()) + self.assertAllEqual(expected, actual.eval()) + self.assertAllEqual( + np.concatenate([np.ones(6, dtype=np.float32), + np.zeros(3, dtype=np.float32)]), + tf.gradients(distribution_util.fill_lower_triangular(x), x)[0].eval()) + + def testCorrectlyMakesBatchLowerTril(self): + with self.test_session(): + x = np.reshape(np.arange(24), (2, 2, 6)) + expected = np.array( + [[[[0., 0., 0.], + [1., 2., 0.], + [3., 4., 5.]], + [[6., 0., 0.], + [7., 8., 0.], + [9., 10., 11.]]], + [[[12., 0., 0.], + [13., 14., 0.], + [15., 16., 17.]], + [[18., 0., 0.], + [19., 20., 0.], + [21., 22., 23.]]]]) + actual = distribution_util.fill_lower_triangular(x) + self.assertAllEqual(expected.shape, actual.get_shape()) + self.assertAllEqual(expected, actual.eval()) + + if __name__ == "__main__": tf.test.main() diff --git a/tensorflow/contrib/distributions/python/ops/distribution_util.py b/tensorflow/contrib/distributions/python/ops/distribution_util.py index 89950d6aa22..e27dcfe9b3f 100644 --- a/tensorflow/contrib/distributions/python/ops/distribution_util.py +++ b/tensorflow/contrib/distributions/python/ops/distribution_util.py @@ -20,11 +20,13 @@ from __future__ import print_function import functools import hashlib +import math import numpy as np from tensorflow.python.framework import constant_op from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import tensor_shape from tensorflow.python.framework import tensor_util from tensorflow.python.ops import array_ops from tensorflow.python.ops import check_ops @@ -376,7 +378,7 @@ def pick_vector(cond, TypeError: if `cond` is not a constant and `true_vector.dtype != false_vector.dtype` """ - with ops.op_scope((cond, true_vector, false_vector), name): + with ops.name_scope(name, values=(cond, true_vector, false_vector)): cond = ops.convert_to_tensor(cond, name="cond") if cond.dtype != dtypes.bool: raise TypeError("%s.dtype=%s which is not %s" % @@ -405,6 +407,105 @@ def gen_new_seed(seed, salt): return None +def fill_lower_triangular(x, name="fill_lower_triangular"): + """Creates a (batch of) lower triangular matrix from a vector of inputs. + + If `x.get_shape()` is `[b1, b2, ..., bK, d]` then the output shape is `[b1, + b2, ..., bK, n, n]` where `n` is such that `d = n(n+1)/2`, i.e., + `n = int(0.5 * (math.sqrt(1. + 8. * d) - 1.))`. + + Note: This function is very slow; possibly 10x slower than zero-ing out the + upper-triangular portion of a full matrix. + + Example: + + ```python + fill_lower_triangular([1, 2, 3, 4, 5, 6]) + # Returns: [[1, 0, 0], + # [2, 3, 0], + # [4, 5, 6]] + ``` + + Args: + x: `Tensor` representing lower triangular elements. + name: `String`. The name to give this op. + + Returns: + tril: `Tensor` with lower triangular elements filled from `x`. 
+ """ + with ops.name_scope(name, values=(x,)): + x = ops.convert_to_tensor(x, name="x") + if (x.get_shape().ndims is not None and + x.get_shape()[-1].value is not None): + d = x.get_shape()[-1].value + # d = n^2/2 + n/2 implies n is: + n = int(0.5 * (math.sqrt(1. + 8. * d) - 1.)) + final_shape = x.get_shape()[:-1].concatenate( + tensor_shape.TensorShape([n, n])) + else: + d = math_ops.cast(array_ops.shape(x)[-1], dtype=dtypes.float32) + # d = n^2/2 + n/2 implies n is: + n = math_ops.cast(0.5 * (dtypes.sqrt(1. + 8. * d) - 1.), + dtype=dtypes.int32) + final_shape = x.get_shape()[:-1].concatenate( + tensor_shape.TensorShape([None, None])) + + # Make ids for each batch dim. + if (x.get_shape().ndims is not None and + x.get_shape()[:-1].is_fully_defined()): + batch_shape = np.asarray(x.get_shape()[:-1].as_list(), dtype=np.int32) + m = np.prod(batch_shape) + else: + batch_shape = array_ops.shape(x)[:-1] + m = array_ops.reduce_prod(batch_shape) + + # Flatten batch dims. + y = array_ops.reshape(x, [-1, d]) + + # Prepend a zero to each row. + y = array_ops.pad(y, paddings=[[0, 0], [1, 0]]) + + # Make ids for each batch dim. + if x.get_shape()[:-1].is_fully_defined(): + m = np.asarray(np.prod(x.get_shape()[:-1].as_list()), dtype=np.int32) + else: + m = array_ops.reduce_prod(array_ops.shape(x)[:-1]) + batch_ids = math_ops.range(m) + + def make_tril_ids(n): + """Internal helper to create vector of linear indices into y.""" + cols = array_ops.reshape(array_ops.tile(math_ops.range(n), [n]), [n, n]) + rows = array_ops.tile( + array_ops.expand_dims(math_ops.range(n), -1), [1, n]) + pred = math_ops.greater(cols, rows) + tril_ids = array_ops.tile(array_ops.reshape( + math_ops.cumsum(math_ops.range(n)), [n, 1]), [1, n]) + cols + tril_ids = math_ops.select(pred, + array_ops.zeros([n, n], dtype=dtypes.int32), + tril_ids + 1) + tril_ids = array_ops.reshape(tril_ids, [-1]) + return tril_ids + tril_ids = make_tril_ids(n) + + # Assemble the ids into pairs. + idx = array_ops.pack([ + array_ops.tile(array_ops.expand_dims(batch_ids, -1), [1, n*n]), + array_ops.tile([tril_ids], [m, 1])]) + idx = array_ops.transpose(idx, [1, 2, 0]) + + if x.get_shape().ndims == 1: + # Prefer using gather because it has a gradient. + # We wrap the result in a list so downstream logic "just works." + y = [array_ops.gather(y[0, :], tril_ids)] + else: + y = array_ops.gather_nd(y, idx) + y = array_ops.reshape(y, array_ops.concat(0, [batch_shape, [n, n]])) + + y.set_shape(y.get_shape().merge_with(final_shape)) + + return y + + class AppendDocstring(object): """Helper class to promote private subclass docstring to public counterpart. diff --git a/tensorflow/contrib/factorization/python/ops/factorization_ops.py b/tensorflow/contrib/factorization/python/ops/factorization_ops.py index bf6ab001646..34fa0129dd8 100644 --- a/tensorflow/contrib/factorization/python/ops/factorization_ops.py +++ b/tensorflow/contrib/factorization/python/ops/factorization_ops.py @@ -571,9 +571,8 @@ class WALSModel(object): extras = size % num_shards assignments = tf.maximum(ids // (ids_per_shard + 1), (ids - extras) // ids_per_shard) - new_ids = tf.select(assignments < extras, - ids % (ids_per_shard + 1), - (ids - extras) % ids_per_shard) + new_ids = tf.where(assignments < extras, ids % (ids_per_shard + 1), + (ids - extras) % ids_per_shard) return assignments, new_ids return func @@ -655,7 +654,7 @@ class WALSModel(object): update_op: An op that assigns the newly computed values to the row/column factors. 
""" - assert isinstance(sp_input, ops.SparseTensor) + assert isinstance(sp_input, tf.SparseTensor) if update_row_factors: left = self._row_factors diff --git a/tensorflow/contrib/framework/BUILD b/tensorflow/contrib/framework/BUILD index e948a333dda..8534ecdeab5 100644 --- a/tensorflow/contrib/framework/BUILD +++ b/tensorflow/contrib/framework/BUILD @@ -18,8 +18,6 @@ py_library( "__init__.py", "python/framework/__init__.py", "python/framework/checkpoint_utils.py", - "python/framework/decorator_utils.py", - "python/framework/deprecation.py", "python/framework/experimental.py", "python/framework/tensor_util.py", "python/ops/__init__.py", @@ -102,20 +100,6 @@ py_test( deps = ["//tensorflow:tensorflow_py"], ) -py_test( - name = "deprecation_test", - srcs = ["python/framework/deprecation_test.py"], - srcs_version = "PY2AND3", - deps = ["//tensorflow:tensorflow_py"], -) - -py_test( - name = "decorator_utils_test", - srcs = ["python/framework/decorator_utils_test.py"], - srcs_version = "PY2AND3", - deps = ["//tensorflow:tensorflow_py"], -) - py_test( name = "experimental_test", srcs = ["python/framework/experimental_test.py"], @@ -135,6 +119,7 @@ py_test( size = "small", srcs = ["python/ops/variables_test.py"], srcs_version = "PY2AND3", + tags = ["manual"], deps = ["//tensorflow:tensorflow_py"], ) diff --git a/tensorflow/contrib/framework/python/framework/__init__.py b/tensorflow/contrib/framework/python/framework/__init__.py index c7fa49490e6..1b8a5a1b395 100644 --- a/tensorflow/contrib/framework/python/framework/__init__.py +++ b/tensorflow/contrib/framework/python/framework/__init__.py @@ -19,10 +19,10 @@ from __future__ import division from __future__ import print_function # pylint: disable=wildcard-import -from tensorflow.contrib.framework.python.framework import decorator_utils from tensorflow.contrib.framework.python.framework.checkpoint_utils import * -from tensorflow.contrib.framework.python.framework.deprecation import deprecated -from tensorflow.contrib.framework.python.framework.deprecation import deprecated_arg_values -from tensorflow.contrib.framework.python.framework.deprecation import deprecated_args from tensorflow.contrib.framework.python.framework.experimental import experimental from tensorflow.contrib.framework.python.framework.tensor_util import * +from tensorflow.python.util import decorator_utils +from tensorflow.python.util.deprecation import deprecated +from tensorflow.python.util.deprecation import deprecated_arg_values +from tensorflow.python.util.deprecation import deprecated_args diff --git a/tensorflow/contrib/framework/python/framework/experimental.py b/tensorflow/contrib/framework/python/framework/experimental.py index cb1723427fa..054b5a4a342 100644 --- a/tensorflow/contrib/framework/python/framework/experimental.py +++ b/tensorflow/contrib/framework/python/framework/experimental.py @@ -20,8 +20,8 @@ from __future__ import print_function import functools -from tensorflow.contrib.framework.python.framework import decorator_utils from tensorflow.python.platform import tf_logging as logging +from tensorflow.python.util import decorator_utils def _add_experimental_function_notice_to_docstring(doc): diff --git a/tensorflow/contrib/framework/python/framework/tensor_util.py b/tensorflow/contrib/framework/python/framework/tensor_util.py index f07a41136b6..71761966271 100644 --- a/tensorflow/contrib/framework/python/framework/tensor_util.py +++ b/tensorflow/contrib/framework/python/framework/tensor_util.py @@ -20,6 +20,7 @@ from __future__ import print_function import 
numpy as np from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import control_flow_ops from tensorflow.python.ops import math_ops @@ -283,7 +284,7 @@ def is_tensor(x): Returns: `True` if `x` is a tensor, `False` if not. """ - tensor_types = (ops.Tensor, ops.SparseTensor, variables.Variable) + tensor_types = (ops.Tensor, sparse_tensor.SparseTensor, variables.Variable) return isinstance(x, tensor_types) @@ -303,7 +304,7 @@ def with_shape(expected_shape, tensor): Raises: ValueError: if tensor has an invalid shape. """ - if isinstance(tensor, ops.SparseTensor): + if isinstance(tensor, sparse_tensor.SparseTensor): raise ValueError('SparseTensor not supported.') # Shape type must be 1D int32. @@ -376,9 +377,9 @@ def convert_to_tensor_or_sparse_tensor( """ if dtype is not None: dtype = dtypes.as_dtype(dtype) - if isinstance(value, ops.SparseTensorValue): - value = ops.SparseTensor.from_value(value) - if isinstance(value, ops.SparseTensor): + if isinstance(value, sparse_tensor.SparseTensorValue): + value = sparse_tensor.SparseTensor.from_value(value) + if isinstance(value, sparse_tensor.SparseTensor): if dtype and not dtype.is_compatible_with(value.dtype): raise RuntimeError( 'Sparse dtype: requested = %s, actual = %s' % ( diff --git a/tensorflow/contrib/framework/python/ops/prettyprint_ops.py b/tensorflow/contrib/framework/python/ops/prettyprint_ops.py index 48ceb211ca5..7b4e58ecd1d 100644 --- a/tensorflow/contrib/framework/python/ops/prettyprint_ops.py +++ b/tensorflow/contrib/framework/python/ops/prettyprint_ops.py @@ -22,6 +22,7 @@ from __future__ import print_function from tensorflow.python.framework import constant_op from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import logging_ops from tensorflow.python.ops import math_ops @@ -43,7 +44,7 @@ def _get_tensor_repr(t, if print_tensor_type: if isinstance(t, ops.Tensor): t_type_str = "Type: Tensor ({})".format(t.dtype.name) - elif isinstance(t, ops.SparseTensor): + elif isinstance(t, sparse_tensor.SparseTensor): t_type_str = "Type: SparseTensor ({})".format(t.dtype.name) elif isinstance(t, tensor_array_ops.TensorArray): t_type_str = "Type: TensorArray ({})".format(t.dtype.name) @@ -51,7 +52,7 @@ def _get_tensor_repr(t, tensor_list.append(constant_op.constant(t_type_str)) if print_shape: - if isinstance(t, ops.SparseTensor): + if isinstance(t, sparse_tensor.SparseTensor): tensor_list.append(constant_op.constant("Shape:")) tensor_list.append(t.shape) elif isinstance(t, ops.Tensor): @@ -66,7 +67,7 @@ def _get_tensor_repr(t, tensor_list.append(constant_op.constant("First True in Boolean tensor at:")) tensor_list.append(math_ops.argmax(int_tensor, 0)) - if isinstance(t, ops.SparseTensor): + if isinstance(t, sparse_tensor.SparseTensor): tensor_list.append(constant_op.constant("Sparse indices:")) tensor_list.append(t.indices) tensor_list.append(constant_op.constant("Sparse values:")) @@ -137,15 +138,15 @@ def print_op(input_, if isinstance(input_, ops.Tensor): input_ = logging_ops.Print(input_, tensor_list, message, first_n, summarize, name) - elif isinstance(input_, ops.SparseTensor): + elif isinstance(input_, sparse_tensor.SparseTensor): p = logging_ops.Print( constant_op.constant([]), tensor_list, message, first_n, 
summarize, name) with ops.control_dependencies([p]): - input_ = ops.SparseTensor(array_ops.identity(input_.indices), - array_ops.identity(input_.values), - array_ops.identity(input_.shape)) + input_ = sparse_tensor.SparseTensor(array_ops.identity(input_.indices), + array_ops.identity(input_.values), + array_ops.identity(input_.shape)) elif isinstance(input_, tensor_array_ops.TensorArray): p = logging_ops.Print( constant_op.constant([]), tensor_list, message, first_n, summarize, diff --git a/tensorflow/contrib/framework/python/ops/variables_test.py b/tensorflow/contrib/framework/python/ops/variables_test.py index eb0a2c2d8eb..49683faf90f 100644 --- a/tensorflow/contrib/framework/python/ops/variables_test.py +++ b/tensorflow/contrib/framework/python/ops/variables_test.py @@ -36,7 +36,7 @@ class LocalVariableTest(tf.test.TestCase): variables = tf.local_variables() self.assertEquals(2, len(variables)) self.assertRaises(tf.OpError, sess.run, variables) - tf.initialize_variables(variables).run() + tf.variables_initializer(variables).run() self.assertAllEqual(set([value0, value1]), set(sess.run(variables))) def testLocalVariableNameAndShape(self): @@ -51,7 +51,7 @@ class LocalVariableTest(tf.test.TestCase): with self.test_session(): with tf.variable_scope('A'): a = tf.contrib.framework.local_variable(0) - self.assertFalse(a in tf.all_variables()) + self.assertFalse(a in tf.global_variables()) self.assertTrue(a in tf.local_variables()) def testLocalVariableNotInVariablesToRestore(self): @@ -82,7 +82,7 @@ class LocalVariableTest(tf.test.TestCase): def testInitializedVariableValue(self): with self.test_session() as sess: a = tf.contrib.framework.local_variable([0, 0, 0, 0, 0], name='a') - sess.run(tf.initialize_local_variables()) + sess.run(tf.local_variables_initializer()) self.assertAllEqual(a.eval(), [0]*5) @@ -439,7 +439,7 @@ class ModelVariablesTest(tf.test.TestCase): with self.test_session(): with tf.variable_scope('A'): a = tf.contrib.framework.model_variable('a', [5]) - self.assertTrue(a in tf.all_variables()) + self.assertTrue(a in tf.global_variables()) self.assertTrue(a in tf.get_collection(tf.GraphKeys.MODEL_VARIABLES)) self.assertFalse(a in tf.local_variables()) @@ -474,7 +474,7 @@ class ModelVariablesTest(tf.test.TestCase): with self.test_session() as sess: a = tf.contrib.framework.model_variable( 'a', [5], initializer=tf.ones_initializer) - sess.run(tf.initialize_all_variables()) + sess.run(tf.global_variables_initializer()) self.assertAllEqual(a.eval(), [1]*5) def testDeviceFn(self): @@ -667,7 +667,7 @@ class AssignFromValuesTest(tf.test.TestCase): var_names_to_values) # Initialize the variables. - sess.run(tf.initialize_all_variables()) + sess.run(tf.global_variables_initializer()) # Perform the assignment. sess.run(assign_op, feed_dict) @@ -697,7 +697,7 @@ class AssignFromValuesTest(tf.test.TestCase): var_names_to_values) # Initialize the variables. - sess.run(tf.initialize_all_variables()) + sess.run(tf.global_variables_initializer()) # Perform the assignment. sess.run(assign_op, feed_dict) @@ -725,7 +725,7 @@ class AssignFromValuesFnTest(tf.test.TestCase): init_fn = tf.contrib.framework.assign_from_values_fn(var_names_to_values) # Initialize the variables. - sess.run(tf.initialize_all_variables()) + sess.run(tf.global_variables_initializer()) # Perform the assignment. init_fn(sess) @@ -754,7 +754,7 @@ class AssignFromValuesFnTest(tf.test.TestCase): init_fn = tf.contrib.framework.assign_from_values_fn(var_names_to_values) # Initialize the variables. 
- sess.run(tf.initialize_all_variables()) + sess.run(tf.global_variables_initializer()) # Perform the assignment. init_fn(sess) @@ -786,7 +786,7 @@ class AssignFromCheckpointTest(tf.test.TestCase): var_value = var_names_to_values[var_name] var_list.append(tf.Variable(var_value, name=var_name)) saver = tf.train.Saver(var_list) - init_op = tf.initialize_variables(var_list) + init_op = tf.variables_initializer(var_list) sess.run(init_op) # Save the initialized values in the file at 'checkpoint_dir' return saver.save(sess, checkpoint_dir, global_step=global_step) @@ -808,7 +808,7 @@ class AssignFromCheckpointTest(tf.test.TestCase): model_path, vars_to_restore) # Initialize the variables. - sess.run(tf.initialize_all_variables()) + sess.run(tf.global_variables_initializer()) # Perform the assignment. sess.run(op, feed_dict) @@ -859,7 +859,7 @@ class AssignFromCheckpointTest(tf.test.TestCase): vars_to_restore) # Initialize the variables. - sess.run(tf.initialize_all_variables()) + sess.run(tf.global_variables_initializer()) # Perform the assignment. sess.run(op, feed_dict) @@ -890,7 +890,7 @@ class AssignFromCheckpointFnTest(tf.test.TestCase): var_value = var_names_to_values[var_name] var_list.append(tf.Variable(var_value, name=var_name)) saver = tf.train.Saver(var_list) - init_op = tf.initialize_variables(var_list) + init_op = tf.variables_initializer(var_list) sess.run(init_op) # Save the initialized values in the file at 'checkpoint_dir' return saver.save(sess, checkpoint_dir, global_step=global_step) @@ -912,7 +912,7 @@ class AssignFromCheckpointFnTest(tf.test.TestCase): model_path, vars_to_restore) # Initialize the variables. - sess.run(tf.initialize_all_variables()) + sess.run(tf.global_variables_initializer()) # Perform the assignment. init_fn(sess) @@ -938,7 +938,7 @@ class AssignFromCheckpointFnTest(tf.test.TestCase): model_path, vars_to_restore) # Initialize the variables. - sess.run(tf.initialize_all_variables()) + sess.run(tf.global_variables_initializer()) # Perform the assignment. with self.assertRaises(tf.errors.InvalidArgumentError): @@ -961,7 +961,7 @@ class AssignFromCheckpointFnTest(tf.test.TestCase): model_path, vars_to_restore, reshape_variables=True) # Initialize the variables. - sess.run(tf.initialize_all_variables()) + sess.run(tf.global_variables_initializer()) # Perform the assignment. init_fn(sess) @@ -989,7 +989,7 @@ class AssignFromCheckpointFnTest(tf.test.TestCase): vars_to_restore) # Initialize the variables. - sess.run(tf.initialize_all_variables()) + sess.run(tf.global_variables_initializer()) # Perform the assignment. with self.assertRaises(tf.errors.NotFoundError): @@ -1015,7 +1015,7 @@ class AssignFromCheckpointFnTest(tf.test.TestCase): ignore_missing_vars=True) # Initialize the variables. - sess.run(tf.initialize_all_variables()) + sess.run(tf.global_variables_initializer()) # Perform the assignment. init_fn(sess) @@ -1044,7 +1044,7 @@ class AssignFromCheckpointFnTest(tf.test.TestCase): ignore_missing_vars=True) # Initialize the variables. - sess.run(tf.initialize_all_variables()) + sess.run(tf.global_variables_initializer()) # Perform the assignment. init_fn(sess) diff --git a/tensorflow/contrib/integrate/BUILD b/tensorflow/contrib/integrate/BUILD new file mode 100644 index 00000000000..1e6db75d215 --- /dev/null +++ b/tensorflow/contrib/integrate/BUILD @@ -0,0 +1,38 @@ +# Description: +# Integration and ODE solvers for TensorFlow. 
+
+licenses(["notice"])  # Apache 2.0
+
+exports_files(["LICENSE"])
+
+package(default_visibility = ["//tensorflow:__subpackages__"])
+
+py_library(
+    name = "integrate_py",
+    srcs = [
+        "__init__.py",
+        "python/ops/odes.py",
+    ],
+    srcs_version = "PY2AND3",
+)
+
+py_test(
+    name = "odes_test",
+    srcs = ["python/ops/odes_test.py"],
+    srcs_version = "PY2AND3",
+    deps = [
+        ":integrate_py",
+        "//tensorflow:tensorflow_py",
+    ],
+)
+
+filegroup(
+    name = "all_files",
+    srcs = glob(
+        ["**/*"],
+        exclude = [
+            "**/METADATA",
+            "**/OWNERS",
+        ],
+    ),
+)
diff --git a/tensorflow/contrib/integrate/README.md b/tensorflow/contrib/integrate/README.md
new file mode 100644
index 00000000000..beae6993b9d
--- /dev/null
+++ b/tensorflow/contrib/integrate/README.md
@@ -0,0 +1,9 @@
+# Integration and ODE solvers for TensorFlow
+
+TensorFlow equivalents to the routines provided by `scipy.integrate`. Currently
+contains a single function, `odeint`, for integrating ordinary differential
+equations.
+
+Maintainers:
+- Stephan Hoyer (shoyer@google.com, github.com/shoyer)
+- Marc Coram (mcoram@google.com, github.com/mcoram)
diff --git a/tensorflow/contrib/integrate/__init__.py b/tensorflow/contrib/integrate/__init__.py
new file mode 100644
index 00000000000..e88d10c5823
--- /dev/null
+++ b/tensorflow/contrib/integrate/__init__.py
@@ -0,0 +1,64 @@
+# Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+
+"""Integration and ODE solvers for TensorFlow.
+
+## Example: Lorenz attractor
+
+We can use `odeint` to solve the
+[Lorenz system](https://en.wikipedia.org/wiki/Lorenz_system) of ordinary
+differential equations, a prototypical example of chaotic dynamics:
+
+```python
+rho = 28.0
+sigma = 10.0
+beta = 8.0/3.0
+
+def lorenz_equation(state, t):
+  x, y, z = tf.unpack(state)
+  dx = sigma * (y - x)
+  dy = x * (rho - z) - y
+  dz = x * y - beta * z
+  return tf.pack([dx, dy, dz])
+
+init_state = tf.constant([0, 2, 20], dtype=tf.float64)
+t = np.linspace(0, 50, num=5000)
+tensor_state, tensor_info = tf.contrib.integrate.odeint(
+    lorenz_equation, init_state, t, full_output=True)
+
+sess = tf.Session()
+state, info = sess.run([tensor_state, tensor_info])
+x, y, z = state.T
+plt.plot(x, z)
+```
+
+[Figure: plot of the Lorenz attractor trajectory in the x-z plane.]
+
+ +## Ops + +@@odeint +""" + +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +# pylint: disable=wildcard-import +from tensorflow.contrib.integrate.python.ops.odes import * +from tensorflow.python.util.all_util import make_all + +__all__ = make_all(__name__) diff --git a/tensorflow/contrib/integrate/python/ops/odes.py b/tensorflow/contrib/integrate/python/ops/odes.py new file mode 100644 index 00000000000..5747bdefee8 --- /dev/null +++ b/tensorflow/contrib/integrate/python/ops/odes.py @@ -0,0 +1,503 @@ +# Copyright 2016 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== + +"""ODE solvers for TensorFlow.""" +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import collections + +from tensorflow.python.framework import constant_op +from tensorflow.python.framework import dtypes +from tensorflow.python.framework import ops +from tensorflow.python.ops import array_ops +from tensorflow.python.ops import control_flow_ops +from tensorflow.python.ops import math_ops +from tensorflow.python.ops import tensor_array_ops + + +_ButcherTableau = collections.namedtuple( + '_ButcherTableau', 'alpha beta c_sol c_mid c_error') + +# Parameters from Shampine (1986), section 4. +_DORMAND_PRINCE_TABLEAU = _ButcherTableau( + alpha=[1/5, 3/10, 4/5, 8/9, 1., 1.], + beta=[[1/5], + [3/40, 9/40], + [44/45, -56/15, 32/9], + [19372/6561, -25360/2187, 64448/6561, -212/729], + [9017/3168, -355/33, 46732/5247, 49/176, -5103/18656], + [35/384, 0, 500/1113, 125/192, -2187/6784, 11/84]], + c_sol=[35/384, 0, 500/1113, 125/192, -2187/6784, 11/84, 0], + c_mid=[6025192743/30085553152 / 2, 0, 51252292925/65400821598 / 2, + -2691868925/45128329728 / 2, 187940372067/1594534317056 / 2, + -1776094331/19743644256 / 2, 11237099/235043384 / 2], + c_error=[1951/21600 - 35/384, + 0, + 22642/50085 - 500/1113, + 451/720 - 125/192, + -12231/42400 - -2187/6784, + 649/6300 - 11/84, + 1/60], +) + + +def _possibly_nonzero(x): + return isinstance(x, ops.Tensor) or x != 0 + + +def _scaled_dot_product(scale, xs, ys, name=None): + """Calculate a scaled, vector inner product between lists of Tensors.""" + with ops.name_scope(name, 'scaled_dot_product', [scale, xs, ys]) as scope: + # Some of the parameters in our Butcher tableau include zeros. Using + # _possibly_nonzero lets us avoid wasted computation. 
+    return math_ops.add_n([(scale * x) * y for x, y in zip(xs, ys)
+                           if _possibly_nonzero(x) or _possibly_nonzero(y)],
+                          name=scope)
+
+
+def _dot_product(xs, ys, name=None):
+  """Calculate the vector inner product between two lists of Tensors."""
+  with ops.name_scope(name, 'dot_product', [xs, ys]) as scope:
+    return math_ops.add_n([x * y for x, y in zip(xs, ys)], name=scope)
+
+
+def _runge_kutta_step(func, y0, f0, t0, dt, tableau=_DORMAND_PRINCE_TABLEAU,
+                      name=None):
+  """Take an arbitrary Runge-Kutta step and estimate error.
+
+  Args:
+    func: Function to evaluate like `func(y, t)` to compute the time derivative
+      of `y`.
+    y0: Tensor initial value for the state.
+    f0: Tensor initial value for the derivative, computed from `func(y0, t0)`.
+    t0: float64 scalar Tensor giving the initial time.
+    dt: float64 scalar Tensor giving the size of the desired time step.
+    tableau: optional _ButcherTableau describing how to take the Runge-Kutta
+      step.
+    name: optional name for the operation.
+
+  Returns:
+    Tuple `(y1, f1, y1_error, k)` giving the estimated function value after
+    the Runge-Kutta step at `t1 = t0 + dt`, the derivative of the state at
+    `t1`, the estimated error at `t1`, and the list of Runge-Kutta
+    coefficients `k` used for calculating these terms.
+  """
+  with ops.name_scope(name, 'runge_kutta_step', [y0, f0, t0, dt]) as scope:
+    y0 = ops.convert_to_tensor(y0, name='y0')
+    f0 = ops.convert_to_tensor(f0, name='f0')
+    t0 = ops.convert_to_tensor(t0, name='t0')
+    dt = ops.convert_to_tensor(dt, name='dt')
+    dt_cast = math_ops.cast(dt, y0.dtype)
+
+    k = [f0]
+    for alpha_i, beta_i in zip(tableau.alpha, tableau.beta):
+      ti = t0 + alpha_i * dt
+      yi = y0 + _scaled_dot_product(dt_cast, beta_i, k)
+      k.append(func(yi, ti))
+
+    if not (tableau.c_sol[-1] == 0 and tableau.c_sol[:-1] == tableau.beta[-1]):
+      # This property (true for Dormand-Prince) lets us save a few FLOPs.
+      yi = y0 + _scaled_dot_product(dt_cast, tableau.c_sol, k)
+
+    y1 = array_ops.identity(yi, name='%s/y1' % scope)
+    f1 = array_ops.identity(k[-1], name='%s/f1' % scope)
+    y1_error = _scaled_dot_product(dt_cast, tableau.c_error, k,
+                                   name='%s/y1_error' % scope)
+    return (y1, f1, y1_error, k)
+
+
+def _interp_fit(y0, y1, y_mid, f0, f1, dt):
+  """Fit coefficients for 4th order polynomial interpolation.
+
+  Args:
+    y0: function value at the start of the interval.
+    y1: function value at the end of the interval.
+    y_mid: function value at the mid-point of the interval.
+    f0: derivative value at the start of the interval.
+    f1: derivative value at the end of the interval.
+    dt: width of the interval.
+
+  Returns:
+    List of coefficients `[a, b, c, d, e]` for interpolating with the
+    polynomial `p = a * x ** 4 + b * x ** 3 + c * x ** 2 + d * x + e` for
+    values of `x` between 0 (start of interval) and 1 (end of interval).
+ """ + # a, b, c, d, e = sympy.symbols('a b c d e') + # x, dt, y0, y1, y_mid, f0, f1 = sympy.symbols('x dt y0 y1 y_mid f0 f1') + # p = a * x ** 4 + b * x ** 3 + c * x ** 2 + d * x + e + # sympy.solve([p.subs(x, 0) - y0, + # p.subs(x, 1 / 2) - y_mid, + # p.subs(x, 1) - y1, + # (p.diff(x) / dt).subs(x, 0) - f0, + # (p.diff(x) / dt).subs(x, 1) - f1], + # [a, b, c, d, e]) + # {a: -2.0*dt*f0 + 2.0*dt*f1 - 8.0*y0 - 8.0*y1 + 16.0*y_mid, + # b: 5.0*dt*f0 - 3.0*dt*f1 + 18.0*y0 + 14.0*y1 - 32.0*y_mid, + # c: -4.0*dt*f0 + dt*f1 - 11.0*y0 - 5.0*y1 + 16.0*y_mid, + # d: dt*f0, + # e: y0} + a = _dot_product([-2 * dt, 2 * dt, -8, -8, 16], [f0, f1, y0, y1, y_mid]) + b = _dot_product([5 * dt, -3 * dt, 18, 14, -32], [f0, f1, y0, y1, y_mid]) + c = _dot_product([-4 * dt, dt, -11, -5, 16], [f0, f1, y0, y1, y_mid]) + d = dt * f0 + e = y0 + return [a, b, c, d, e] + + +def _interp_fit_rk(y0, y1, k, dt, tableau=_DORMAND_PRINCE_TABLEAU): + """Fit an interpolating polynomial to the results of a Runge-Kutta step.""" + with ops.name_scope('interp_fit_rk'): + dt = math_ops.cast(dt, y0.dtype) + y_mid = y0 + _scaled_dot_product(dt, tableau.c_mid, k) + f0 = k[0] + f1 = k[-1] + return _interp_fit(y0, y1, y_mid, f0, f1, dt) + + +def _interp_evaluate(coefficients, t0, t1, t): + """Evaluate polynomial interpolation at the given time point. + + Args: + coefficients: list of Tensor coefficients as created by `interp_fit`. + t0: scalar float64 Tensor giving the start of the interval. + t1: scalar float64 Tensor giving the end of the interval. + t: scalar float64 Tensor giving the desired interpolation point. + + Returns: + Polynomial interpolation of the coefficients at time `t`. + """ + with ops.name_scope('interp_evaluate'): + t0 = ops.convert_to_tensor(t0) + t1 = ops.convert_to_tensor(t1) + t = ops.convert_to_tensor(t) + + dtype = coefficients[0].dtype + + assert_op = control_flow_ops.Assert( + (t0 <= t) & (t <= t1), + ['invalid interpolation, fails `t0 <= t <= t1`:', t0, t, t1]) + with ops.control_dependencies([assert_op]): + x = math_ops.cast((t - t0) / (t1 - t0), dtype) + + xs = [constant_op.constant(1, dtype), x] + for _ in range(2, len(coefficients)): + xs.append(xs[-1] * x) + + return _dot_product(coefficients, reversed(xs)) + + +def _optimal_step_size(last_step, + error_ratio, + safety=0.9, + ifactor=10.0, + dfactor=0.2, + order=5, + name=None): + """Calculate the optimal size for the next Runge-Kutta step.""" + with ops.name_scope( + name, 'optimal_step_size', [last_step, error_ratio]) as scope: + error_ratio = math_ops.cast(error_ratio, last_step.dtype) + exponent = math_ops.cast(1 / order, last_step.dtype) + # this looks more complex than necessary, but importantly it keeps + # error_ratio in the numerator so we can't divide by zero: + factor = math_ops.maximum( + 1 / ifactor, + math_ops.minimum(error_ratio ** exponent / safety, 1 / dfactor)) + return math_ops.div(last_step, factor, name=scope) + + +def _abs_square(x): + if x.dtype.is_complex: + return math_ops.square(math_ops.real(x)) + math_ops.square(math_ops.imag(x)) + else: + return math_ops.square(x) + + +def _ta_append(tensor_array, value): + """Append a value to the end of a tf.TensorArray.""" + return tensor_array.write(tensor_array.size(), value) + + +class _RungeKuttaState(collections.namedtuple( + '_RungeKuttaState', 'y1, f1, t0, t1, dt, interp_coeff')): + """Saved state of the Runge Kutta solver. + + Attributes: + y1: Tensor giving the function value at the end of the last time step. + f1: Tensor giving derivative at the end of the last time step. 
+    t0: scalar float64 Tensor giving the start of the last time step.
+    t1: scalar float64 Tensor giving the end of the last time step.
+    dt: scalar float64 Tensor giving the size for the next time step.
+    interp_coeff: list of Tensors giving coefficients for polynomial
+      interpolation between `t0` and `t1`.
+  """
+
+
+class _History(collections.namedtuple(
+    '_History', 'integrate_points, error_ratio')):
+  """Saved integration history for use in `info_dict`.
+
+  Attributes:
+    integrate_points: tf.TensorArray storing integration time points.
+    error_ratio: tf.TensorArray storing computed error ratios at each
+      integration step.
+  """
+
+
+def _dopri5(func,
+            y0,
+            t,
+            rtol,
+            atol,
+            full_output=False,
+            first_step=None,
+            safety=0.9,
+            ifactor=10.0,
+            dfactor=0.2,
+            max_num_steps=1000,
+            name=None):
+  """Solve an ODE for `odeint` using method='dopri5'."""
+
+  if first_step is None:
+    # At some point, we might want to switch to picking the step size
+    # automatically.
+    first_step = 1.0
+
+  with ops.name_scope(
+      name, 'dopri5',
+      [y0, t, rtol, atol, safety, ifactor, dfactor, max_num_steps]) as scope:
+
+    first_step = ops.convert_to_tensor(first_step, dtype=t.dtype,
+                                       name='first_step')
+    safety = ops.convert_to_tensor(safety, dtype=t.dtype, name='safety')
+    ifactor = ops.convert_to_tensor(ifactor, dtype=t.dtype, name='ifactor')
+    dfactor = ops.convert_to_tensor(dfactor, dtype=t.dtype, name='dfactor')
+    max_num_steps = ops.convert_to_tensor(max_num_steps, dtype=dtypes.int32,
+                                          name='max_num_steps')
+
+    def adaptive_runge_kutta_step(rk_state, history, n_steps):
+      """Take an adaptive Runge-Kutta step to integrate the ODE."""
+      y0, f0, _, t0, dt, interp_coeff = rk_state
+      with ops.name_scope('assertions'):
+        check_underflow = control_flow_ops.Assert(
+            t0 + dt > t0, ['underflow in dt', dt])
+        check_max_num_steps = control_flow_ops.Assert(
+            n_steps < max_num_steps, ['max_num_steps exceeded'])
+        check_numerics = control_flow_ops.Assert(
+            math_ops.reduce_all(math_ops.is_finite(abs(y0))),
+            ['non-finite values in state `y`', y0])
+      with ops.control_dependencies(
+          [check_underflow, check_max_num_steps, check_numerics]):
+        y1, f1, y1_error, k = _runge_kutta_step(func, y0, f0, t0, dt)
+
+      with ops.name_scope('error_ratio'):
+        # We use the same approach as the dopri5 Fortran code.
+        error_tol = atol + rtol * math_ops.maximum(abs(y0), abs(y1))
+        tensor_error_ratio = _abs_square(y1_error) / _abs_square(error_tol)
+        # Could also use reduce_maximum here.
+        error_ratio = math_ops.sqrt(math_ops.reduce_mean(tensor_error_ratio))
+        accept_step = error_ratio <= 1
+
+      with ops.name_scope('update/rk_state'):
+        # If we don't accept the step, the _RungeKuttaState will be useless
+        # (covering a time-interval of size 0), but that's OK, because in such
+        # cases we always immediately take another Runge-Kutta step.
+ y_next = control_flow_ops.cond(accept_step, lambda: y1, lambda: y0) + f_next = control_flow_ops.cond(accept_step, lambda: f1, lambda: f0) + t_next = control_flow_ops.cond(accept_step, lambda: t0 + dt, lambda: t0) + interp_coeff = control_flow_ops.cond( + accept_step, + lambda: _interp_fit_rk(y0, y1, k, dt), + lambda: interp_coeff) + dt_next = _optimal_step_size(dt, error_ratio, safety, ifactor, dfactor) + rk_state = _RungeKuttaState( + y_next, f_next, t0, t_next, dt_next, interp_coeff) + + with ops.name_scope('update/history'): + history = _History(_ta_append(history.integrate_points, t0 + dt), + _ta_append(history.error_ratio, error_ratio)) + return rk_state, history, n_steps + 1 + + def interpolate(solution, history, rk_state, i): + """Interpolate through the next time point, integrating as necessary.""" + with ops.name_scope('interpolate'): + rk_state, history, _ = control_flow_ops.while_loop( + lambda rk_state, *_: t[i] > rk_state.t1, + adaptive_runge_kutta_step, + (rk_state, history, 0), + name='integrate_loop') + y = _interp_evaluate( + rk_state.interp_coeff, rk_state.t0, rk_state.t1, t[i]) + solution = solution.write(i, y) + return solution, history, rk_state, i + 1 + + assert_increasing = control_flow_ops.Assert( + math_ops.reduce_all(t[1:] > t[:-1]), + ['`t` must be monotonic increasing']) + with ops.control_dependencies([assert_increasing]): + num_times = array_ops.size(t) + + solution = tensor_array_ops.TensorArray( + y0.dtype, size=num_times).write(0, y0) + history = _History( + integrate_points=tensor_array_ops.TensorArray( + t.dtype, size=0, dynamic_size=True), + error_ratio=tensor_array_ops.TensorArray( + rtol.dtype, size=0, dynamic_size=True)) + rk_state = _RungeKuttaState( + y0, func(y0, t[0]), t[0], t[0], first_step, interp_coeff=[y0] * 5) + + solution, history, _, _ = control_flow_ops.while_loop( + lambda _, __, ___, i: i < num_times, + interpolate, + (solution, history, rk_state, 1), + name='interpolate_loop') + + y = solution.pack(name=scope) + y.set_shape(t.get_shape().concatenate(y0.get_shape())) + if not full_output: + return y + else: + integrate_points = history.integrate_points.pack() + info_dict = {'num_func_evals': 6 * array_ops.size(integrate_points) + 1, + 'integrate_points': integrate_points, + 'error_ratio': history.error_ratio.pack()} + return (y, info_dict) + + +def odeint(func, + y0, + t, + rtol=1e-6, + atol=1e-12, + method=None, + options=None, + full_output=False, + name=None): + """Integrate a system of ordinary differential equations. + + Solves the initial value problem for a non-stiff system of first order ode-s: + + ``` + dy/dt = func(y, t), y(t[0]) = y0 + ``` + + where y is a Tensor of any shape. + + For example: + + ``` + # solve `dy/dt = -y`, corresponding to exponential decay + tf.contrib.integrate.odeint(lambda y, _: -y, 1.0, [0, 1, 2]) + => [1, exp(-1), exp(-2)] + ``` + + Output dtypes and numerical precision are based on the dtypes of the inputs + `y0` and `t`. + + Currently, implements 5th order Runge-Kutta with adaptive step size control + and dense output, using the Dormand-Prince method. Similar to the 'dopri5' + method of `scipy.integrate.ode` and MATLAB's `ode45`. + + Based on: Shampine, Lawrence F. (1986), "Some Practical Runge-Kutta Formulas", + Mathematics of Computation, American Mathematical Society, 46 (173): 135-150, + doi:10.2307/2008219 + + Args: + func: Function that maps a Tensor holding the state `y` and a scalar Tensor + `t` into a Tensor of state derivatives with respect to time. 
+    y0: N-D Tensor giving starting value of `y` at time point `t[0]`. May
+      have any floating point or complex dtype.
+    t: 1-D Tensor holding a sequence of time points for which to solve for
+      `y`. The initial time point should be the first element of this
+      sequence, and each time must be larger than the previous time. May
+      have any floating point dtype. If not provided as a Tensor, converted
+      to a Tensor with float64 dtype.
+    rtol: optional float64 Tensor specifying an upper bound on relative
+      error, per element of `y`.
+    atol: optional float64 Tensor specifying an upper bound on absolute
+      error, per element of `y`.
+    method: optional string indicating the integration method to use.
+      Currently, the only valid option is `'dopri5'`.
+    options: optional dict of configuration options for the indicated
+      integration method. Can only be provided if a `method` is explicitly
+      set. For `'dopri5'`, valid options include:
+      * first_step: an initial guess for the size of the first integration
+        step (current default: 1.0, but this may later be changed to use
+        heuristics based on the gradient).
+      * safety: safety factor for adaptive step control, generally a
+        constant in the range 0.8-1 (default: 0.9).
+      * ifactor: maximum factor by which the adaptive step may be increased
+        (default: 10.0).
+      * dfactor: maximum factor by which the adaptive step may be decreased
+        (default: 0.2).
+      * max_num_steps: integer maximum number of integration steps between
+        time points in `t` (default: 1000).
+    full_output: optional boolean. If True, `odeint` returns a tuple
+      `(y, info_dict)` describing the integration process.
+    name: Optional name for this operation.
+
+  Returns:
+    y: (N+1)-D tensor, where the first dimension corresponds to different
+      time points. Contains the solved value of y for each desired time
+      point in `t`, with the initial value `y0` being the first element
+      along the first dimension.
+    info_dict: only if `full_output == True`. A dict with the following
+      values:
+      * num_func_evals: integer Tensor counting the number of function
+        evaluations.
+      * integrate_points: 1D float64 Tensor with the upper bound of each
+        integration time step.
+      * error_ratio: 1D float Tensor with the estimated ratio of the
+        integration error to the error tolerance at each integration step.
+        A ratio greater than 1 corresponds to rejected steps.
+
+  Raises:
+    ValueError: if an invalid `method` is provided, or if `options` is
+      supplied without an explicit `method`.
+    TypeError: if `t` or `y0` has an invalid dtype.
+  """
+  if method is not None and method != 'dopri5':
+    raise ValueError('invalid method: %r' % method)
+
+  if options is None:
+    options = {}
+  elif method is None:
+    raise ValueError('cannot supply `options` without specifying `method`')
+
+  with ops.name_scope(name, 'odeint', [y0, t, rtol, atol]) as scope:
+    # TODO(shoyer): use nest.flatten (like tf.while_loop) to allow `y0` to
+    # be an arbitrarily nested tuple. This will help performance and
+    # usability by avoiding the need to pack/unpack in user functions.
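The docstring above fixes the options contract; a hypothetical usage sketch (not part of this change; the variable names are invented) that passes solver options together with `full_output`:

```
import numpy as np
import tensorflow as tf

# Solve dy/dt = -y; `method` must be given whenever `options` is supplied.
t = np.linspace(0.0, 2.0, 5)
y_op = tf.contrib.integrate.odeint(
    lambda y, _: -y, np.float64(1.0), t,
    rtol=1e-8,
    method='dopri5',
    options={'first_step': 0.5, 'max_num_steps': 500},
    full_output=True)
with tf.Session() as sess:
  y_solved, info = sess.run(y_op)
# y_solved approximates exp(-t); info['integrate_points'] holds the upper
# bound of every internal step, and info['num_func_evals'] the number of
# derivative evaluations.
```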
+    y0 = ops.convert_to_tensor(y0, name='y0')
+    if not (y0.dtype.is_floating or y0.dtype.is_complex):
+      raise TypeError('`y0` must have a floating point or complex floating '
+                      'point dtype')
+
+    t = ops.convert_to_tensor(t, preferred_dtype=dtypes.float64, name='t')
+    if not t.dtype.is_floating:
+      raise TypeError('`t` must have a floating point dtype')
+
+    error_dtype = abs(y0).dtype
+    rtol = ops.convert_to_tensor(rtol, dtype=error_dtype, name='rtol')
+    atol = ops.convert_to_tensor(atol, dtype=error_dtype, name='atol')
+
+    return _dopri5(func, y0, t,
+                   rtol=rtol,
+                   atol=atol,
+                   full_output=full_output,
+                   name=scope,
+                   **options)
diff --git a/tensorflow/contrib/integrate/python/ops/odes_test.py b/tensorflow/contrib/integrate/python/ops/odes_test.py
new file mode 100644
index 00000000000..cb036bf05ac
--- /dev/null
+++ b/tensorflow/contrib/integrate/python/ops/odes_test.py
@@ -0,0 +1,232 @@
+# Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+
+"""Tests for ODE solvers."""
+from __future__ import absolute_import
+from __future__ import division
+from __future__ import print_function
+
+import numpy as np
+import tensorflow as tf
+
+from tensorflow.contrib.integrate.python.ops import odes
+
+
+class OdeIntTest(tf.test.TestCase):
+
+  def setUp(self):
+    super(OdeIntTest, self).setUp()
+    # simple defaults (solution is a sine wave)
+    matrix = tf.constant([[0, 1], [-1, 0]], dtype=tf.float64)
+    self.func = lambda y, t: tf.matmul(matrix, y)
+    self.y0 = np.array([[1.0], [0.0]])
+
+  def test_odeint_exp(self):
+    # Test odeint on an exponential function:
+    #   dy / dt = y, y(0) = 1.0.
+    # Its analytical solution is y = exp(t).
+    func = lambda y, t: y
+    y0 = tf.constant(1.0, dtype=tf.float64)
+    t = np.linspace(0.0, 1.0, 11)
+    y_solved = tf.contrib.integrate.odeint(func, y0, t)
+    self.assertIn('odeint', y_solved.name)
+    self.assertEqual(y_solved.get_shape(), tf.TensorShape([11]))
+    with self.test_session() as sess:
+      y_solved = sess.run(y_solved)
+    y_true = np.exp(t)
+    self.assertAllClose(y_true, y_solved)
+
+  def test_odeint_complex(self):
+    # Test a complex, linear ODE:
+    #   dy / dt = k * y, y(0) = 1.0.
+    # Its analytical solution is y = exp(k * t).
+    k = 1j - 0.1
+    func = lambda y, t: k * y
+    t = np.linspace(0.0, 1.0, 11)
+    y_solved = tf.contrib.integrate.odeint(func, 1.0 + 0.0j, t)
+    with self.test_session() as sess:
+      y_solved = sess.run(y_solved)
+    y_true = np.exp(k * t)
+    self.assertAllClose(y_true, y_solved)
+
+  def test_odeint_riccati(self):
+    # The Riccati equation is:
+    #   dy / dt = (y - t) ** 2 + 1.0, y(0) = 0.5.
+    # Its analytical solution is y = 1.0 / (2.0 - t) + t.
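A note on the lambda that follows: its parameters are written `(t, y)`, while `odeint` calls `func(y, t)`. The test remains correct only because `(y - t) ** 2` is symmetric in its two arguments, as this tiny check (illustrative only) confirms:

```
# Swapping the arguments leaves this particular right-hand side unchanged:
f = lambda t, y: (y - t) ** 2 + 1.0
assert f(0.25, 0.5) == f(0.5, 0.25) == 1.0625
```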
+ func = lambda t, y: (y - t)**2 + 1.0 + t = np.linspace(0.0, 1.0, 11) + y_solved = tf.contrib.integrate.odeint(func, np.float64(0.5), t) + with self.test_session() as sess: + y_solved = sess.run(y_solved) + y_true = 1.0 / (2.0 - t) + t + self.assertAllClose(y_true, y_solved) + + def test_odeint_2d_linear(self): + # Solve the 2D linear differential equation: + # dy1 / dt = 3.0 * y1 + 4.0 * y2, + # dy2 / dt = -4.0 * y1 + 3.0 * y2, + # y1(0) = 0.0, + # y2(0) = 1.0. + # Its analytical solution is + # y1 = sin(4.0 * t) * exp(3.0 * t), + # y2 = cos(4.0 * t) * exp(3.0 * t). + matrix = tf.constant([[3.0, 4.0], [-4.0, 3.0]], dtype=tf.float64) + func = lambda y, t: tf.matmul(matrix, y) + + y0 = tf.constant([[0.0], [1.0]], dtype=tf.float64) + t = np.linspace(0.0, 1.0, 11) + + y_solved = tf.contrib.integrate.odeint(func, y0, t) + with self.test_session() as sess: + y_solved = sess.run(y_solved) + + y_true = np.zeros((len(t), 2, 1)) + y_true[:, 0, 0] = np.sin(4.0 * t) * np.exp(3.0 * t) + y_true[:, 1, 0] = np.cos(4.0 * t) * np.exp(3.0 * t) + self.assertAllClose(y_true, y_solved, atol=1e-5) + + def test_odeint_higher_rank(self): + func = lambda y, t: y + y0 = tf.constant(1.0, dtype=tf.float64) + t = np.linspace(0.0, 1.0, 11) + for shape in [(), (1,), (1, 1)]: + expected_shape = (len(t),) + shape + y_solved = tf.contrib.integrate.odeint(func, tf.reshape(y0, shape), t) + self.assertEqual(y_solved.get_shape(), tf.TensorShape(expected_shape)) + with self.test_session() as sess: + y_solved = sess.run(y_solved) + self.assertEquals(y_solved.shape, expected_shape) + + def test_odeint_all_dtypes(self): + func = lambda y, t: y + t = np.linspace(0.0, 1.0, 11) + for y0_dtype in [tf.float32, tf.float64, tf.complex64, tf.complex128]: + for t_dtype in [tf.float32, tf.float64]: + y0 = tf.cast(1.0, y0_dtype) + y_solved = tf.contrib.integrate.odeint(func, y0, tf.cast(t, t_dtype)) + with self.test_session() as sess: + y_solved = sess.run(y_solved) + expected = np.asarray(np.exp(t)) + self.assertAllClose(y_solved, expected, rtol=1e-5) + self.assertEqual(tf.as_dtype(y_solved.dtype), y0_dtype) + + def test_odeint_required_dtypes(self): + with self.assertRaisesRegexp(TypeError, '`y0` must have a floating point'): + tf.contrib.integrate.odeint(self.func, tf.cast(self.y0, tf.int32), [0, 1]) + + with self.assertRaisesRegexp(TypeError, '`t` must have a floating point'): + tf.contrib.integrate.odeint(self.func, self.y0, tf.cast([0, 1], tf.int32)) + + def test_odeint_runtime_errors(self): + with self.assertRaisesRegexp( + ValueError, 'cannot supply `options` without'): + tf.contrib.integrate.odeint(self.func, self.y0, [0, 1], + options={'first_step': 1.0}) + + y = tf.contrib.integrate.odeint(self.func, self.y0, [0, 1], method='dopri5', + options={'max_num_steps': 0}) + with self.test_session() as sess: + with self.assertRaisesRegexp( + tf.errors.InvalidArgumentError, 'max_num_steps'): + sess.run(y) + + y = tf.contrib.integrate.odeint(self.func, self.y0, [1, 0]) + with self.test_session() as sess: + with self.assertRaisesRegexp( + tf.errors.InvalidArgumentError, 'monotonic increasing'): + sess.run(y) + + def test_odeint_different_times(self): + # integrate steps should be independent of interpolation times + times0 = np.linspace(0, 10, num=11, dtype=float) + times1 = np.linspace(0, 10, num=101, dtype=float) + + with self.test_session() as sess: + y_solved_0, info_0 = sess.run( + tf.contrib.integrate.odeint( + self.func, self.y0, times0, full_output=True)) + y_solved_1, info_1 = sess.run( + tf.contrib.integrate.odeint( + self.func, 
self.y0, times1, full_output=True)) + + self.assertAllClose(y_solved_0, y_solved_1[::10]) + self.assertEqual(info_0['num_func_evals'], info_1['num_func_evals']) + self.assertAllEqual(info_0['integrate_points'], info_1['integrate_points']) + self.assertAllEqual(info_0['error_ratio'], info_1['error_ratio']) + + def test_odeint_5th_order_accuracy(self): + t = [0, 20] + kwargs = dict(full_output=True, + method='dopri5', + options=dict(max_num_steps=2000)) + with self.test_session() as sess: + _, info_0 = sess.run(tf.contrib.integrate.odeint( + self.func, self.y0, t, rtol=0, atol=1e-6, **kwargs)) + _, info_1 = sess.run(tf.contrib.integrate.odeint( + self.func, self.y0, t, rtol=0, atol=1e-9, **kwargs)) + self.assertAllClose(info_0['integrate_points'].size * 1000 ** 0.2, + float(info_1['integrate_points'].size), + rtol=0.01) + + +class StepSizeTest(tf.test.TestCase): + + def test_error_ratio_one(self): + new_step = odes._optimal_step_size(last_step=tf.constant(1.0), + error_ratio=tf.constant(1.0)) + with self.test_session() as sess: + new_step = sess.run(new_step) + self.assertAllClose(new_step, 0.9) + + def test_ifactor(self): + new_step = odes._optimal_step_size(last_step=tf.constant(1.0), + error_ratio=tf.constant(0.0)) + with self.test_session() as sess: + new_step = sess.run(new_step) + self.assertAllClose(new_step, 10.0) + + def test_dfactor(self): + new_step = odes._optimal_step_size(last_step=tf.constant(1.0), + error_ratio=tf.constant(1e6)) + with self.test_session() as sess: + new_step = sess.run(new_step) + self.assertAllClose(new_step, 0.2) + + +class InterpolationTest(tf.test.TestCase): + + def test_5th_order_polynomial(self): + # this should be an exact fit + f = lambda x: x ** 4 + x ** 3 - 2 * x ** 2 + 4 * x + 5 + f_prime = lambda x: 4 * x ** 3 + 3 * x ** 2 - 4 * x + 4 + coeffs = odes._interp_fit( + f(0.0), f(10.0), f(5.0), f_prime(0.0), f_prime(10.0), 10.0) + times = np.linspace(0, 10, dtype=np.float32) + y_fit = tf.pack([odes._interp_evaluate(coeffs, 0.0, 10.0, t) + for t in times]) + y_expected = f(times) + with self.test_session() as sess: + y_actual = sess.run(y_fit) + self.assertAllClose(y_expected, y_actual) + + # attempt interpolation outside bounds + y_invalid = odes._interp_evaluate(coeffs, 0.0, 10.0, 100.0) + with self.test_session() as sess: + with self.assertRaises(tf.errors.InvalidArgumentError): + sess.run(y_invalid) + + +if __name__ == '__main__': + tf.test.main() diff --git a/tensorflow/contrib/layers/python/layers/embedding_ops.py b/tensorflow/contrib/layers/python/layers/embedding_ops.py index 106f7bcf50a..299282b45db 100644 --- a/tensorflow/contrib/layers/python/layers/embedding_ops.py +++ b/tensorflow/contrib/layers/python/layers/embedding_ops.py @@ -22,6 +22,7 @@ from tensorflow.contrib.layers.python.ops import sparse_feature_cross_op from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.framework import tensor_shape from tensorflow.python.ops import array_ops from tensorflow.python.ops import embedding_ops @@ -114,8 +115,9 @@ def safe_embedding_lookup_sparse(embedding_weights, array_ops.slice(original_shape, [0], [original_rank - 1])), array_ops.gather(original_shape, original_rank - 1)]) if sparse_weights is not None: - sparse_weights = ops.SparseTensor(sparse_ids.indices, - sparse_weights.values, sparse_ids.shape) + sparse_weights = sparse_tensor.SparseTensor( + sparse_ids.indices, + sparse_weights.values, sparse_ids.shape) # Prune invalid ids 
and weights. sparse_ids, sparse_weights = _prune_invalid_ids(sparse_ids, sparse_weights) @@ -302,7 +304,7 @@ def hashed_embedding_lookup_sparse(params, params = list(params) if not isinstance(params, list): params = [params] - if not isinstance(sparse_values, ops.SparseTensor): + if not isinstance(sparse_values, sparse_tensor.SparseTensor): raise TypeError("sparse_values must be SparseTensor") with ops.name_scope(name, "hashed_sparse_embedding_lookup", diff --git a/tensorflow/contrib/layers/python/layers/encoders.py b/tensorflow/contrib/layers/python/layers/encoders.py index e770f9116f1..8b6abb4b456 100644 --- a/tensorflow/contrib/layers/python/layers/encoders.py +++ b/tensorflow/contrib/layers/python/layers/encoders.py @@ -21,7 +21,7 @@ from __future__ import print_function from tensorflow.contrib.framework.python.ops import variables from tensorflow.contrib.layers.python.layers import embedding_ops as contrib_embedding_ops from tensorflow.contrib.layers.python.ops import sparse_ops -from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import embedding_ops from tensorflow.python.ops import math_ops from tensorflow.python.ops import variable_scope @@ -74,14 +74,14 @@ def bow_encoder(ids, initializer=initializer, regularizer=regularizer, trainable=trainable) if sparse_lookup: - if isinstance(ids, ops.SparseTensor): + if isinstance(ids, sparse_tensor.SparseTensor): sparse_ids = ids else: sparse_ids = sparse_ops.dense_to_sparse_tensor(ids) return contrib_embedding_ops.safe_embedding_lookup_sparse( [embeddings], sparse_ids, combiner='mean', default_id=0) else: - if isinstance(ids, ops.SparseTensor): + if isinstance(ids, sparse_tensor.SparseTensor): raise TypeError('ids are expected to be dense Tensor, got: %s', ids) return math_ops.reduce_mean( embedding_ops.embedding_lookup(embeddings, ids), diff --git a/tensorflow/contrib/layers/python/layers/feature_column.py b/tensorflow/contrib/layers/python/layers/feature_column.py index 75d77f881e0..314156a5e44 100644 --- a/tensorflow/contrib/layers/python/layers/feature_column.py +++ b/tensorflow/contrib/layers/python/layers/feature_column.py @@ -76,13 +76,12 @@ import collections import math import six -from tensorflow.contrib.framework.python.framework import deprecation from tensorflow.contrib.layers.python.layers import layers from tensorflow.contrib.layers.python.ops import bucketization_op from tensorflow.contrib.layers.python.ops import sparse_feature_cross_op from tensorflow.contrib.lookup import lookup_ops as contrib_lookup_ops from tensorflow.python.framework import dtypes -from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor as sparse_tensor_py from tensorflow.python.ops import array_ops from tensorflow.python.ops import init_ops from tensorflow.python.ops import math_ops @@ -90,6 +89,7 @@ from tensorflow.python.ops import parsing_ops from tensorflow.python.ops import sparse_ops from tensorflow.python.ops import string_ops from tensorflow.python.platform import tf_logging as logging +from tensorflow.python.util import deprecation class _LinearEmbeddingLookupArguments( @@ -390,7 +390,7 @@ class _SparseColumnIntegerized(_SparseColumn): sparse_id_values = math_ops.mod(columns_to_tensors[self.name].values, self.bucket_size, name="mod") - columns_to_tensors[self] = ops.SparseTensor( + columns_to_tensors[self] = sparse_tensor_py.SparseTensor( columns_to_tensors[self.name].indices, sparse_id_values, 
columns_to_tensors[self.name].shape) @@ -464,7 +464,7 @@ class _SparseColumnHashed(_SparseColumn): sparse_id_values = string_ops.string_to_hash_bucket_fast( sparse_values, self.bucket_size, name="lookup") - columns_to_tensors[self] = ops.SparseTensor( + columns_to_tensors[self] = sparse_tensor_py.SparseTensor( sparse_tensor.indices, sparse_id_values, sparse_tensor.shape) @@ -1452,7 +1452,8 @@ class _BucketizedColumn(_FeatureColumn, collections.namedtuple( indices = math_ops.to_int64(array_ops.transpose(array_ops.pack((i1, i2)))) shape = math_ops.to_int64(array_ops.pack([batch_size, dimension])) - sparse_id_values = ops.SparseTensor(indices, bucket_indices, shape) + sparse_id_values = sparse_tensor_py.SparseTensor( + indices, bucket_indices, shape) return sparse_id_values diff --git a/tensorflow/contrib/layers/python/layers/feature_column_ops.py b/tensorflow/contrib/layers/python/layers/feature_column_ops.py index 4000ce88850..16ecd92e670 100644 --- a/tensorflow/contrib/layers/python/layers/feature_column_ops.py +++ b/tensorflow/contrib/layers/python/layers/feature_column_ops.py @@ -26,6 +26,7 @@ from tensorflow.contrib.layers.python.layers import feature_column as fc from tensorflow.contrib.layers.python.layers import layers from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor as sparse_tensor_py from tensorflow.python.ops import array_ops from tensorflow.python.ops import init_ops from tensorflow.python.ops import math_ops @@ -362,9 +363,9 @@ def _create_joint_embedding_lookup(columns_to_tensors, values = t.values + prev_size prev_size += a.vocab_size sparse_tensors.append( - ops.SparseTensor(t.indices, - values, - t.shape)) + sparse_tensor_py.SparseTensor(t.indices, + values, + t.shape)) sparse_tensor = sparse_ops.sparse_concat(1, sparse_tensors) with variable_scope.variable_scope( None, default_name='linear_weights', values=columns_to_tensors.values()): @@ -695,7 +696,7 @@ def _log_variable(variable): def _infer_real_valued_column_for_tensor(name, tensor): """Creates a real_valued_column for given tensor and name.""" - if isinstance(tensor, ops.SparseTensor): + if isinstance(tensor, sparse_tensor_py.SparseTensor): raise ValueError( 'SparseTensor is not supported for auto detection. 
Please define ' 'corresponding FeatureColumn for tensor {} {}.', name, tensor) diff --git a/tensorflow/contrib/layers/python/layers/feature_column_test.py b/tensorflow/contrib/layers/python/layers/feature_column_test.py index 67c2d3c6525..2e8bf9ffef2 100644 --- a/tensorflow/contrib/layers/python/layers/feature_column_test.py +++ b/tensorflow/contrib/layers/python/layers/feature_column_test.py @@ -21,6 +21,7 @@ from __future__ import print_function import itertools import os +import tempfile import numpy as np import tensorflow as tf @@ -609,7 +610,10 @@ class FeatureColumnTest(tf.test.TestCase): {embedding_col: input_tensor}, [embedding_col]) save = tf.train.Saver() - checkpoint_path = os.path.join(self.get_temp_dir(), "model.ckpt") + ckpt_dir_prefix = os.path.join( + self.get_temp_dir(), "init_embedding_col_w_from_ckpt") + ckpt_dir = tempfile.mkdtemp(prefix=ckpt_dir_prefix) + checkpoint_path = os.path.join(ckpt_dir, "model.ckpt") with self.test_session() as sess: sess.run(tf.initialize_all_variables()) @@ -670,7 +674,10 @@ class FeatureColumnTest(tf.test.TestCase): assign_op = tf.assign(weight[0], weight[0] + 0.5) save = tf.train.Saver() - checkpoint_path = os.path.join(self.get_temp_dir(), "model.ckpt") + ckpt_dir_prefix = os.path.join( + self.get_temp_dir(), "init_crossed_col_w_from_ckpt") + ckpt_dir = tempfile.mkdtemp(prefix=ckpt_dir_prefix) + checkpoint_path = os.path.join(ckpt_dir, "model.ckpt") with self.test_session() as sess: sess.run(tf.initialize_all_variables()) diff --git a/tensorflow/contrib/layers/python/layers/layers.py b/tensorflow/contrib/layers/python/layers/layers.py index cb5d34faeff..3d08cedcab4 100644 --- a/tensorflow/contrib/layers/python/layers/layers.py +++ b/tensorflow/contrib/layers/python/layers/layers.py @@ -31,6 +31,7 @@ from tensorflow.contrib.layers.python.layers import utils from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import check_ops from tensorflow.python.ops import init_ops @@ -1217,7 +1218,7 @@ def _inner_flatten(inputs, new_rank, output_collections=None, scope=None): TypeError: `inputs` is not a `Tensor` or `SparseTensor`. 
""" with ops.name_scope(scope, 'InnerFlatten', [inputs, new_rank]) as sc: - if isinstance(inputs, ops.SparseTensor): + if isinstance(inputs, sparse_tensor.SparseTensor): flattened = _sparse_inner_flatten(inputs, new_rank) else: inputs = ops.convert_to_tensor(inputs) diff --git a/tensorflow/contrib/layers/python/layers/optimizers.py b/tensorflow/contrib/layers/python/layers/optimizers.py index 8c06202f47b..6cb7e91b73f 100644 --- a/tensorflow/contrib/layers/python/layers/optimizers.py +++ b/tensorflow/contrib/layers/python/layers/optimizers.py @@ -258,10 +258,11 @@ def optimize_loss(loss, grad_values = gradient if grad_values is not None: + var_name = variable.name.replace(":", "_") if "gradients" in summaries: - summary.histogram("gradients/" + variable.name, grad_values) + summary.histogram("gradients/%s" % var_name, grad_values) if "gradient_norm" in summaries: - summary.scalar("gradient_norm/" + variable.name, + summary.scalar("gradient_norm/%s" % var_name, clip_ops.global_norm([grad_values])) if clip_gradients is not None and "gradient_norm" in summaries: diff --git a/tensorflow/contrib/layers/python/layers/target_column_test.py b/tensorflow/contrib/layers/python/layers/target_column_test.py index 1573517b6f4..defbd2f455e 100644 --- a/tensorflow/contrib/layers/python/layers/target_column_test.py +++ b/tensorflow/contrib/layers/python/layers/target_column_test.py @@ -58,7 +58,7 @@ class MultiClassTargetColumnTest(tf.test.TestCase): labels = tf.constant([[1.], [0.]]) # logloss: z:label, x:logit # z * -log(sigmoid(x)) + (1 - z) * -log(1 - sigmoid(x)) - self.assertAlmostEqual(.81326163, + self.assertAlmostEqual(0.81326175, sess.run(target_column.loss(logits, labels, {}))) def testBinaryClassificationWithWeights(self): diff --git a/tensorflow/contrib/layers/python/ops/sparse_feature_cross_op.py b/tensorflow/contrib/layers/python/ops/sparse_feature_cross_op.py index 7a35732049c..35edf280ef8 100644 --- a/tensorflow/contrib/layers/python/ops/sparse_feature_cross_op.py +++ b/tensorflow/contrib/layers/python/ops/sparse_feature_cross_op.py @@ -23,6 +23,7 @@ from tensorflow.contrib.util import loader from tensorflow.python.framework import common_shapes from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import math_ops from tensorflow.python.platform import resource_loader @@ -69,12 +70,14 @@ def sparse_feature_cross(inputs, hashed_output=False, num_buckets=0, """ if not isinstance(inputs, list): raise TypeError("Inputs must be a list") - if not all(isinstance(i, ops.SparseTensor) or + if not all(isinstance(i, sparse_tensor.SparseTensor) or isinstance(i, ops.Tensor) for i in inputs): raise TypeError("All inputs must be SparseTensors") - sparse_inputs = [i for i in inputs if isinstance(i, ops.SparseTensor)] - dense_inputs = [i for i in inputs if not isinstance(i, ops.SparseTensor)] + sparse_inputs = [i for i in inputs + if isinstance(i, sparse_tensor.SparseTensor)] + dense_inputs = [i for i in inputs + if not isinstance(i, sparse_tensor.SparseTensor)] indices = [sp_input.indices for sp_input in sparse_inputs] values = [sp_input.values for sp_input in sparse_inputs] @@ -117,7 +120,7 @@ def sparse_feature_cross(inputs, hashed_output=False, num_buckets=0, internal_type=internal_type, name=name)) - return ops.SparseTensor(indices_out, values_out, shape_out) + return sparse_tensor.SparseTensor(indices_out, values_out, shape_out) 
ops.RegisterShape("SparseFeatureCross")(common_shapes.call_cpp_shape_fn) diff --git a/tensorflow/contrib/layers/python/ops/sparse_ops.py b/tensorflow/contrib/layers/python/ops/sparse_ops.py index a6e5ac0aa88..325f5ac97bf 100644 --- a/tensorflow/contrib/layers/python/ops/sparse_ops.py +++ b/tensorflow/contrib/layers/python/ops/sparse_ops.py @@ -20,6 +20,7 @@ from __future__ import print_function from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import math_ops @@ -78,4 +79,4 @@ def dense_to_sparse_tensor(dense_tensor, ignore_value=None): math_ops.mul(higher_dims, shape_multipliers), reduction_indices=[1]) flat_indices = math_ops.add(flat_indices, offsets) values = array_ops.gather(flat_tensor, flat_indices) - return ops.SparseTensor(indices, values, dense_shape) + return sparse_tensor.SparseTensor(indices, values, dense_shape) diff --git a/tensorflow/contrib/learn/BUILD b/tensorflow/contrib/learn/BUILD index 62d7bb77c98..b93089c9cb7 100644 --- a/tensorflow/contrib/learn/BUILD +++ b/tensorflow/contrib/learn/BUILD @@ -291,7 +291,9 @@ py_test( deps = [ ":learn", "//tensorflow:tensorflow_py", + "//tensorflow/python:extra_py_tests_deps", "//tensorflow/python:framework_test_lib", + "//tensorflow/python:test_ops", ], ) diff --git a/tensorflow/contrib/learn/python/learn/dataframe/estimator_utils.py b/tensorflow/contrib/learn/python/learn/dataframe/estimator_utils.py index 16eff25d102..0ca8afe498b 100644 --- a/tensorflow/contrib/learn/python/learn/dataframe/estimator_utils.py +++ b/tensorflow/contrib/learn/python/learn/dataframe/estimator_utils.py @@ -22,11 +22,12 @@ from __future__ import print_function from tensorflow.contrib.layers import feature_column from tensorflow.contrib.learn.python.learn.dataframe import series as ss from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import parsing_ops def _to_feature_spec(tensor, default_value=None): - if isinstance(tensor, ops.SparseTensor): + if isinstance(tensor, sparse_tensor.SparseTensor): return parsing_ops.VarLenFeature(dtype=tensor.dtype) else: return parsing_ops.FixedLenFeature(shape=tensor.get_shape(), diff --git a/tensorflow/contrib/learn/python/learn/dataframe/transforms/binary_transforms.py b/tensorflow/contrib/learn/python/learn/dataframe/transforms/binary_transforms.py index b3e52254032..2a59fceb742 100644 --- a/tensorflow/contrib/learn/python/learn/dataframe/transforms/binary_transforms.py +++ b/tensorflow/contrib/learn/python/learn/dataframe/transforms/binary_transforms.py @@ -20,7 +20,7 @@ from __future__ import print_function from tensorflow.contrib.learn.python.learn.dataframe import series from tensorflow.contrib.learn.python.learn.dataframe import transform -from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import math_ops # Each entry is a mapping from registered_name to operation. Each operation is @@ -55,8 +55,8 @@ class SeriesBinaryTransform(transform.TensorFlowTransform): def _apply_transform(self, input_tensors, **kwargs): # TODO(jamieas): consider supporting sparse inputs. 
- if isinstance(input_tensors[0], ops.SparseTensor) or isinstance( - input_tensors[1], ops.SparseTensor): + if isinstance(input_tensors[0], sparse_tensor.SparseTensor) or isinstance( + input_tensors[1], sparse_tensor.SparseTensor): raise TypeError("{} does not support SparseTensors".format( type(self).__name__)) @@ -89,10 +89,10 @@ class ScalarBinaryTransform(transform.TensorFlowTransform): def _apply_transform(self, input_tensors, **kwargs): input_tensor = input_tensors[0] - if isinstance(input_tensor, ops.SparseTensor): - result = ops.SparseTensor(input_tensor.indices, - self._apply_op(input_tensor.values), - input_tensor.shape) + if isinstance(input_tensor, sparse_tensor.SparseTensor): + result = sparse_tensor.SparseTensor(input_tensor.indices, + self._apply_op(input_tensor.values), + input_tensor.shape) else: result = self._apply_op(input_tensor) diff --git a/tensorflow/contrib/learn/python/learn/dataframe/transforms/boolean_mask.py b/tensorflow/contrib/learn/python/learn/dataframe/transforms/boolean_mask.py index 880217f558a..130ac0c90f5 100644 --- a/tensorflow/contrib/learn/python/learn/dataframe/transforms/boolean_mask.py +++ b/tensorflow/contrib/learn/python/learn/dataframe/transforms/boolean_mask.py @@ -23,6 +23,7 @@ from tensorflow.contrib.learn.python.learn.dataframe import series from tensorflow.contrib.learn.python.learn.dataframe import transform from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor as sparse_tensor_py from tensorflow.python.ops import array_ops from tensorflow.python.ops import functional_ops from tensorflow.python.ops import math_ops @@ -93,7 +94,7 @@ class BooleanMask(transform.TensorFlowTransform): if mask.get_shape().ndims > 1: mask = array_ops.squeeze(mask) - if isinstance(input_tensor, ops.SparseTensor): + if isinstance(input_tensor, sparse_tensor_py.SparseTensor): mask_fn = sparse_boolean_mask else: mask_fn = array_ops.boolean_mask diff --git a/tensorflow/contrib/learn/python/learn/dataframe/transforms/difference.py b/tensorflow/contrib/learn/python/learn/dataframe/transforms/difference.py index f9cb0c94855..6ce71d882e5 100644 --- a/tensorflow/contrib/learn/python/learn/dataframe/transforms/difference.py +++ b/tensorflow/contrib/learn/python/learn/dataframe/transforms/difference.py @@ -21,14 +21,14 @@ from __future__ import print_function from tensorflow.contrib.learn.python.learn.dataframe import series from tensorflow.contrib.learn.python.learn.dataframe import transform -from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import sparse_ops -def _negate_sparse(sparse_tensor): - return ops.SparseTensor(indices=sparse_tensor.indices, - values=-sparse_tensor.values, - shape=sparse_tensor.shape) +def _negate_sparse(st): + return sparse_tensor.SparseTensor(indices=st.indices, + values=-st.values, + shape=st.shape) @series.Series.register_binary_op("__sub__") @@ -51,8 +51,8 @@ class Difference(transform.TensorFlowTransform): return "output", def _apply_transform(self, input_tensors, **kwargs): - pair_sparsity = (isinstance(input_tensors[0], ops.SparseTensor), - isinstance(input_tensors[1], ops.SparseTensor)) + pair_sparsity = (isinstance(input_tensors[0], sparse_tensor.SparseTensor), + isinstance(input_tensors[1], sparse_tensor.SparseTensor)) if pair_sparsity == (False, False): result = input_tensors[0] - input_tensors[1] diff --git 
a/tensorflow/contrib/learn/python/learn/dataframe/transforms/sparsify.py b/tensorflow/contrib/learn/python/learn/dataframe/transforms/sparsify.py index 05b66a683c0..de83a0e19f4 100644 --- a/tensorflow/contrib/learn/python/learn/dataframe/transforms/sparsify.py +++ b/tensorflow/contrib/learn/python/learn/dataframe/transforms/sparsify.py @@ -24,7 +24,7 @@ import numpy as np from tensorflow.contrib.learn.python.learn.dataframe import transform from tensorflow.python.framework import dtypes -from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import math_ops @@ -82,4 +82,5 @@ class Sparsify(transform.TensorFlowTransform): shape = math_ops.cast(array_ops.shape(d), dtypes.int64) # pylint: disable=not-callable - return self.return_type(ops.SparseTensor(sparse_indices, values, shape)) + return self.return_type( + sparse_tensor.SparseTensor(sparse_indices, values, shape)) diff --git a/tensorflow/contrib/learn/python/learn/dataframe/transforms/sum.py b/tensorflow/contrib/learn/python/learn/dataframe/transforms/sum.py index 212ac178f28..10c13ce4985 100644 --- a/tensorflow/contrib/learn/python/learn/dataframe/transforms/sum.py +++ b/tensorflow/contrib/learn/python/learn/dataframe/transforms/sum.py @@ -21,7 +21,7 @@ from __future__ import print_function from tensorflow.contrib.learn.python.learn.dataframe import series from tensorflow.contrib.learn.python.learn.dataframe import transform -from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import sparse_ops @@ -45,8 +45,8 @@ class Sum(transform.TensorFlowTransform): return "output", def _apply_transform(self, input_tensors, **kwargs): - pair_sparsity = (isinstance(input_tensors[0], ops.SparseTensor), - isinstance(input_tensors[1], ops.SparseTensor)) + pair_sparsity = (isinstance(input_tensors[0], sparse_tensor.SparseTensor), + isinstance(input_tensors[1], sparse_tensor.SparseTensor)) if pair_sparsity == (False, False): result = input_tensors[0] + input_tensors[1] @@ -57,6 +57,3 @@ class Sum(transform.TensorFlowTransform): # pylint: disable=not-callable return self.return_type(result) - - - diff --git a/tensorflow/contrib/learn/python/learn/dataframe/transforms/unary_transforms.py b/tensorflow/contrib/learn/python/learn/dataframe/transforms/unary_transforms.py index eab476eb99e..8734b4669d2 100644 --- a/tensorflow/contrib/learn/python/learn/dataframe/transforms/unary_transforms.py +++ b/tensorflow/contrib/learn/python/learn/dataframe/transforms/unary_transforms.py @@ -21,7 +21,7 @@ from __future__ import print_function from tensorflow.contrib.learn.python.learn.dataframe import series from tensorflow.contrib.learn.python.learn.dataframe import transform -from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import math_ops # Each entry is a mapping from registered_name to operation. 
Each operation is @@ -83,10 +83,10 @@ def register_unary_op(registered_name, operation, ignore_dtype=None): def _apply_transform(self, input_tensors, **kwargs): input_tensor = input_tensors[0] - if isinstance(input_tensor, ops.SparseTensor): - result = ops.SparseTensor(input_tensor.indices, - operation(input_tensor.values), - input_tensor.shape) + if isinstance(input_tensor, sparse_tensor.SparseTensor): + result = sparse_tensor.SparseTensor(input_tensor.indices, + operation(input_tensor.values), + input_tensor.shape) else: result = operation(input_tensor) # pylint: disable=not-callable diff --git a/tensorflow/contrib/learn/python/learn/estimators/__init__.py b/tensorflow/contrib/learn/python/learn/estimators/__init__.py index b5b1dbb6355..cfe2fb15985 100644 --- a/tensorflow/contrib/learn/python/learn/estimators/__init__.py +++ b/tensorflow/contrib/learn/python/learn/estimators/__init__.py @@ -29,11 +29,11 @@ from tensorflow.contrib.learn.python.learn.estimators.estimator import Estimator from tensorflow.contrib.learn.python.learn.estimators.estimator import infer_real_valued_columns_from_input from tensorflow.contrib.learn.python.learn.estimators.estimator import infer_real_valued_columns_from_input_fn from tensorflow.contrib.learn.python.learn.estimators.estimator import ModeKeys -from tensorflow.contrib.learn.python.learn.estimators.head import MetricKey -from tensorflow.contrib.learn.python.learn.estimators.head import PredictionKey from tensorflow.contrib.learn.python.learn.estimators.linear import LinearClassifier from tensorflow.contrib.learn.python.learn.estimators.linear import LinearRegressor from tensorflow.contrib.learn.python.learn.estimators.logistic_regressor import LogisticRegressor +from tensorflow.contrib.learn.python.learn.estimators.metric_key import MetricKey +from tensorflow.contrib.learn.python.learn.estimators.prediction_key import PredictionKey from tensorflow.contrib.learn.python.learn.estimators.random_forest import TensorForestEstimator from tensorflow.contrib.learn.python.learn.estimators.random_forest import TensorForestLossHook from tensorflow.contrib.learn.python.learn.estimators.run_config import RunConfig diff --git a/tensorflow/contrib/learn/python/learn/estimators/dnn_linear_combined.py b/tensorflow/contrib/learn/python/learn/estimators/dnn_linear_combined.py index 64a92f5ffbb..3146a1e7c81 100644 --- a/tensorflow/contrib/learn/python/learn/estimators/dnn_linear_combined.py +++ b/tensorflow/contrib/learn/python/learn/estimators/dnn_linear_combined.py @@ -19,7 +19,8 @@ from __future__ import absolute_import from __future__ import division from __future__ import print_function -import numpy as np +import math +import re import six from tensorflow.contrib import layers @@ -27,13 +28,23 @@ from tensorflow.contrib.framework import deprecated from tensorflow.contrib.framework import deprecated_arg_values from tensorflow.contrib.framework.python.ops import variables as contrib_variables from tensorflow.contrib.layers.python.layers import feature_column_ops +from tensorflow.contrib.layers.python.layers import optimizers +from tensorflow.contrib.learn.python.learn import evaluable +from tensorflow.contrib.learn.python.learn import session_run_hook +from tensorflow.contrib.learn.python.learn import trainable from tensorflow.contrib.learn.python.learn.estimators import composable_model from tensorflow.contrib.learn.python.learn.estimators import estimator from tensorflow.contrib.learn.python.learn.estimators import head as head_lib +from 
tensorflow.contrib.learn.python.learn.estimators import prediction_key +from tensorflow.contrib.learn.python.learn.utils import export from tensorflow.python.framework import ops +from tensorflow.python.ops import control_flow_ops +from tensorflow.python.ops import logging_ops from tensorflow.python.ops import nn from tensorflow.python.ops import parsing_ops +from tensorflow.python.ops import partitioned_variables from tensorflow.python.ops import state_ops +from tensorflow.python.ops import variable_scope class _DNNLinearCombinedBaseEstimator(estimator.BaseEstimator): @@ -307,7 +318,236 @@ class _DNNLinearCombinedBaseEstimator(estimator.BaseEstimator): return logits -class DNNLinearCombinedClassifier(_DNNLinearCombinedBaseEstimator): +_CENTERED_BIAS_WEIGHT = "centered_bias_weight" + +# The default learning rates are a historical artifact of the initial +# implementation, but seem a reasonable choice. +_DNN_LEARNING_RATE = 0.05 +_LINEAR_LEARNING_RATE = 0.2 + + +def _as_iterable(preds, output): + for pred in preds: + yield pred[output] + + +def _get_feature_dict(features): + if isinstance(features, dict): + return features + return {"": features} + + +def _get_optimizer(optimizer): + if callable(optimizer): + return optimizer() + else: + return optimizer + + +def _linear_learning_rate(num_linear_feature_columns): + """Returns the default learning rate of the linear model. + + The calculation is a historical artifact of this initial implementation, but + has proven a reasonable choice. + + Args: + num_linear_feature_columns: The number of feature columns of the linear + model. + + Returns: + A float. + """ + default_learning_rate = 1. / math.sqrt(num_linear_feature_columns) + return min(_LINEAR_LEARNING_RATE, default_learning_rate) + + +def _add_hidden_layer_summary(value, tag): + logging_ops.scalar_summary("%s:fraction_of_zero_values" % tag, + nn.zero_fraction(value)) + logging_ops.histogram_summary("%s:activation" % tag, value) + + +def _dnn_linear_combined_model_fn(features, labels, mode, params): + """Deep Neural Net and Linear combined model_fn. + + Args: + features: `Tensor` or dict of `Tensor` (depends on data passed to `fit`). + labels: `Tensor` of shape [batch_size, 1] or [batch_size] labels of dtype + `int32` or `int64` in the range `[0, n_classes)`. + mode: Defines whether this is training, evaluation or prediction. + See `ModeKeys`. + params: A dict of hyperparameters. + The following hyperparameters are expected: + * head: A `Head` instance. + * linear_feature_columns: An iterable containing all the feature columns + used by the Linear model. + * linear_optimizer: string, `Optimizer` object, or callable that defines + the optimizer to use for training the Linear model. + * joint_linear_weights: If True a single (possibly partitioned) variable + will be used to store the linear model weights. It's faster, but + requires all columns are sparse and have the 'sum' combiner. + * dnn_feature_columns: An iterable containing all the feature columns used + by the DNN model. + * dnn_optimizer: string, `Optimizer` object, or callable that defines the + optimizer to use for training the DNN model. + * dnn_hidden_units: List of hidden units per DNN layer. + * dnn_activation_fn: Activation function applied to each DNN layer. If + `None`, will use `tf.nn.relu`. + * dnn_dropout: When not `None`, the probability we will drop out a given + DNN coordinate. + * gradient_clip_norm: A float > 0. If provided, gradients are + clipped to their global norm with this clipping ratio. 
+ * num_ps_replicas: The number of parameter server replicas. + + Returns: + `estimator.ModelFnOps` + + Raises: + ValueError: If both `linear_feature_columns` and `dnn_features_columns` + are empty at the same time. + """ + head = params["head"] + linear_feature_columns = params.get("linear_feature_columns") + linear_optimizer = params.get("linear_optimizer") + joint_linear_weights = params.get("joint_linear_weights") + dnn_feature_columns = params.get("dnn_feature_columns") + dnn_optimizer = params.get("dnn_optimizer") + dnn_hidden_units = params.get("dnn_hidden_units") + dnn_activation_fn = params.get("dnn_activation_fn") + dnn_dropout = params.get("dnn_dropout") + gradient_clip_norm = params.get("gradient_clip_norm") + num_ps_replicas = params["num_ps_replicas"] + + if not linear_feature_columns and not dnn_feature_columns: + raise ValueError( + "Either linear_feature_columns or dnn_feature_columns must be defined.") + + features = _get_feature_dict(features) + + # Build DNN Logits. + dnn_parent_scope = "dnn" + + if not dnn_feature_columns: + dnn_logits = None + else: + input_layer_partitioner = ( + partitioned_variables.min_max_variable_partitioner( + max_partitions=num_ps_replicas, + min_slice_size=64 << 20)) + with variable_scope.variable_scope( + dnn_parent_scope + "/input_from_feature_columns", + values=features.values(), + partitioner=input_layer_partitioner) as scope: + net = layers.input_from_feature_columns( + columns_to_tensors=features, + feature_columns=dnn_feature_columns, + weight_collections=[dnn_parent_scope], + scope=scope) + + hidden_layer_partitioner = ( + partitioned_variables.min_max_variable_partitioner( + max_partitions=num_ps_replicas)) + for layer_id, num_hidden_units in enumerate(dnn_hidden_units): + with variable_scope.variable_scope( + dnn_parent_scope + "/hiddenlayer_%d" % layer_id, + values=[net], + partitioner=hidden_layer_partitioner) as scope: + net = layers.fully_connected( + net, + num_hidden_units, + activation_fn=dnn_activation_fn, + variables_collections=[dnn_parent_scope], + scope=scope) + if dnn_dropout is not None and mode == estimator.ModeKeys.TRAIN: + net = layers.dropout( + net, + keep_prob=(1.0 - dnn_dropout)) + # TODO(b/31209633): Consider adding summary before dropout. + _add_hidden_layer_summary(net, scope.name) + + with variable_scope.variable_scope( + dnn_parent_scope + "/logits", + values=[net], + partitioner=hidden_layer_partitioner) as scope: + dnn_logits = layers.fully_connected( + net, + head.logits_dimension, + activation_fn=None, + variables_collections=[dnn_parent_scope], + scope=scope) + _add_hidden_layer_summary(dnn_logits, scope.name) + + # Build Linear logits. 
+ linear_parent_scope = "linear" + + if not linear_feature_columns: + linear_logits = None + else: + linear_partitioner = partitioned_variables.min_max_variable_partitioner( + max_partitions=num_ps_replicas, + min_slice_size=64 << 20) + with variable_scope.variable_scope( + linear_parent_scope, + values=features.values(), + partitioner=linear_partitioner) as scope: + if joint_linear_weights: + linear_logits, _, _ = layers.joint_weighted_sum_from_feature_columns( + columns_to_tensors=features, + feature_columns=linear_feature_columns, + num_outputs=head.logits_dimension, + weight_collections=[linear_parent_scope], + scope=scope) + else: + linear_logits, _, _ = layers.weighted_sum_from_feature_columns( + columns_to_tensors=features, + feature_columns=linear_feature_columns, + num_outputs=head.logits_dimension, + weight_collections=[linear_parent_scope], + scope=scope) + + # Combine logits and build full model. + if dnn_logits is not None and linear_logits is not None: + logits = dnn_logits + linear_logits + elif dnn_logits is not None: + logits = dnn_logits + else: + logits = linear_logits + + def _make_training_op(training_loss): + """Training op for the DNN linear combined model.""" + train_ops = [] + if dnn_logits is not None: + train_ops.append( + optimizers.optimize_loss( + loss=training_loss, + global_step=contrib_variables.get_global_step(), + learning_rate=_DNN_LEARNING_RATE, + optimizer=_get_optimizer(dnn_optimizer), + clip_gradients=gradient_clip_norm, + variables=ops.get_collection(dnn_parent_scope), + name=dnn_parent_scope, + # Empty summaries, because head already logs "loss" summary. + summaries=[])) + if linear_logits is not None: + train_ops.append( + optimizers.optimize_loss( + loss=training_loss, + global_step=contrib_variables.get_global_step(), + learning_rate=_linear_learning_rate(len(linear_feature_columns)), + optimizer=_get_optimizer(linear_optimizer), + clip_gradients=gradient_clip_norm, + variables=ops.get_collection(linear_parent_scope), + name=linear_parent_scope, + # Empty summaries, because head already logs "loss" summary. + summaries=[])) + + return control_flow_ops.group(*train_ops) + + return head.head_ops( + features, labels, mode, _make_training_op, logits=logits) + + +class DNNLinearCombinedClassifier(evaluable.Evaluable, trainable.Trainable): """A classifier for TensorFlow Linear and DNN joined training models. Example: @@ -423,30 +663,71 @@ class DNNLinearCombinedClassifier(_DNNLinearCombinedBaseEstimator): ValueError: If both `linear_feature_columns` and `dnn_features_columns` are empty at the same time. """ - if n_classes < 2: raise ValueError("n_classes should be greater than 1. 
Given: {}".format( n_classes)) + self._linear_optimizer = linear_optimizer or "Ftrl" + linear_feature_columns = linear_feature_columns or [] + dnn_feature_columns = dnn_feature_columns or [] + self._feature_columns = linear_feature_columns + dnn_feature_columns + if not self._feature_columns: + raise ValueError("Either linear_feature_columns or dnn_feature_columns " + "must be defined.") + self._dnn_hidden_units = dnn_hidden_units + self._enable_centered_bias = enable_centered_bias + head = head_lib._multi_class_head( # pylint: disable=protected-access n_classes=n_classes, weight_column_name=weight_column_name, enable_centered_bias=enable_centered_bias) - super(DNNLinearCombinedClassifier, self).__init__( + self._estimator = estimator.Estimator( + model_fn=_dnn_linear_combined_model_fn, model_dir=model_dir, - linear_feature_columns=linear_feature_columns, - linear_optimizer=linear_optimizer, - _joint_linear_weights=_joint_linear_weights, - dnn_feature_columns=dnn_feature_columns, - dnn_optimizer=dnn_optimizer, - dnn_hidden_units=dnn_hidden_units, - dnn_activation_fn=dnn_activation_fn, - dnn_dropout=dnn_dropout, - gradient_clip_norm=gradient_clip_norm, - head=head, config=config, - feature_engineering_fn=feature_engineering_fn, - default_prediction_key=head_lib.PredictionKey.CLASSES, - enable_centered_bias=enable_centered_bias) + params={ + "head": head, + "linear_feature_columns": linear_feature_columns, + "linear_optimizer": self._linear_optimizer, + "joint_linear_weights": _joint_linear_weights, + "dnn_feature_columns": dnn_feature_columns, + "dnn_optimizer": dnn_optimizer or "Adagrad", + "dnn_hidden_units": dnn_hidden_units, + "dnn_activation_fn": dnn_activation_fn, + "dnn_dropout": dnn_dropout, + "gradient_clip_norm": gradient_clip_norm, + "num_ps_replicas": config.num_ps_replicas if config else 0, + }, + feature_engineering_fn=feature_engineering_fn) + + def fit(self, x=None, y=None, input_fn=None, steps=None, batch_size=None, + monitors=None, max_steps=None): + """See trainable.Trainable.""" + # TODO(roumposg): Remove when deprecated monitors are removed. + if monitors is not None: + deprecated_monitors = [ + m for m in monitors + if not isinstance(m, session_run_hook.SessionRunHook) + ] + for monitor in deprecated_monitors: + monitor.set_estimator(self) + monitor._lock_estimator() # pylint: disable=protected-access + + result = self._estimator.fit(x=x, y=y, input_fn=input_fn, steps=steps, + batch_size=batch_size, monitors=monitors, + max_steps=max_steps) + + if monitors is not None: + for monitor in deprecated_monitors: + monitor._unlock_estimator() # pylint: disable=protected-access + + return result + + def evaluate(self, x=None, y=None, input_fn=None, feed_fn=None, + batch_size=None, steps=None, metrics=None, name=None): + """See evaluable.Evaluable.""" + return self._estimator.evaluate( + x=x, y=y, input_fn=input_fn, feed_fn=feed_fn, batch_size=batch_size, + steps=steps, metrics=metrics, name=name) @deprecated_arg_values( estimator.AS_ITERABLE_DATE, estimator.AS_ITERABLE_INSTRUCTIONS, @@ -467,12 +748,16 @@ class DNNLinearCombinedClassifier(_DNNLinearCombinedBaseEstimator): Numpy array of predicted classes (or an iterable of predicted classes if as_iterable is True). 
""" - predictions = self.predict_proba( - x=x, input_fn=input_fn, batch_size=batch_size, as_iterable=as_iterable) + key = prediction_key.PredictionKey.CLASSES + preds = self._estimator.predict( + x=x, + input_fn=input_fn, + batch_size=batch_size, + outputs=[key], + as_iterable=as_iterable) if as_iterable: - return (np.argmax(p, axis=0) for p in predictions) - else: - return np.argmax(predictions, axis=1) + return _as_iterable(preds, output=key) + return preds[key].reshape(-1) @deprecated_arg_values( estimator.AS_ITERABLE_DATE, estimator.AS_ITERABLE_INSTRUCTIONS, @@ -494,13 +779,133 @@ class DNNLinearCombinedClassifier(_DNNLinearCombinedBaseEstimator): Numpy array of predicted probabilities (or an iterable of predicted probabilities if as_iterable is True). """ - return super(DNNLinearCombinedClassifier, self).predict( - x=x, input_fn=input_fn, batch_size=batch_size, as_iterable=as_iterable) + key = prediction_key.PredictionKey.PROBABILITIES + preds = self._estimator.predict( + x=x, + input_fn=input_fn, + batch_size=batch_size, + outputs=[key], + as_iterable=as_iterable) + if as_iterable: + return _as_iterable(preds, output=key) + return preds[key] def _get_predict_ops(self, features): - """See base class.""" - return super(DNNLinearCombinedClassifier, self)._get_predict_ops(features)[ - head_lib.PredictionKey.PROBABILITIES] + """See `Estimator` class.""" + # pylint: disable=protected-access + return self._estimator._get_predict_ops(features)[ + prediction_key.PredictionKey.PROBABILITIES] + + def get_variable_names(self): + """Returns list of all variable names in this model. + + Returns: + List of names. + """ + return self._estimator.get_variable_names() + + def get_variable_value(self, name): + """Returns value of the variable given by name. + + Args: + name: string, name of the tensor. + + Returns: + `Tensor` object. + """ + return self._estimator.get_variable_value(name) + + def export(self, + export_dir, + input_fn=None, + input_feature_key=None, + use_deprecated_input_fn=True, + signature_fn=None, + default_batch_size=1, + exports_to_keep=None): + """See BasEstimator.export.""" + def default_input_fn(unused_estimator, examples): + return layers.parse_feature_columns_from_examples( + examples, self._feature_columns) + self._estimator.export( + export_dir=export_dir, + input_fn=input_fn or default_input_fn, + input_feature_key=input_feature_key, + use_deprecated_input_fn=use_deprecated_input_fn, + signature_fn=(signature_fn or + export.classification_signature_fn_with_prob), + prediction_key=prediction_key.PredictionKey.PROBABILITIES, + default_batch_size=default_batch_size, + exports_to_keep=exports_to_keep) + + @property + def model_dir(self): + return self._estimator.model_dir + + @property + @deprecated("2016-10-30", + "This method will be removed after the deprecation date. " + "To inspect variables, use get_variable_names() and " + "get_variable_value().") + def dnn_weights_(self): + hiddenlayer_weights = [ + self.get_variable_value("dnn/hiddenlayer_%d/weights" % i) + for i, _ in enumerate(self._dnn_hidden_units) + ] + logits_weights = [self.get_variable_value("dnn/logits/weights")] + return hiddenlayer_weights + logits_weights + + @property + @deprecated("2016-10-30", + "This method will be removed after the deprecation date. 
" + "To inspect variables, use get_variable_names() and " + "get_variable_value().") + def linear_weights_(self): + values = {} + if isinstance(self._linear_optimizer, str): + optimizer_name = self._linear_optimizer + else: + optimizer_name = self._linear_optimizer.get_name() + optimizer_regex = r".*/"+optimizer_name + r"(_\d)?$" + for name in self.get_variable_names(): + if (name.startswith("linear/") and + name != "linear/bias_weight" and + name != "linear/learning_rate" and + not re.match(optimizer_regex, name)): + values[name] = self.get_variable_value(name) + if len(values) == 1: + return values[list(values.keys())[0]] + return values + + @property + @deprecated("2016-10-30", + "This method will be removed after the deprecation date. " + "To inspect variables, use get_variable_names() and " + "get_variable_value().") + def dnn_bias_(self): + hiddenlayer_bias = [self.get_variable_value("dnn/hiddenlayer_%d/biases" % i) + for i, _ in enumerate(self._dnn_hidden_units)] + logits_bias = [self.get_variable_value("dnn/logits/biases")] + if not self._enable_centered_bias: + return hiddenlayer_bias + logits_bias + centered_bias = [self.get_variable_value(_CENTERED_BIAS_WEIGHT)] + return hiddenlayer_bias + logits_bias + centered_bias + + @property + @deprecated("2016-10-30", + "This method will be removed after the deprecation date. " + "To inspect variables, use get_variable_names() and " + "get_variable_value().") + def linear_bias_(self): + linear_bias = self.get_variable_value("linear/bias_weight") + if not self._enable_centered_bias: + return linear_bias + centered_bias = [self.get_variable_value(_CENTERED_BIAS_WEIGHT)] + return linear_bias + centered_bias + + @property + def config(self): + return self._estimator.config class DNNLinearCombinedRegressor(_DNNLinearCombinedBaseEstimator): @@ -642,12 +1047,11 @@ class DNNLinearCombinedRegressor(_DNNLinearCombinedBaseEstimator): head=head, config=config, feature_engineering_fn=feature_engineering_fn, - default_prediction_key=head_lib.PredictionKey.SCORES, + default_prediction_key=prediction_key.PredictionKey.SCORES, enable_centered_bias=enable_centered_bias) def _get_predict_ops(self, features): """See base class.""" - return super(DNNLinearCombinedRegressor, self)._get_predict_ops(features)[ - head_lib.PredictionKey.SCORES] - - + return super( + DNNLinearCombinedRegressor, + self)._get_predict_ops(features)[prediction_key.PredictionKey.SCORES] diff --git a/tensorflow/contrib/learn/python/learn/estimators/dnn_linear_combined_test.py b/tensorflow/contrib/learn/python/learn/estimators/dnn_linear_combined_test.py index ad574f0790e..dae1879646f 100644 --- a/tensorflow/contrib/learn/python/learn/estimators/dnn_linear_combined_test.py +++ b/tensorflow/contrib/learn/python/learn/estimators/dnn_linear_combined_test.py @@ -27,6 +27,7 @@ import tensorflow as tf from tensorflow.contrib.learn.python.learn.estimators import _sklearn from tensorflow.contrib.learn.python.learn.estimators import estimator_test_utils +from tensorflow.contrib.learn.python.learn.metric_spec import MetricSpec def _get_quantile_based_buckets(feature_values, num_buckets): @@ -65,6 +66,15 @@ class DNNLinearCombinedClassifierTest(tf.test.TestCase): estimator_test_utils.assert_estimator_contract( self, tf.contrib.learn.DNNLinearCombinedClassifier) + def testNoFeatureColumns(self): + with self.assertRaisesRegexp( + ValueError, + 'Either linear_feature_columns or dnn_feature_columns must be defined'): + tf.contrib.learn.DNNLinearCombinedClassifier( + linear_feature_columns=None, + 
dnn_feature_columns=None, + dnn_hidden_units=[3, 3]) + def testLogisticRegression_MatrixData(self): """Tests binary classification using matrix data as input.""" iris = _prepare_iris_data_for_logistic_regression() @@ -80,6 +90,7 @@ class DNNLinearCombinedClassifierTest(tf.test.TestCase): classifier.fit(input_fn=_iris_input_logistic_fn, steps=100) scores = classifier.evaluate(input_fn=_iris_input_logistic_fn, steps=100) + self.assertIn('auc', scores.keys()) self.assertGreater(scores['accuracy'], 0.9) def testLogisticRegression_TensorData(self): @@ -120,6 +131,7 @@ class DNNLinearCombinedClassifierTest(tf.test.TestCase): classifier.fit(input_fn=_input_fn, steps=100) scores = classifier.evaluate(input_fn=_input_fn, steps=100) + self.assertIn('auc', scores.keys()) self.assertGreater(scores['accuracy'], 0.9) def testTrainWithPartitionedVariables(self): @@ -397,9 +409,15 @@ class DNNLinearCombinedClassifierTest(tf.test.TestCase): input_fn=_input_fn, steps=100, metrics={ - 'my_accuracy': tf.contrib.metrics.streaming_accuracy, - ('my_precision', 'classes'): tf.contrib.metrics.streaming_precision, - ('my_metric', 'probabilities'): _my_metric_op + 'my_accuracy': MetricSpec( + metric_fn=tf.contrib.metrics.streaming_accuracy, + prediction_key='classes'), + 'my_precision': MetricSpec( + metric_fn=tf.contrib.metrics.streaming_precision, + prediction_key='classes'), + 'my_metric': MetricSpec( + metric_fn=_my_metric_op, + prediction_key='probabilities') }) self.assertTrue( set(['loss', 'my_accuracy', 'my_precision', 'my_metric' @@ -412,7 +430,7 @@ class DNNLinearCombinedClassifierTest(tf.test.TestCase): # Test the case where the 2nd element of the key is neither "classes" nor # "probabilities". - with self.assertRaises(KeyError): + with self.assertRaisesRegexp(KeyError, 'bad_type'): classifier.evaluate( input_fn=_input_fn, steps=100, @@ -428,6 +446,17 @@ class DNNLinearCombinedClassifierTest(tf.test.TestCase): tf.contrib.metrics.streaming_accuracy }) + # Test the case where the prediction_key is neither "classes" nor + # "probabilities". 
+ with self.assertRaisesRegexp(KeyError, 'bad_type'): + classifier.evaluate( + input_fn=_input_fn, + steps=100, + metrics={ + 'bad_name': MetricSpec( + metric_fn=tf.contrib.metrics.streaming_auc, + prediction_key='bad_type')}) + def testVariableQuery(self): """Tests bias is centered or not.""" def _input_fn_train(): @@ -447,6 +476,39 @@ class DNNLinearCombinedClassifierTest(tf.test.TestCase): for name in var_names: classifier.get_variable_value(name) + def testExport(self): + """Tests export model for servo.""" + + def input_fn(): + return { + 'age': tf.constant([1]), + 'language': tf.SparseTensor(values=['english'], + indices=[[0, 0]], + shape=[1, 1]) + }, tf.constant([[1]]) + + language = tf.contrib.layers.sparse_column_with_hash_bucket('language', 100) + + classifier = tf.contrib.learn.DNNLinearCombinedClassifier( + linear_feature_columns=[ + tf.contrib.layers.real_valued_column('age'), + language, + ], + dnn_feature_columns=[ + tf.contrib.layers.embedding_column(language, dimension=1), + ], + dnn_hidden_units=[3, 3]) + classifier.fit(input_fn=input_fn, steps=100) + + export_dir = tempfile.mkdtemp() + input_feature_key = 'examples' + def serving_input_fn(): + features, targets = input_fn() + features[input_feature_key] = tf.placeholder(tf.string) + return features, targets + classifier.export(export_dir, serving_input_fn, input_feature_key, + use_deprecated_input_fn=False) + def testCenteredBias(self): """Tests bias is centered or not.""" def _input_fn_train(): @@ -461,7 +523,7 @@ class DNNLinearCombinedClassifierTest(tf.test.TestCase): dnn_hidden_units=[3, 3], enable_centered_bias=True) - classifier.fit(input_fn=_input_fn_train, steps=500) + classifier.fit(input_fn=_input_fn_train, steps=1000) # logodds(0.75) = 1.09861228867 self.assertAlmostEqual( 1.0986, @@ -483,7 +545,7 @@ class DNNLinearCombinedClassifierTest(tf.test.TestCase): enable_centered_bias=False) classifier.fit(input_fn=_input_fn_train, steps=500) - self.assertFalse('centered_bias_weight' in classifier.get_variable_names()) + self.assertNotIn('centered_bias_weight', classifier.get_variable_names()) def testLinearOnly(self): """Tests that linear-only instantiation works.""" @@ -822,6 +884,44 @@ class DNNLinearCombinedRegressorTest(tf.test.TestCase): metrics={('my_error', 'predictions' ): tf.contrib.metrics.streaming_mean_squared_error}) + def testExport(self): + """Tests export model for servo.""" + labels = [1., 0., 0.2] + def _input_fn(num_epochs=None): + features = { + 'age': tf.train.limit_epochs(tf.constant([[0.8], [0.15], [0.]]), + num_epochs=num_epochs), + 'language': tf.SparseTensor(values=['en', 'fr', 'zh'], + indices=[[0, 0], [0, 1], [2, 0]], + shape=[3, 2]) + } + return features, tf.constant(labels, dtype=tf.float32) + + language_column = tf.contrib.layers.sparse_column_with_hash_bucket( + 'language', hash_bucket_size=20) + + regressor = tf.contrib.learn.DNNLinearCombinedRegressor( + linear_feature_columns=[ + language_column, + tf.contrib.layers.real_valued_column('age') + ], + dnn_feature_columns=[ + tf.contrib.layers.embedding_column(language_column, dimension=1), + ], + dnn_hidden_units=[3, 3], + config=tf.contrib.learn.RunConfig(tf_random_seed=1)) + + regressor.fit(input_fn=_input_fn, steps=100) + + export_dir = tempfile.mkdtemp() + input_feature_key = 'examples' + def serving_input_fn(): + features, targets = _input_fn() + features[input_feature_key] = tf.placeholder(tf.string) + return features, targets + regressor.export(export_dir, serving_input_fn, input_feature_key, + use_deprecated_input_fn=False) + 
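The two new `testExport` cases exercise the non-deprecated export path: the caller trains as usual, then hands `export()` a `serving_input_fn` that reuses the training features and adds a string placeholder under `input_feature_key` for serialized `tf.Example` protos. A condensed sketch of the same calling pattern, with a single illustrative feature (the dataset and names are not from the patch):

```python
import tempfile
import tensorflow as tf


def input_fn():
  # Tiny constant dataset; illustrative only.
  return {'age': tf.constant([[18.0], [35.0]])}, tf.constant([[0], [1]])

age = tf.contrib.layers.real_valued_column('age')
classifier = tf.contrib.learn.DNNLinearCombinedClassifier(
    linear_feature_columns=[age],
    dnn_feature_columns=[age],
    dnn_hidden_units=[3, 3])
classifier.fit(input_fn=input_fn, steps=5)

input_feature_key = 'examples'

def serving_input_fn():
  # Serving-time graph: reuse the training features and add a string
  # placeholder keyed by input_feature_key for serialized tf.Examples.
  features, labels = input_fn()
  features[input_feature_key] = tf.placeholder(tf.string)
  return features, labels

export_dir = tempfile.mkdtemp()
classifier.export(export_dir, serving_input_fn, input_feature_key,
                  use_deprecated_input_fn=False)
```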
def testTrainSaveLoad(self): """Tests regression with restarting training / evaluate.""" def _input_fn(num_epochs=None): @@ -1009,7 +1109,7 @@ class FeatureEngineeringFunctionTest(tf.test.TestCase): config=tf.contrib.learn.RunConfig(tf_random_seed=1)) estimator_without_fe_fn.fit(input_fn=input_fn, steps=100) - # predictions = y + # predictions = y prediction_with_fe_fn = next( estimator_with_fe_fn.predict(input_fn=input_fn, as_iterable=True)) self.assertAlmostEqual(1000., prediction_with_fe_fn, delta=1.0) diff --git a/tensorflow/contrib/learn/python/learn/estimators/estimator.py b/tensorflow/contrib/learn/python/learn/estimators/estimator.py index 145bdcf2ee8..c9d1377ce73 100644 --- a/tensorflow/contrib/learn/python/learn/estimators/estimator.py +++ b/tensorflow/contrib/learn/python/learn/estimators/estimator.py @@ -45,6 +45,7 @@ from tensorflow.contrib.learn.python.learn import metric_spec from tensorflow.contrib.learn.python.learn import monitors as monitor_lib from tensorflow.contrib.learn.python.learn import trainable from tensorflow.contrib.learn.python.learn.estimators import _sklearn as sklearn +from tensorflow.contrib.learn.python.learn.estimators import metric_key from tensorflow.contrib.learn.python.learn.estimators import run_config from tensorflow.contrib.learn.python.learn.estimators import tensor_signature from tensorflow.contrib.learn.python.learn.estimators._sklearn import NotFittedError @@ -1108,8 +1109,9 @@ class Estimator(BaseEstimator): result = _make_metrics_ops(all_metrics, features, labels, model_fn_ops.predictions) - if 'loss' not in result: - result['loss'] = metrics_lib.streaming_mean(model_fn_ops.loss) + if metric_key.MetricKey.LOSS not in result: + result[metric_key.MetricKey.LOSS] = metrics_lib.streaming_mean( + model_fn_ops.loss) return result def _get_predict_ops(self, features): diff --git a/tensorflow/contrib/learn/python/learn/estimators/head.py b/tensorflow/contrib/learn/python/learn/estimators/head.py index 6bc0ba871f2..77e3067bbde 100644 --- a/tensorflow/contrib/learn/python/learn/estimators/head.py +++ b/tensorflow/contrib/learn/python/learn/estimators/head.py @@ -24,9 +24,12 @@ from tensorflow.contrib import losses from tensorflow.contrib import metrics as metrics_lib from tensorflow.contrib.learn.python.learn import metric_spec from tensorflow.contrib.learn.python.learn.estimators import estimator +from tensorflow.contrib.learn.python.learn.estimators import metric_key +from tensorflow.contrib.learn.python.learn.estimators import prediction_key from tensorflow.contrib.session_bundle import exporter from tensorflow.python import summary from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import control_flow_ops from tensorflow.python.ops import math_ops @@ -387,17 +390,17 @@ class _RegressionHead(_Head): def _logits_to_prediction(self, logits=None): predictions = {} if self.logits_dimension == 1: - predictions[PredictionKey.SCORES] = array_ops.squeeze( + predictions[prediction_key.PredictionKey.SCORES] = array_ops.squeeze( logits, squeeze_dims=[1]) else: - predictions[PredictionKey.SCORES] = logits + predictions[prediction_key.PredictionKey.SCORES] = logits return predictions # pylint: disable=undefined-variable def _create_signature_fn(self): def _regression_signature_fn(examples, unused_features, predictions): if isinstance(predictions, dict): - score = predictions[PredictionKey.SCORES] + score = 
predictions[prediction_key.PredictionKey.SCORES] else: score = predictions @@ -408,11 +411,12 @@ class _RegressionHead(_Head): return _regression_signature_fn def _default_metric(self): - return {_head_prefixed(self._head_name, MetricKey.LOSS): - _weighted_average_loss_metric_spec(self._eval_loss_fn, - PredictionKey.SCORES, - self._label_name, - self._weight_column_name)} + return {_head_prefixed(self._head_name, metric_key.MetricKey.LOSS): + _weighted_average_loss_metric_spec( + self._eval_loss_fn, + prediction_key.PredictionKey.SCORES, + self._label_name, + self._weight_column_name)} class _MultiClassHead(_Head): @@ -529,12 +533,16 @@ class _MultiClassHead(_Head): return self._logits_to_prediction(logits) def _logits_to_prediction(self, logits=None): - predictions = {PredictionKey.LOGITS: logits} + # pylint: disable=missing-docstring + predictions = {prediction_key.PredictionKey.LOGITS: logits} if self.logits_dimension == 1: - predictions[PredictionKey.LOGISTIC] = math_ops.sigmoid(logits) + predictions[prediction_key.PredictionKey.LOGISTIC] = math_ops.sigmoid( + logits) logits = array_ops.concat(1, [array_ops.zeros_like(logits), logits]) - predictions[PredictionKey.PROBABILITIES] = nn.softmax(logits) - predictions[PredictionKey.CLASSES] = math_ops.argmax(logits, 1) + predictions[prediction_key.PredictionKey.PROBABILITIES] = nn.softmax( + logits) + predictions[prediction_key.PredictionKey.CLASSES] = math_ops.argmax( + logits, 1) return predictions @@ -545,8 +553,9 @@ class _MultiClassHead(_Head): if isinstance(predictions, dict): default_signature = exporter.classification_signature( input_tensor=examples, - classes_tensor=predictions[PredictionKey.CLASSES], - scores_tensor=predictions[PredictionKey.PROBABILITIES]) + classes_tensor=predictions[prediction_key.PredictionKey.CLASSES], + scores_tensor=predictions[ + prediction_key.PredictionKey.PROBABILITIES]) else: default_signature = exporter.classification_signature( input_tensor=examples, @@ -557,44 +566,49 @@ class _MultiClassHead(_Head): return _classification_signature_fn def _default_metric(self): - metrics = {_head_prefixed(self._head_name, MetricKey.LOSS): - _weighted_average_loss_metric_spec(self._eval_loss_fn, - PredictionKey.LOGITS, - self._label_name, - self._weight_column_name)} + metrics = {_head_prefixed(self._head_name, metric_key.MetricKey.LOSS): + _weighted_average_loss_metric_spec( + self._eval_loss_fn, + prediction_key.PredictionKey.LOGITS, + self._label_name, + self._weight_column_name)} # TODO(b/29366811): This currently results in both an "accuracy" and an # "accuracy/threshold_0.500000_mean" metric for binary classification. 
- metrics[_head_prefixed(self._head_name, MetricKey.ACCURACY)] = ( + metrics[_head_prefixed(self._head_name, metric_key.MetricKey.ACCURACY)] = ( metric_spec.MetricSpec(metrics_lib.streaming_accuracy, - PredictionKey.CLASSES, self._label_name, + prediction_key.PredictionKey.CLASSES, + self._label_name, self._weight_column_name)) if self.logits_dimension == 1: - def _add_binary_metric(metric_key, metric_fn): - metrics[_head_prefixed(self._head_name, metric_key)] = ( + def _add_binary_metric(key, metric_fn): + metrics[_head_prefixed(self._head_name, key)] = ( metric_spec.MetricSpec(metric_fn, - PredictionKey.LOGISTIC, + prediction_key.PredictionKey.LOGISTIC, self._label_name, self._weight_column_name)) - _add_binary_metric(MetricKey.PREDICTION_MEAN, _predictions_streaming_mean) - _add_binary_metric(MetricKey.LABEL_MEAN, _labels_streaming_mean) + _add_binary_metric( + metric_key.MetricKey.PREDICTION_MEAN, _predictions_streaming_mean) + _add_binary_metric( + metric_key.MetricKey.LABEL_MEAN, _labels_streaming_mean) # Also include the streaming mean of the label as an accuracy baseline, as # a reminder to users. - _add_binary_metric(MetricKey.ACCURACY_BASELINE, _labels_streaming_mean) + _add_binary_metric( + metric_key.MetricKey.ACCURACY_BASELINE, _labels_streaming_mean) - _add_binary_metric(MetricKey.AUC, _streaming_auc) + _add_binary_metric(metric_key.MetricKey.AUC, _streaming_auc) for threshold in self._thresholds: - _add_binary_metric(MetricKey.ACCURACY_MEAN % threshold, + _add_binary_metric(metric_key.MetricKey.ACCURACY_MEAN % threshold, _accuracy_at_threshold(threshold)) # Precision for positive examples. - _add_binary_metric(MetricKey.PRECISION_MEAN % threshold, + _add_binary_metric(metric_key.MetricKey.PRECISION_MEAN % threshold, _streaming_at_threshold( metrics_lib.streaming_precision_at_thresholds, threshold),) # Recall for positive examples. 
- _add_binary_metric(MetricKey.RECALL_MEAN % threshold, + _add_binary_metric(metric_key.MetricKey.RECALL_MEAN % threshold, _streaming_at_threshold( metrics_lib.streaming_recall_at_thresholds, threshold)) @@ -603,7 +617,7 @@ class _MultiClassHead(_Head): def _check_labels(labels, label_name): labels = labels[label_name] if isinstance(labels, dict) else labels - if isinstance(labels, ops.SparseTensor): + if isinstance(labels, sparse_tensor.SparseTensor): raise ValueError("SparseTensor is not supported as labels.") return labels @@ -634,21 +648,24 @@ class _BinarySvmHead(_MultiClassHead): def _logits_to_prediction(self, logits=None): predictions = {} - predictions[PredictionKey.LOGITS] = logits + predictions[prediction_key.PredictionKey.LOGITS] = logits logits = array_ops.concat(1, [array_ops.zeros_like(logits), logits]) - predictions[PredictionKey.CLASSES] = math_ops.argmax(logits, 1) + predictions[prediction_key.PredictionKey.CLASSES] = math_ops.argmax( + logits, 1) return predictions def _default_metric(self): - metrics = {_head_prefixed(self._head_name, MetricKey.LOSS): - _weighted_average_loss_metric_spec(self._eval_loss_fn, - PredictionKey.LOGITS, - self._label_name, - self._weight_column_name)} - metrics[_head_prefixed(self._head_name, MetricKey.ACCURACY)] = ( + metrics = {_head_prefixed(self._head_name, metric_key.MetricKey.LOSS): + _weighted_average_loss_metric_spec( + self._eval_loss_fn, + prediction_key.PredictionKey.LOGITS, + self._label_name, + self._weight_column_name)} + metrics[_head_prefixed(self._head_name, metric_key.MetricKey.ACCURACY)] = ( metric_spec.MetricSpec(metrics_lib.streaming_accuracy, - PredictionKey.CLASSES, self._label_name, + prediction_key.PredictionKey.CLASSES, + self._label_name, self._weight_column_name)) # TODO(sibyl-vie3Poto): add more metrics relevant for svms. 
return metrics @@ -673,12 +690,14 @@ class _MultiLabelHead(_MultiClassHead): thresholds=thresholds) def _logits_to_prediction(self, logits=None): - predictions = {PredictionKey.LOGITS: logits} + predictions = {prediction_key.PredictionKey.LOGITS: logits} if self.logits_dimension == 1: - predictions[PredictionKey.LOGISTIC] = math_ops.sigmoid(logits) + predictions[prediction_key.PredictionKey.LOGISTIC] = math_ops.sigmoid( + logits) logits = array_ops.concat(1, [array_ops.zeros_like(logits), logits]) - predictions[PredictionKey.PROBABILITIES] = math_ops.sigmoid(logits) - predictions[PredictionKey.CLASSES] = math_ops.to_int64( + predictions[prediction_key.PredictionKey.PROBABILITIES] = math_ops.sigmoid( + logits) + predictions[prediction_key.PredictionKey.CLASSES] = math_ops.to_int64( math_ops.greater(logits, 0)) return predictions @@ -848,23 +867,3 @@ def _streaming_at_threshold(streaming_metrics_fn, threshold): return array_ops.squeeze(precision_tensor), update_op return _streaming_metrics - - -class PredictionKey(object): - CLASSES = "classes" - PROBABILITIES = "probabilities" - LOGITS = "logits" - LOGISTIC = "logistic" - SCORES = "scores" - - -class MetricKey(object): - LOSS = "loss" - AUC = "auc" - PREDICTION_MEAN = "labels/prediction_mean" - LABEL_MEAN = "labels/actual_label_mean" - ACCURACY = "accuracy" - ACCURACY_BASELINE = "accuracy/baseline_label_mean" - ACCURACY_MEAN = "accuracy/threshold_%f_mean" - PRECISION_MEAN = "precision/positive_threshold_%f_mean" - RECALL_MEAN = "recall/positive_threshold_%f_mean" diff --git a/tensorflow/contrib/learn/python/learn/estimators/head_test.py b/tensorflow/contrib/learn/python/learn/estimators/head_test.py index 5e57ae58b87..865acc0a276 100644 --- a/tensorflow/contrib/learn/python/learn/estimators/head_test.py +++ b/tensorflow/contrib/learn/python/learn/estimators/head_test.py @@ -74,7 +74,7 @@ class MultiClassModelHeadTest(tf.test.TestCase): model_fn_ops = head.head_ops({}, labels, tf.contrib.learn.ModeKeys.TRAIN, _noop_train_op, logits=logits) - self.assertAlmostEqual(.81326163, sess.run(model_fn_ops.loss)) + self.assertAlmostEqual(0.81326175, sess.run(model_fn_ops.loss)) def testErrorInSparseTensorLabels(self): head = head_lib._multi_class_head(n_classes=2) diff --git a/tensorflow/contrib/learn/python/learn/estimators/linear.py b/tensorflow/contrib/learn/python/learn/estimators/linear.py index 4e25b12feb6..8d887f20c5e 100644 --- a/tensorflow/contrib/learn/python/learn/estimators/linear.py +++ b/tensorflow/contrib/learn/python/learn/estimators/linear.py @@ -32,6 +32,7 @@ from tensorflow.contrib.learn.python.learn import evaluable from tensorflow.contrib.learn.python.learn import trainable from tensorflow.contrib.learn.python.learn.estimators import estimator from tensorflow.contrib.learn.python.learn.estimators import head as head_lib +from tensorflow.contrib.learn.python.learn.estimators import prediction_key from tensorflow.contrib.learn.python.learn.utils import export from tensorflow.contrib.linear_optimizer.python import sdca_optimizer from tensorflow.python.framework import dtypes @@ -267,21 +268,18 @@ class LinearClassifier(evaluable.Evaluable, trainable.Trainable): Example: ```python - education = sparse_column_with_hash_bucket(column_name="education", - hash_bucket_size=1000) - occupation = sparse_column_with_hash_bucket(column_name="occupation", - hash_bucket_size=1000) + sparse_column_a = sparse_column_with_hash_bucket(...) + sparse_column_b = sparse_column_with_hash_bucket(...) 
- education_x_occupation = crossed_column(columns=[education, occupation], - hash_bucket_size=10000) + sparse_feature_a_x_sparse_feature_b = crossed_column(...) # Estimator using the default optimizer. estimator = LinearClassifier( - feature_columns=[occupation, education_x_occupation]) + feature_columns=[sparse_column_a, sparse_feature_a_x_sparse_feature_b]) # Or estimator using the FTRL optimizer with regularization. estimator = LinearClassifier( - feature_columns=[occupation, education_x_occupation], + feature_columns=[sparse_column_a, sparse_feature_a_x_sparse_feature_b], optimizer=tf.train.FtrlOptimizer( learning_rate=0.1, l1_regularization_strength=0.001 @@ -289,7 +287,7 @@ class LinearClassifier(evaluable.Evaluable, trainable.Trainable): # Or estimator using the SDCAOptimizer. estimator = LinearClassifier( - feature_columns=[occupation, education_x_occupation], + feature_columns=[sparse_column_a, sparse_feature_a_x_sparse_feature_b], optimizer=tf.contrib.linear_optimizer.SDCAOptimizer( example_id_column='example_id', num_loss_partitions=..., @@ -465,13 +463,16 @@ class LinearClassifier(evaluable.Evaluable, trainable.Trainable): as_iterable=False) def predict(self, x=None, input_fn=None, batch_size=None, as_iterable=True): """Runs inference to determine the predicted class.""" - preds = self._estimator.predict(x=x, input_fn=input_fn, - batch_size=batch_size, - outputs=[head_lib.PredictionKey.CLASSES], - as_iterable=as_iterable) + key = prediction_key.PredictionKey.CLASSES + preds = self._estimator.predict( + x=x, + input_fn=input_fn, + batch_size=batch_size, + outputs=[key], + as_iterable=as_iterable) if as_iterable: - return _as_iterable(preds, output=head_lib.PredictionKey.CLASSES) - return preds[head_lib.PredictionKey.CLASSES] + return _as_iterable(preds, output=key) + return preds[key] @deprecated_arg_values( estimator.AS_ITERABLE_DATE, estimator.AS_ITERABLE_INSTRUCTIONS, @@ -479,14 +480,16 @@ class LinearClassifier(evaluable.Evaluable, trainable.Trainable): def predict_proba(self, x=None, input_fn=None, batch_size=None, outputs=None, as_iterable=True): """Runs inference to determine the class probability predictions.""" - preds = self._estimator.predict(x=x, input_fn=input_fn, - batch_size=batch_size, - outputs=[ - head_lib.PredictionKey.PROBABILITIES], - as_iterable=as_iterable) + key = prediction_key.PredictionKey.PROBABILITIES + preds = self._estimator.predict( + x=x, + input_fn=input_fn, + batch_size=batch_size, + outputs=[key], + as_iterable=as_iterable) if as_iterable: - return _as_iterable(preds, output=head_lib.PredictionKey.PROBABILITIES) - return preds[head_lib.PredictionKey.PROBABILITIES] + return _as_iterable(preds, output=key) + return preds[key] def get_variable_names(self): return self._estimator.get_variable_names() @@ -512,9 +515,9 @@ class LinearClassifier(evaluable.Evaluable, trainable.Trainable): input_fn=input_fn or default_input_fn, input_feature_key=input_feature_key, use_deprecated_input_fn=use_deprecated_input_fn, - signature_fn=( - signature_fn or export.classification_signature_fn_with_prob), - prediction_key=head_lib.PredictionKey.PROBABILITIES, + signature_fn=(signature_fn or + export.classification_signature_fn_with_prob), + prediction_key=prediction_key.PredictionKey.PROBABILITIES, default_batch_size=default_batch_size, exports_to_keep=exports_to_keep) @@ -561,16 +564,13 @@ class LinearRegressor(evaluable.Evaluable, trainable.Trainable): Example: ```python - education = sparse_column_with_hash_bucket(column_name="education", - 
hash_bucket_size=1000) - occupation = sparse_column_with_hash_bucket(column_name="occupation", - hash_bucket_size=1000) + sparse_column_a = sparse_column_with_hash_bucket(...) + sparse_column_b = sparse_column_with_hash_bucket(...) - education_x_occupation = crossed_column(columns=[education, occupation], - hash_bucket_size=10000) + sparse_feature_a_x_sparse_feature_b = crossed_column(...) estimator = LinearRegressor( - feature_columns=[occupation, education_x_occupation]) + feature_columns=[sparse_column_a, sparse_feature_a_x_sparse_feature_b]) # Input builders def input_fn_train: # returns x, y @@ -731,13 +731,16 @@ class LinearRegressor(evaluable.Evaluable, trainable.Trainable): as_iterable=False) def predict(self, x=None, input_fn=None, batch_size=None, as_iterable=True): """Runs inference to determine the predicted class.""" - preds = self._estimator.predict(x=x, input_fn=input_fn, - batch_size=batch_size, - outputs=[head_lib.PredictionKey.SCORES], - as_iterable=as_iterable) + key = prediction_key.PredictionKey.SCORES + preds = self._estimator.predict( + x=x, + input_fn=input_fn, + batch_size=batch_size, + outputs=[key], + as_iterable=as_iterable) if as_iterable: - return _as_iterable(preds, output=head_lib.PredictionKey.SCORES) - return preds[head_lib.PredictionKey.SCORES] + return _as_iterable(preds, output=key) + return preds[key] def get_variable_names(self): return self._estimator.get_variable_names() @@ -764,7 +767,7 @@ class LinearRegressor(evaluable.Evaluable, trainable.Trainable): input_feature_key=input_feature_key, use_deprecated_input_fn=use_deprecated_input_fn, signature_fn=(signature_fn or export.regression_signature_fn), - prediction_key=head_lib.PredictionKey.SCORES, + prediction_key=prediction_key.PredictionKey.SCORES, default_batch_size=default_batch_size, exports_to_keep=exports_to_keep) diff --git a/tensorflow/contrib/learn/python/learn/estimators/metric_key.py b/tensorflow/contrib/learn/python/learn/estimators/metric_key.py new file mode 100644 index 00000000000..8df08e507fe --- /dev/null +++ b/tensorflow/contrib/learn/python/learn/estimators/metric_key.py @@ -0,0 +1,30 @@ +# Copyright 2016 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+# ============================================================================== +"""Enum for metric keys.""" +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + + +class MetricKey(object): + LOSS = "loss" + AUC = "auc" + PREDICTION_MEAN = "labels/prediction_mean" + LABEL_MEAN = "labels/actual_label_mean" + ACCURACY = "accuracy" + ACCURACY_BASELINE = "accuracy/baseline_label_mean" + ACCURACY_MEAN = "accuracy/threshold_%f_mean" + PRECISION_MEAN = "precision/positive_threshold_%f_mean" + RECALL_MEAN = "recall/positive_threshold_%f_mean" diff --git a/tensorflow/contrib/learn/python/learn/estimators/prediction_key.py b/tensorflow/contrib/learn/python/learn/estimators/prediction_key.py new file mode 100644 index 00000000000..a9c0c329584 --- /dev/null +++ b/tensorflow/contrib/learn/python/learn/estimators/prediction_key.py @@ -0,0 +1,26 @@ +# Copyright 2016 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== +"""Enum for model prediction keys.""" +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + + +class PredictionKey(object): + CLASSES = "classes" + PROBABILITIES = "probabilities" + LOGITS = "logits" + LOGISTIC = "logistic" + SCORES = "scores" diff --git a/tensorflow/contrib/learn/python/learn/estimators/svm.py b/tensorflow/contrib/learn/python/learn/estimators/svm.py index 6fd675e1b8b..0af33baeeb5 100644 --- a/tensorflow/contrib/learn/python/learn/estimators/svm.py +++ b/tensorflow/contrib/learn/python/learn/estimators/svm.py @@ -30,6 +30,7 @@ from tensorflow.contrib.learn.python.learn import trainable from tensorflow.contrib.learn.python.learn.estimators import estimator from tensorflow.contrib.learn.python.learn.estimators import head as head_lib from tensorflow.contrib.learn.python.learn.estimators import linear +from tensorflow.contrib.learn.python.learn.estimators import prediction_key from tensorflow.contrib.linear_optimizer.python import sdca_optimizer @@ -188,13 +189,16 @@ class SVM(trainable.Trainable, evaluable.Evaluable): as_iterable=False) def predict(self, x=None, input_fn=None, batch_size=None, as_iterable=True): """Runs inference to determine the predicted class.""" - preds = self._estimator.predict(x=x, input_fn=input_fn, - batch_size=batch_size, - outputs=[head_lib.PredictionKey.CLASSES], - as_iterable=as_iterable) + key = prediction_key.PredictionKey.CLASSES + preds = self._estimator.predict( + x=x, + input_fn=input_fn, + batch_size=batch_size, + outputs=[key], + as_iterable=as_iterable) if as_iterable: - return _as_iterable(preds, output=head_lib.PredictionKey.CLASSES) - return preds[head_lib.PredictionKey.CLASSES] + return _as_iterable(preds, output=key) + return preds[key] @deprecated_arg_values( estimator.AS_ITERABLE_DATE, estimator.AS_ITERABLE_INSTRUCTIONS, @@ -202,14 +206,16 @@ class SVM(trainable.Trainable, 
evaluable.Evaluable): def predict_proba(self, x=None, input_fn=None, batch_size=None, outputs=None, as_iterable=True): """Runs inference to determine the class probability predictions.""" - preds = self._estimator.predict(x=x, input_fn=input_fn, - batch_size=batch_size, - outputs=[ - head_lib.PredictionKey.PROBABILITIES], - as_iterable=as_iterable) + key = prediction_key.PredictionKey.PROBABILITIES + preds = self._estimator.predict( + x=x, + input_fn=input_fn, + batch_size=batch_size, + outputs=[key], + as_iterable=as_iterable) if as_iterable: - return _as_iterable(preds, output=head_lib.PredictionKey.PROBABILITIES) - return preds[head_lib.PredictionKey.PROBABILITIES] + return _as_iterable(preds, output=key) + return preds[key] # pylint: enable=protected-access def get_variable_names(self): diff --git a/tensorflow/contrib/learn/python/learn/estimators/tensor_signature.py b/tensorflow/contrib/learn/python/learn/estimators/tensor_signature.py index 483ccc9f119..693581dc182 100644 --- a/tensorflow/contrib/learn/python/learn/estimators/tensor_signature.py +++ b/tensorflow/contrib/learn/python/learn/estimators/tensor_signature.py @@ -22,7 +22,7 @@ from __future__ import print_function import collections from tensorflow.python.framework import dtypes -from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.framework import tensor_shape from tensorflow.python.ops import array_ops from tensorflow.python.ops import math_ops @@ -41,7 +41,7 @@ class TensorSignature(collections.namedtuple( """ def __new__(cls, tensor): - if isinstance(tensor, ops.SparseTensor): + if isinstance(tensor, sparse_tensor.SparseTensor): return super(TensorSignature, cls).__new__( cls, dtype=tensor.values.dtype, shape=None, is_sparse=True) return super(TensorSignature, cls).__new__( diff --git a/tensorflow/contrib/learn/python/learn/graph_actions.py b/tensorflow/contrib/learn/python/learn/graph_actions.py index 0c5152b553f..baee707a5f6 100644 --- a/tensorflow/contrib/learn/python/learn/graph_actions.py +++ b/tensorflow/contrib/learn/python/learn/graph_actions.py @@ -40,6 +40,7 @@ from tensorflow.python.framework import ops from tensorflow.python.ops import control_flow_ops from tensorflow.python.ops import data_flow_ops from tensorflow.python.ops import logging_ops +from tensorflow.python.ops import resources from tensorflow.python.ops import variables from tensorflow.python.platform import tf_logging as logging from tensorflow.python.training import basic_session_run_hooks @@ -77,7 +78,8 @@ def get_summary_writer(logdir): def _make_saver(graph, keep_checkpoint_max=5): - vars_to_save = graph.get_collection(ops.GraphKeys.VARIABLES) + vars_to_save = (graph.get_collection(ops.GraphKeys.VARIABLES) + + graph.get_collection(ops.GraphKeys.SAVEABLE_OBJECTS)) if vars_to_save: return tf_saver.Saver(vars_to_save, sharded=True, @@ -846,9 +848,11 @@ def run_feeds_iter(output_dict, feed_dicts, restore_checkpoint_path=None): raise ValueError('feed_dicts is invalid: %s.' 
% feed_dicts) graph = contrib_ops.get_graph_from_inputs(output_dict.values()) - with graph.as_default() as g: with tf_session.Session('') as session: + session.run( + resources.initialize_resources(resources.shared_resources() + + resources.local_resources())) if restore_checkpoint_path: _restore_from_checkpoint(session, g, restore_checkpoint_path) else: diff --git a/tensorflow/contrib/learn/python/learn/graph_actions_test.py b/tensorflow/contrib/learn/python/learn/graph_actions_test.py index 9a7306ad4ad..c8c73d5de52 100644 --- a/tensorflow/contrib/learn/python/learn/graph_actions_test.py +++ b/tensorflow/contrib/learn/python/learn/graph_actions_test.py @@ -28,6 +28,8 @@ from tensorflow.contrib.learn.python import learn from tensorflow.contrib.learn.python.learn.monitors import BaseMonitor from tensorflow.python.framework import meta_graph from tensorflow.python.framework import ops +from tensorflow.python.framework import test_ops +from tensorflow.python.ops import resources from tensorflow.python.ops import variables @@ -194,6 +196,19 @@ class GraphActionsTest(tf.test.TestCase): pass self.assertTrue(request_stop.called) + def test_run_feeds_iter_calls_resources_init(self): + with tf.Graph().as_default() as g: + in0, _, _ = self._build_inference_graph() + handle = test_ops.stub_resource_handle_op(container='a', shared_name='b') + resources.register_resource( + handle=handle, + create_op=test_ops.resource_create_op(handle), + is_initialized_op=test_ops.resource_initialized_op(handle)) + + for _ in learn.graph_actions.run_feeds_iter({'in0': in0}, + feed_dicts=[{}]): + self.assertTrue(test_ops.resource_initialized_op(handle).eval()) + def test_infer_different_default_graph(self): with self.test_session(): self._assert_ckpt(self._output_dir, False) diff --git a/tensorflow/contrib/learn/python/learn/learn_io/graph_io.py b/tensorflow/contrib/learn/python/learn/learn_io/graph_io.py index ea0fb9e74e5..9542020a20c 100644 --- a/tensorflow/contrib/learn/python/learn/learn_io/graph_io.py +++ b/tensorflow/contrib/learn/python/learn/learn_io/graph_io.py @@ -24,6 +24,7 @@ from tensorflow.python.framework import constant_op from tensorflow.python.framework import dtypes from tensorflow.python.framework import errors from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import data_flow_ops from tensorflow.python.ops import io_ops from tensorflow.python.ops import math_ops @@ -645,7 +646,7 @@ def queue_parsed_features(parsed_features, # directly. for key in sorted(parsed_features.keys()): tensor = parsed_features[key] - if isinstance(tensor, ops.SparseTensor): + if isinstance(tensor, sparse_tensor.SparseTensor): tensors_mapping.append((key, True)) tensors_to_enqueue.extend([tensor.indices, tensor.values, tensor.shape]) else: @@ -704,7 +705,7 @@ def queue_parsed_features(parsed_features, for key, is_sparse_tensor in tensors_mapping: if is_sparse_tensor: # Three tensors are (indices, values, shape). 
- dequeued_parsed_features[key] = ops.SparseTensor( + dequeued_parsed_features[key] = sparse_tensor.SparseTensor( dequeued_tensors[index], dequeued_tensors[index + 1], dequeued_tensors[index + 2]) index += 3 diff --git a/tensorflow/contrib/learn/python/learn/monitors_test.py b/tensorflow/contrib/learn/python/learn/monitors_test.py index ded0fb71ab7..0e5ce41f04a 100644 --- a/tensorflow/contrib/learn/python/learn/monitors_test.py +++ b/tensorflow/contrib/learn/python/learn/monitors_test.py @@ -542,7 +542,8 @@ class CheckpointSaverTest(tf.test.TestCase): self.assertEqual(1, tf.contrib.framework.load_variable( self.model_dir, self.global_step.name)) - def test_save_secs_saves_periodically(self): + # TODO(gunan): Reenable this test after b/32446874 is fixed. + def disabled_test_save_secs_saves_periodically(self): with self.graph.as_default(): monitor = learn.monitors.CheckpointSaver( self.model_dir, save_secs=2, scaffold=self.scaffold) diff --git a/tensorflow/contrib/lookup/lookup_ops.py b/tensorflow/contrib/lookup/lookup_ops.py index 23e75ae154c..d4f9c92b2de 100644 --- a/tensorflow/contrib/lookup/lookup_ops.py +++ b/tensorflow/contrib/lookup/lookup_ops.py @@ -20,6 +20,7 @@ from __future__ import print_function from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.framework import tensor_shape from tensorflow.python.ops import array_ops from tensorflow.python.ops import gen_data_flow_ops @@ -166,7 +167,7 @@ class InitializableLookupTableBase(LookupInterface): name = "%s_lookup_table_find" % self._name key_tensor = keys - if isinstance(keys, ops.SparseTensor): + if isinstance(keys, sparse_tensor.SparseTensor): key_tensor = keys.values if keys.dtype != self._key_dtype: @@ -181,8 +182,8 @@ class InitializableLookupTableBase(LookupInterface): # pylint: enable=protected-access values.set_shape(key_tensor.get_shape()) - if isinstance(keys, ops.SparseTensor): - return ops.SparseTensor(keys.indices, values, keys.shape) + if isinstance(keys, sparse_tensor.SparseTensor): + return sparse_tensor.SparseTensor(keys.indices, values, keys.shape) else: return values diff --git a/tensorflow/contrib/lookup/lookup_ops_test.py b/tensorflow/contrib/lookup/lookup_ops_test.py index 803cc3eb1ef..d2d72221406 100644 --- a/tensorflow/contrib/lookup/lookup_ops_test.py +++ b/tensorflow/contrib/lookup/lookup_ops_test.py @@ -18,6 +18,7 @@ from __future__ import division from __future__ import print_function import os +import tempfile import numpy as np import six import tensorflow as tf @@ -296,7 +297,8 @@ class MutableHashTableOpTest(tf.test.TestCase): self.assertAllEqual([0, 1, 2], sorted_values) def testSaveRestore(self): - save_path = os.path.join(self.get_temp_dir(), "hash") + save_dir = os.path.join(self.get_temp_dir(), "save_restore") + save_path = os.path.join(tempfile.mkdtemp(prefix=save_dir), "hash") with self.test_session(graph=tf.Graph()) as sess: v0 = tf.Variable(10.0, name="v0") @@ -867,7 +869,8 @@ class MutableDenseHashTableOpTest(tf.test.TestCase): [100, 0], [100, 0], [100, 0]], pairs) def testSaveRestore(self): - save_path = os.path.join(self.get_temp_dir(), "hash") + save_dir = os.path.join(self.get_temp_dir(), "save_restore") + save_path = os.path.join(tempfile.mkdtemp(prefix=save_dir), "hash") with self.test_session(graph=tf.Graph()) as sess: default_value = -1 @@ -922,7 +925,8 @@ class MutableDenseHashTableOpTest(tf.test.TestCase): self.assertAllEqual([-1, 0, 1, 2, -1], output.eval()) def 
testVectorSaveRestore(self): - save_path = os.path.join(self.get_temp_dir(), "hash") + save_dir = os.path.join(self.get_temp_dir(), "vector_save_restore") + save_path = os.path.join(tempfile.mkdtemp(prefix=save_dir), "hash") with self.test_session(graph=tf.Graph()) as sess: empty_key = tf.constant([11, 13], tf.int64) diff --git a/tensorflow/contrib/makefile/README.md b/tensorflow/contrib/makefile/README.md index 25c03d8bf74..03a745ad4c3 100644 --- a/tensorflow/contrib/makefile/README.md +++ b/tensorflow/contrib/makefile/README.md @@ -1,7 +1,8 @@ ### TensorFlow Makefile The recommended way to build TensorFlow from source is using the Bazel -open-source build system. Sometimes this isn't possible. +open-source build system. Sometimes this isn't possible. For example, +if you are building for iOS, you currently need to use the Makefile. - The build system may not have the RAM or processing power to support Bazel. - Bazel or its dependencies may not be available. diff --git a/tensorflow/contrib/makefile/tf_op_files.txt b/tensorflow/contrib/makefile/tf_op_files.txt index ed5d6539b3b..cbf73a7a16f 100644 --- a/tensorflow/contrib/makefile/tf_op_files.txt +++ b/tensorflow/contrib/makefile/tf_op_files.txt @@ -43,6 +43,13 @@ tensorflow/core/kernels/sequence_ops.cc tensorflow/core/kernels/sendrecv_ops.cc tensorflow/core/kernels/scatter_op.cc tensorflow/core/kernels/scatter_functor.cc +tensorflow/core/kernels/scatter_nd_op_cpu_impl_0.cc +tensorflow/core/kernels/scatter_nd_op_cpu_impl_1.cc +tensorflow/core/kernels/scatter_nd_op_cpu_impl_2.cc +tensorflow/core/kernels/scatter_nd_op_cpu_impl_3.cc +tensorflow/core/kernels/scatter_nd_op_cpu_impl_4.cc +tensorflow/core/kernels/scatter_nd_op_cpu_impl_5.cc +tensorflow/core/kernels/scatter_nd_op.cc tensorflow/core/kernels/save_restore_tensor.cc tensorflow/core/kernels/save_restore_v2_ops.cc tensorflow/core/kernels/save_op.cc diff --git a/tensorflow/contrib/metrics/python/ops/confusion_matrix_ops.py b/tensorflow/contrib/metrics/python/ops/confusion_matrix_ops.py index 1820f6bf17d..dd57f0478be 100644 --- a/tensorflow/contrib/metrics/python/ops/confusion_matrix_ops.py +++ b/tensorflow/contrib/metrics/python/ops/confusion_matrix_ops.py @@ -21,6 +21,7 @@ from __future__ import print_function from tensorflow.contrib.framework import tensor_util from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import math_ops from tensorflow.python.ops import sparse_ops @@ -102,7 +103,7 @@ def confusion_matrix(predictions, labels, num_classes=None, dtype=dtypes.int32, indices = array_ops.transpose(array_ops.pack([predictions, labels])) values = (array_ops.ones_like(predictions, dtype) if weights is None else weights) - cm_sparse = ops.SparseTensor( + cm_sparse = sparse_tensor.SparseTensor( indices=indices, values=values, shape=math_ops.to_int64(shape)) zero_matrix = array_ops.zeros(math_ops.to_int32(shape), dtype) diff --git a/tensorflow/contrib/metrics/python/ops/metric_ops.py b/tensorflow/contrib/metrics/python/ops/metric_ops.py index c7d20613713..90b56b6a971 100644 --- a/tensorflow/contrib/metrics/python/ops/metric_ops.py +++ b/tensorflow/contrib/metrics/python/ops/metric_ops.py @@ -29,6 +29,7 @@ from tensorflow.contrib.metrics.python.ops import confusion_matrix_ops from tensorflow.contrib.metrics.python.ops import set_ops from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from 
tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import check_ops from tensorflow.python.ops import control_flow_ops @@ -762,7 +763,12 @@ def streaming_auc(predictions, labels, weights=None, num_thresholds=200, computes the area under a discretized curve of precision versus recall values (computed using the aforementioned variables). The `num_thresholds` variable controls the degree of discretization with larger numbers of thresholds more - closely approximating the true AUC. + closely approximating the true AUC. The quality of the approximation may vary + dramatically depending on `num_thresholds`. + + For best results, `predictions` should be distributed approximately uniformly + in the range [0, 1] and not peaked around 0 or 1. The quality of the AUC + approximation may be poor if this is not the case. For estimation of the metric over a stream of data, the function creates an `update_op` operation that updates these variables and returns the `auc`. @@ -1601,7 +1607,8 @@ def num_relevant(labels, k): raise ValueError('Invalid k=%s.' % k) with ops.name_scope(None, 'num_relevant', (labels,)) as scope: # For SparseTensor, calculate separate count for each row. - if isinstance(labels, (ops.SparseTensor, ops.SparseTensorValue)): + if isinstance( + labels, (sparse_tensor.SparseTensor, sparse_tensor.SparseTensorValue)): labels_sizes = set_ops.set_size(labels) return math_ops.minimum(labels_sizes, k, name=scope) @@ -1637,9 +1644,9 @@ def expand_and_tile(tensor, multiple, dim=0, name=None): with ops.name_scope( name, 'expand_and_tile', (tensor, multiple, dim)) as scope: # Sparse. - if isinstance(tensor, ops.SparseTensorValue): - tensor = ops.SparseTensor.from_value(tensor) - if isinstance(tensor, ops.SparseTensor): + if isinstance(tensor, sparse_tensor.SparseTensorValue): + tensor = sparse_tensor.SparseTensor.from_value(tensor) + if isinstance(tensor, sparse_tensor.SparseTensor): if dim < 0: expand_dims = array_ops.reshape( array_ops.size(tensor.shape) + dim, [1]) @@ -1871,7 +1878,8 @@ def _select_class_id(ids, selected_id): `SparseTensor` of same dimensions as `ids`. This contains only the entries equal to `selected_id`. """ - if isinstance(ids, (ops.SparseTensor, ops.SparseTensorValue)): + if isinstance( + ids, (sparse_tensor.SparseTensor, sparse_tensor.SparseTensorValue)): return sparse_ops.sparse_retain( ids, math_ops.equal(ids.values, selected_id)) @@ -1888,7 +1896,7 @@ def _select_class_id(ids, selected_id): filled_selected_id = array_ops.fill( filled_selected_id_shape, math_ops.to_int64(selected_id)) result = set_ops.set_intersection(filled_selected_id, ids) - return ops.SparseTensor( + return sparse_tensor.SparseTensor( indices=result.indices, values=result.values, shape=ids_shape) diff --git a/tensorflow/contrib/metrics/python/ops/set_ops.py b/tensorflow/contrib/metrics/python/ops/set_ops.py index ed9fd6ffd4a..c4c894cc0fb 100644 --- a/tensorflow/contrib/metrics/python/ops/set_ops.py +++ b/tensorflow/contrib/metrics/python/ops/set_ops.py @@ -23,6 +23,7 @@ from tensorflow.contrib.util import loader from tensorflow.python.framework import common_shapes from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.platform import resource_loader @@ -54,7 +55,7 @@ def set_size(a, validate_indices=True): TypeError: If `a` is an invalid types. 
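A recurring mechanical change across these files: `SparseTensor` (and `SparseTensorValue`) moved out of `tensorflow.python.framework.ops` into a dedicated `sparse_tensor` module, so every `isinstance` check and constructor call is rewritten against the new import path. A minimal sketch of code written against the new location; the helper itself is illustrative, not part of the patch:

```python
from tensorflow.python.framework import sparse_tensor
from tensorflow.python.ops import sparse_ops


def densify_if_sparse(t, default_value=0):
  # isinstance checks and constructor calls now go through the
  # sparse_tensor module instead of ops.
  if isinstance(t, sparse_tensor.SparseTensor):
    return sparse_ops.sparse_tensor_to_dense(t, default_value)
  return t
```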
""" a = tensor_util.convert_to_tensor_or_sparse_tensor(a, name="a") - if not isinstance(a, ops.SparseTensor): + if not isinstance(a, sparse_tensor.SparseTensor): raise TypeError("Expected `SparseTensor`, got %s." % a) if a.values.dtype.base_dtype not in _VALID_DTYPES: raise TypeError("Invalid dtype %s." % a.values.dtype) @@ -106,22 +107,22 @@ def _set_operation(a, b, set_operation, validate_indices=True): if b.dtype.base_dtype != a.dtype.base_dtype: raise TypeError("Types don't match, %s vs %s." % (a.dtype, b.dtype)) # pylint: disable=protected-access - if isinstance(a, ops.SparseTensor): - if isinstance(b, ops.SparseTensor): + if isinstance(a, sparse_tensor.SparseTensor): + if isinstance(b, sparse_tensor.SparseTensor): indices, values, shape = _set_ops.sparse_to_sparse_set_operation( a.indices, a.values, a.shape, b.indices, b.values, b.shape, set_operation, validate_indices) else: raise ValueError("Sparse,Dense is not supported, but Dense,Sparse is. " "Please flip the order of your inputs.") - elif isinstance(b, ops.SparseTensor): + elif isinstance(b, sparse_tensor.SparseTensor): indices, values, shape = _set_ops.dense_to_sparse_set_operation( a, b.indices, b.values, b.shape, set_operation, validate_indices) else: indices, values, shape = _set_ops.dense_to_dense_set_operation( a, b, set_operation, validate_indices) # pylint: enable=protected-access - return ops.SparseTensor(indices, values, shape) + return sparse_tensor.SparseTensor(indices, values, shape) def set_intersection(a, b, validate_indices=True): diff --git a/tensorflow/contrib/opt/python/training/moving_average_optimizer_test.py b/tensorflow/contrib/opt/python/training/moving_average_optimizer_test.py index 4c24276cdd5..02ce9ff24fb 100644 --- a/tensorflow/contrib/opt/python/training/moving_average_optimizer_test.py +++ b/tensorflow/contrib/opt/python/training/moving_average_optimizer_test.py @@ -18,6 +18,7 @@ from __future__ import division from __future__ import print_function import os.path +import tempfile import six import tensorflow as tf @@ -40,7 +41,9 @@ class MovingAverageOptimizerTest(tf.test.TestCase): tf.train.GradientDescentOptimizer(learning_rate=2.0), average_decay=0.5, sequential_update=sequential_update) - save_path = os.path.join(self.get_temp_dir(), 'model') + save_dir = tempfile.mkdtemp( + prefix=os.path.join(self.get_temp_dir(), 'run_1')) + save_path = os.path.join(save_dir, 'model') update = opt.apply_gradients( list(six.moves.zip([grads0, grads1], [var0, var1]))) train_saver = opt.swapping_saver() diff --git a/tensorflow/contrib/pi_examples/camera/Makefile b/tensorflow/contrib/pi_examples/camera/Makefile index d7dd3e131f3..182baefcd65 100644 --- a/tensorflow/contrib/pi_examples/camera/Makefile +++ b/tensorflow/contrib/pi_examples/camera/Makefile @@ -39,7 +39,7 @@ INCLUDES := \ -I/usr/local/include \ -I. \ -I$(DOWNLOADSDIR) \ --I$(DOWNLOADSDIR)/eigen-latest/ \ +-I$(DOWNLOADSDIR)/eigen/ \ -I$(PROTOGENDIR) \ -I$(PBTGENDIR) LIBS := \ diff --git a/tensorflow/contrib/pi_examples/label_image/Makefile b/tensorflow/contrib/pi_examples/label_image/Makefile index 511da285a95..0cf71bd2943 100644 --- a/tensorflow/contrib/pi_examples/label_image/Makefile +++ b/tensorflow/contrib/pi_examples/label_image/Makefile @@ -39,7 +39,7 @@ INCLUDES := \ -I/usr/local/include \ -I. 
\ -I$(DOWNLOADSDIR) \ --I$(DOWNLOADSDIR)/eigen-latest/ \ +-I$(DOWNLOADSDIR)/eigen/ \ -I$(PROTOGENDIR) \ -I$(PBTGENDIR) LIBS := \ diff --git a/tensorflow/contrib/slim/BUILD b/tensorflow/contrib/slim/BUILD index 266605b2c29..0d489834254 100644 --- a/tensorflow/contrib/slim/BUILD +++ b/tensorflow/contrib/slim/BUILD @@ -46,6 +46,7 @@ py_test( name = "learning_test", srcs = ["python/slim/learning_test.py"], srcs_version = "PY2AND3", + tags = ["manual"], deps = [ "//tensorflow:tensorflow_py", "//tensorflow/contrib/slim", diff --git a/tensorflow/contrib/slim/python/slim/data/tfexample_decoder.py b/tensorflow/contrib/slim/python/slim/data/tfexample_decoder.py index 65eadbf4e9e..fb5a0d677f9 100644 --- a/tensorflow/contrib/slim/python/slim/data/tfexample_decoder.py +++ b/tensorflow/contrib/slim/python/slim/data/tfexample_decoder.py @@ -27,7 +27,7 @@ import abc from tensorflow.contrib.slim.python.slim.data import data_decoder from tensorflow.python.framework import dtypes -from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import control_flow_ops from tensorflow.python.ops import image_ops @@ -189,11 +189,11 @@ class Tensor(ItemHandler): shape_dims = [] for k in self._shape_keys: shape_dim = keys_to_tensors[k] - if isinstance(shape_dim, ops.SparseTensor): + if isinstance(shape_dim, sparse_tensor.SparseTensor): shape_dim = sparse_ops.sparse_tensor_to_dense(shape_dim) shape_dims.append(shape_dim) shape = array_ops.reshape(array_ops.pack(shape_dims), [-1]) - if isinstance(tensor, ops.SparseTensor): + if isinstance(tensor, sparse_tensor.SparseTensor): if shape is not None: tensor = sparse_ops.sparse_reshape(tensor, shape) tensor = sparse_ops.sparse_tensor_to_dense(tensor, self._default_value) @@ -241,7 +241,7 @@ class SparseTensor(ItemHandler): values = keys_to_tensors[self._values_key] if self._shape_key: shape = keys_to_tensors[self._shape_key] - if isinstance(shape, ops.SparseTensor): + if isinstance(shape, sparse_tensor.SparseTensor): shape = sparse_ops.sparse_tensor_to_dense(shape) elif self._shape: shape = self._shape @@ -255,7 +255,7 @@ class SparseTensor(ItemHandler): new_indices = array_ops.concat(1, [indices_columns_to_preserve, array_ops.reshape(ids, [-1, 1])]) - tensor = ops.SparseTensor(new_indices, values.values, shape) + tensor = sparse_tensor.SparseTensor(new_indices, values.values, shape) if self._densify: tensor = sparse_ops.sparse_tensor_to_dense(tensor, self._default_value) return tensor diff --git a/tensorflow/contrib/tensor_forest/core/ops/finished_nodes_op.cc b/tensorflow/contrib/tensor_forest/core/ops/finished_nodes_op.cc index 045f16e5473..7afaa00fada 100644 --- a/tensorflow/contrib/tensor_forest/core/ops/finished_nodes_op.cc +++ b/tensorflow/contrib/tensor_forest/core/ops/finished_nodes_op.cc @@ -132,11 +132,9 @@ REGISTER_OP("FinishedNodes") .Attr("num_split_after_samples: int") .Attr("min_split_samples: int") .Attr("dominate_fraction: float = 0.99") - // TODO(thomaswc): Test out bootstrap on several datasets, confirm it - // works well, make it the default. 
.Attr( " dominate_method:" - " {'none', 'hoeffding', 'bootstrap', 'chebyshev'} = 'hoeffding'") + " {'none', 'hoeffding', 'bootstrap', 'chebyshev'} = 'bootstrap'") .Attr("random_seed: int = 0") .Input("leaves: int32") .Input("node_to_accumulator: int32") diff --git a/tensorflow/contrib/tensor_forest/core/ops/training_ops_test.cc b/tensorflow/contrib/tensor_forest/core/ops/training_ops_test.cc index 451dcf2a94f..f8832a48fe2 100644 --- a/tensorflow/contrib/tensor_forest/core/ops/training_ops_test.cc +++ b/tensorflow/contrib/tensor_forest/core/ops/training_ops_test.cc @@ -26,7 +26,7 @@ namespace tensorflow { TEST(TrainingOpsTest, UpdateFertileSlots_ShapeFn) { ShapeInferenceTestOp op("UpdateFertileSlots"); - INFER_OK(op, "?;?;?;?;?;?;?", "[2,?];[2,?];[?];[?]"); + INFER_OK(op, "?;?;?;?;?;?;?;?", "[2,?];[2,?];[?];[?]"); } TEST(TrainingOpsTest, ScatterAddNdim_ShapeFn) { diff --git a/tensorflow/contrib/tensor_forest/core/ops/tree_utils.h b/tensorflow/contrib/tensor_forest/core/ops/tree_utils.h index b2f66acb6e4..7c7193f0f45 100644 --- a/tensorflow/contrib/tensor_forest/core/ops/tree_utils.h +++ b/tensorflow/contrib/tensor_forest/core/ops/tree_utils.h @@ -55,23 +55,29 @@ T Sum(Tensor counts) { // is stored in index 0, individual feature types start at index 1. DataColumnTypes FeatureSpec(int32 input_feature, const Tensor& spec); -// Given an Eigen::Tensor type, calculate the Gini impurity, which we use -// to determine the best split (lowest) and which nodes to allocate first -// (highest). -template <typename T> -float WeightedGiniImpurity(const T& counts) { +// Given an Eigen::Tensor type, calculate the Gini impurity. +template <typename T> +float RawWeightedGiniImpurity(const T& counts) { // Our split score is the Gini impurity times the number of examples // seen by the leaf. If c(i) denotes the i-th class count and c = sum_i c(i) // then // score = c * (1 - sum_i ( c(i) / c )^2 ) // = c - sum_i c(i)^2 / c - const auto smoothed = counts + counts.constant(1.0f); - const auto sum = smoothed.sum(); - const auto sum2 = smoothed.square().sum(); + const auto sum = counts.sum(); + const auto sum2 = counts.square().sum(); Eigen::Tensor<float, 0, Eigen::RowMajor> ret = sum - (sum2 / sum); return ret(0); } +// Given an Eigen::Tensor type, calculate the smoothed Gini impurity, which we +// use to determine the best split (lowest) and which nodes to allocate first +// (highest). +template <typename T> +float WeightedGiniImpurity(const T& counts) { + const auto smoothed = counts + counts.constant(1.0f); + return RawWeightedGiniImpurity(smoothed); +} + template <typename T1, typename T2> float WeightedVariance(const T1& sums, const T2& squares, float count) { const auto e_x = sums / count; diff --git a/tensorflow/contrib/tensor_forest/core/ops/update_fertile_slots_op.cc b/tensorflow/contrib/tensor_forest/core/ops/update_fertile_slots_op.cc index 448869ab750..52b7f6d3b3a 100644 --- a/tensorflow/contrib/tensor_forest/core/ops/update_fertile_slots_op.cc +++ b/tensorflow/contrib/tensor_forest/core/ops/update_fertile_slots_op.cc @@ -48,6 +48,7 @@ REGISTER_OP("UpdateFertileSlots") .Input("accumulator_sums: float") .Input("node_to_accumulator: int32") .Input("stale_leaves: int32") + .Input("node_sums: float") .Output("node_to_accumulator_map_updates: int32") .Output("accumulator_to_node_map_updates: int32") .Output("accumulators_cleared: int32") @@ -84,6 +85,8 @@ node_to_accumulator: `node_to_accumulator[i]` is the accumulator slot used by fertile node i, or -1 if node i isn't fertile. 
stale_leaves:= A 1-d int32 tensor containing the indices of all leaves that have stopped accumulating statistics because they are too old. +node_sums: `node_sums[n][c]` records how many + training examples have class c and have ended up in node n. node_to_accumulator_map_updates:= A 2-d int32 tensor describing the changes that need to be applied to the node_to_accumulator map. Intended to be used with @@ -121,6 +124,7 @@ class UpdateFertileSlots : public OpKernel { const Tensor& accumulator_sums = context->input(4); const Tensor& node_to_accumulator = context->input(5); const Tensor& stale_leaves = context->input(6); + const Tensor& node_sums = context->input(7); OP_REQUIRES(context, finished.shape().dims() == 1, errors::InvalidArgument( @@ -204,6 +208,8 @@ class UpdateFertileSlots : public OpKernel { non_fertile_leaves, non_fertile_leaf_scores, eot, num_new_leaves, static_cast<int32>(accumulator_sums.shape().dim_size(1)), &leaf_heap); + const auto sums = node_sums.unaligned_flat<float>(); + const int32 num_columns = node_sums.shape().dim_size(1); // Allocate leaves. std::unique_ptr<HeapValuesType> values( leaf_heap.Extract()); @@ -218,6 +224,18 @@ class UpdateFertileSlots : public OpKernel { VLOG(1) << "No allocators left."; break; } + // For classification, don't make a node fertile until it is impure. + if (!regression_) { + // Add 1 here because index 0 contains the sum of the weights across + // classes. + Eigen::array<int, 1> offsets = {node.first * num_columns + 1}; + Eigen::array<int, 1> extents = {num_columns - 1}; + const auto node_counts = sums.slice(offsets, extents); + // TODO(thomaswc): Implement a faster check for pure nodes. + if (tensorforest::RawWeightedGiniImpurity(node_counts) == 0) { + continue; + } + } VLOG(1) << "setting node " << node.first << " to accumulator " << accumulator; ++num_accumulators_allocated; diff --git a/tensorflow/contrib/tensor_forest/data/data_ops.py b/tensorflow/contrib/tensor_forest/data/data_ops.py index 1dfcaf5c7a4..80798d3e48a 100644 --- a/tensorflow/contrib/tensor_forest/data/data_ops.py +++ b/tensorflow/contrib/tensor_forest/data/data_ops.py @@ -25,6 +25,7 @@ from tensorflow.python.framework import common_shapes from tensorflow.python.framework import dtypes from tensorflow.python.framework import load_library from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import math_ops from tensorflow.python.ops import sparse_ops @@ -77,7 +78,7 @@ def _ParseSparse(data): ValueError: If data contains non-string Tensors. """ for k in sorted(data.keys()): - if not isinstance(data[k], ops.SparseTensor): + if not isinstance(data[k], sparse_tensor.SparseTensor): raise NotImplementedError( 'Features should be either all sparse or all dense. Use a ' 'feature engineering function to convert some of them.') @@ -133,7 +134,7 @@ def ParseDataTensorOrDict(data): # If there's at least one sparse tensor, everything has to be sparse.
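The recurring `ops.SparseTensor` to `sparse_tensor.SparseTensor` edits throughout this patch track a class move, not a behavior change. A minimal sketch of the check the contrib code now performs, using the 0.11-era constructor (`shape=` rather than the later `dense_shape=`):

```python
import tensorflow as tf
from tensorflow.python.framework import sparse_tensor

st = tf.SparseTensor(indices=[[0, 0], [1, 2]], values=[1.0, 2.0], shape=[2, 3])
# The public tf.SparseTensor is the same class, so the relocated isinstance
# tests in tfexample_decoder.py and data_ops.py still accept it.
print(isinstance(st, sparse_tensor.SparseTensor))  # True
```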
is_sparse = False for v in data.values(): - if isinstance(v, ops.SparseTensor): + if isinstance(v, sparse_tensor.SparseTensor): is_sparse = True break if is_sparse: @@ -161,11 +162,11 @@ def ParseLabelTensorOrDict(labels): """ if isinstance(labels, dict): return math_ops.to_float(array_ops.concat( - 1, [sparse_ops.sparse_tensor_to_dense(labels[ - k], default_value=-1) if isinstance(labels, ops.SparseTensor) else - labels[k] for k in sorted(labels.keys())])) + 1, [sparse_ops.sparse_tensor_to_dense(labels[k], default_value=-1) + if isinstance(labels, sparse_tensor.SparseTensor) + else labels[k] for k in sorted(labels.keys())])) else: - if isinstance(labels, ops.SparseTensor): + if isinstance(labels, sparse_tensor.SparseTensor): return math_ops.to_float(sparse_ops.sparse_tensor_to_dense( labels, default_value=-1)) else: diff --git a/tensorflow/contrib/tensor_forest/python/kernel_tests/update_fertile_slots_op_test.py b/tensorflow/contrib/tensor_forest/python/kernel_tests/update_fertile_slots_op_test.py index 1506f65e163..35faeed95c1 100644 --- a/tensorflow/contrib/tensor_forest/python/kernel_tests/update_fertile_slots_op_test.py +++ b/tensorflow/contrib/tensor_forest/python/kernel_tests/update_fertile_slots_op_test.py @@ -40,6 +40,8 @@ class UpdateFertileSlotsTest(test_util.TensorFlowTestCase): self.total_counts = [[80., 40., 40.]] self.ops = training_ops.Load() self.stale_leaves = [] + self.node_sums = [[3, 1, 2], [4, 2, 2], [5, 2, 3], [6, 1, 5], [7, 5, 2], + [8, 4, 4], [9, 7, 2]] def testSimple(self): with self.test_session(): @@ -47,7 +49,7 @@ class UpdateFertileSlotsTest(test_util.TensorFlowTestCase): accumulators_allocated) = self.ops.update_fertile_slots( self.finished, self.non_fertile_leaves, self.non_fertile_leaf_scores, self.end_of_tree, self.total_counts, self.node_map, - self.stale_leaves) + self.stale_leaves, self.node_sums) self.assertAllEqual([[2, 4], [-1, 0]], n2a_map_updates.eval()) self.assertAllEqual([[0], [4]], a2n_map_updates.eval()) @@ -60,13 +62,27 @@ class UpdateFertileSlotsTest(test_util.TensorFlowTestCase): accumulators_allocated) = self.ops.update_fertile_slots( [], self.non_fertile_leaves, self.non_fertile_leaf_scores, self.end_of_tree, self.total_counts, self.node_map, - self.stale_leaves) + self.stale_leaves, self.node_sums) self.assertAllEqual((2, 0), n2a_map_updates.eval().shape) self.assertAllEqual((2, 0), a2n_map_updates.eval().shape) self.assertAllEqual([], accumulators_cleared.eval()) self.assertAllEqual([], accumulators_allocated.eval()) + def testPureCounts(self): + with self.test_session(): + self.node_sums[4] = [10, 0, 10] + (n2a_map_updates, a2n_map_updates, accumulators_cleared, + accumulators_allocated) = self.ops.update_fertile_slots( + self.finished, self.non_fertile_leaves, self.non_fertile_leaf_scores, + self.end_of_tree, self.total_counts, self.node_map, + self.stale_leaves, self.node_sums) + + self.assertAllEqual([[2, 3], [-1, 0]], n2a_map_updates.eval()) + self.assertAllEqual([[0], [3]], a2n_map_updates.eval()) + self.assertAllEqual([], accumulators_cleared.eval()) + self.assertAllEqual([0], accumulators_allocated.eval()) + def testBadInput(self): del self.non_fertile_leaf_scores[-1] with self.test_session(): @@ -76,7 +92,7 @@ class UpdateFertileSlotsTest(test_util.TensorFlowTestCase): (n2a_map_updates, _, _, _) = self.ops.update_fertile_slots( self.finished, self.non_fertile_leaves, self.non_fertile_leaf_scores, self.end_of_tree, self.total_counts, - self.node_map, self.stale_leaves) + self.node_map, self.stale_leaves, self.node_sums) 
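As a usage sketch (values illustrative) of the densification path `ParseLabelTensorOrDict` takes for sparse labels, with the same `default_value=-1` convention as above:

```python
import tensorflow as tf

labels = tf.SparseTensor(indices=[[0, 0], [2, 0]], values=[3.0, 7.0],
                         shape=[4, 1])
# Rows with no recorded label densify to -1., then everything is cast to float.
dense = tf.to_float(tf.sparse_tensor_to_dense(labels, default_value=-1))
with tf.Session() as sess:
    print(sess.run(dense))  # [[3.], [-1.], [7.], [-1.]]
```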
self.assertAllEqual((2, 0), n2a_map_updates.eval().shape) diff --git a/tensorflow/contrib/tensor_forest/python/tensor_forest.py b/tensorflow/contrib/tensor_forest/python/tensor_forest.py index 17d469739f9..b7b2fb96370 100644 --- a/tensorflow/contrib/tensor_forest/python/tensor_forest.py +++ b/tensorflow/contrib/tensor_forest/python/tensor_forest.py @@ -29,6 +29,7 @@ from tensorflow.contrib.tensor_forest.python.ops import training_ops from tensorflow.python.framework import constant_op from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import control_flow_ops from tensorflow.python.ops import init_ops @@ -629,7 +630,7 @@ class RandomTreeGraphs(object): sparse_indices = [] sparse_values = [] sparse_shape = [] - if isinstance(input_data, ops.SparseTensor): + if isinstance(input_data, sparse_tensor.SparseTensor): sparse_indices = input_data.indices sparse_values = input_data.values sparse_shape = input_data.shape @@ -780,6 +781,7 @@ class RandomTreeGraphs(object): self.variables.accumulator_sums, self.variables.node_to_accumulator_map, stale, + self.variables.node_sums, regression=self.params.regression)) # Ensure end_of_tree doesn't get updated until UpdateFertileSlots has @@ -881,7 +883,7 @@ class RandomTreeGraphs(object): sparse_indices = [] sparse_values = [] sparse_shape = [] - if isinstance(input_data, ops.SparseTensor): + if isinstance(input_data, sparse_tensor.SparseTensor): sparse_indices = input_data.indices sparse_values = input_data.values sparse_shape = input_data.shape diff --git a/tensorflow/contrib/training/BUILD b/tensorflow/contrib/training/BUILD index 81dc8e9064f..9c116266a2d 100644 --- a/tensorflow/contrib/training/BUILD +++ b/tensorflow/contrib/training/BUILD @@ -15,9 +15,16 @@ py_library( "python/training/resample.py", "python/training/sampling_ops.py", "python/training/sequence_queueing_state_saver.py", + "python/training/training.py", ], srcs_version = "PY2AND3", visibility = ["//visibility:public"], + deps = [ + "//tensorflow/python:framework", + "//tensorflow/python:ops", + "//tensorflow/python:platform", + "//tensorflow/python:training", + ], ) py_test( @@ -37,6 +44,7 @@ py_test( size = "medium", srcs = ["python/training/batch_sequences_with_states_test.py"], srcs_version = "PY2AND3", + tags = ["manual"], deps = [ ":training_py", "//tensorflow:tensorflow_py", @@ -73,7 +81,10 @@ py_test( size = "small", srcs = ["python/training/sampling_ops_threading_test.py"], srcs_version = "PY2AND3", - tags = ["notsan"], + tags = [ + "manual", + "notsan", + ], deps = [ ":training_py", "//tensorflow:tensorflow_py", @@ -86,6 +97,20 @@ py_test( size = "medium", srcs = ["python/training/bucket_ops_test.py"], srcs_version = "PY2AND3", + tags = ["manual"], + deps = [ + ":training_py", + "//tensorflow:tensorflow_py", + "//tensorflow/python:framework_test_lib", + ], +) + +py_test( + name = "training_test", + size = "large", + srcs = ["python/training/training_test.py"], + shard_count = 3, + srcs_version = "PY2AND3", deps = [ ":training_py", "//tensorflow:tensorflow_py", diff --git a/tensorflow/contrib/training/__init__.py b/tensorflow/contrib/training/__init__.py index d2a6368d785..721f8cdf750 100644 --- a/tensorflow/contrib/training/__init__.py +++ b/tensorflow/contrib/training/__init__.py @@ -70,6 +70,11 @@ from tensorflow.contrib.training.python.training.bucket_ops import * from 
tensorflow.contrib.training.python.training.resample import * from tensorflow.contrib.training.python.training.sampling_ops import * from tensorflow.contrib.training.python.training.sequence_queueing_state_saver import * +from tensorflow.contrib.training.python.training.training import add_gradients_summaries +from tensorflow.contrib.training.python.training.training import clip_gradient_norms +from tensorflow.contrib.training.python.training.training import create_train_op +from tensorflow.contrib.training.python.training.training import multiply_gradients +from tensorflow.contrib.training.python.training.training import train from tensorflow.python.util.all_util import make_all __all__ = make_all(__name__) diff --git a/tensorflow/contrib/training/python/training/training.py b/tensorflow/contrib/training/python/training/training.py new file mode 100644 index 00000000000..e65ef6ba119 --- /dev/null +++ b/tensorflow/contrib/training/python/training/training.py @@ -0,0 +1,316 @@ +# Copyright 2016 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== +"""Contains various routines and helper functions for training models. + +TODO(nsilberman): Port documentation. +""" + +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +from tensorflow.contrib.framework.python.ops import variables +from tensorflow.python import summary +from tensorflow.python.framework import constant_op +from tensorflow.python.framework import ops +from tensorflow.python.ops import array_ops +from tensorflow.python.ops import clip_ops +from tensorflow.python.ops import control_flow_ops +from tensorflow.python.ops import variables as tf_variables +from tensorflow.python.platform import tf_logging as logging +from tensorflow.python.training import basic_session_run_hooks +from tensorflow.python.training import monitored_session +from tensorflow.python.training import optimizer as tf_optimizer + +# TODO(nsilberman): move add_gradients_summaries, clip_gradient_norms and +# multiply_gradients into contrib/summaries and contrib/optimizers.py +__all__ = [ + 'add_gradients_summaries', + 'clip_gradient_norms', + 'create_train_op', + 'multiply_gradients', + 'train', +] + + +def add_gradients_summaries(grads_and_vars): + """Add summaries to gradients. + + Args: + grads_and_vars: A list of gradient to variable pairs (tuples). + + Returns: + The list of created summaries. 
+ """ + summaries = [] + for grad, var in grads_and_vars: + if grad is not None: + if isinstance(grad, ops.IndexedSlices): + grad_values = grad.values + else: + grad_values = grad + summaries.append(summary.histogram_summary( + var.op.name + ':gradient', grad_values)) + summaries.append(summary.histogram_summary( + var.op.name + ':gradient_norm', clip_ops.global_norm([grad_values]))) + else: + logging.info('Var %s has no gradient', var.op.name) + + return summaries + + +def clip_gradient_norms(gradients_to_variables, max_norm): + """Clips the gradients by the given value. + + Args: + gradients_to_variables: A list of gradient to variable pairs (tuples). + max_norm: the maximum norm value. + + Returns: + A list of clipped gradient to variable pairs. + """ + clipped_grads_and_vars = [] + for grad, var in gradients_to_variables: + if grad is not None: + if isinstance(grad, ops.IndexedSlices): + tmp = clip_ops.clip_by_norm(grad.values, max_norm) + grad = ops.IndexedSlices(tmp, grad.indices, grad.dense_shape) + else: + grad = clip_ops.clip_by_norm(grad, max_norm) + clipped_grads_and_vars.append((grad, var)) + return clipped_grads_and_vars + + +def multiply_gradients(grads_and_vars, gradient_multipliers): + """Multiply specified gradients. + + Args: + grads_and_vars: A list of gradient to variable pairs (tuples). + gradient_multipliers: A map from either `Variables` or `Variable` op names + to the coefficient by which the associated gradient should be scaled. + + Returns: + The updated list of gradient to variable pairs. + + Raises: + ValueError: If `grads_and_vars` is not a list or if `gradient_multipliers` + is empty or None or if `gradient_multipliers` is not a dictionary. + """ + if not isinstance(grads_and_vars, list): + raise ValueError('`grads_and_vars` must be a list.') + if not gradient_multipliers: + raise ValueError('`gradient_multipliers` is empty.') + if not isinstance(gradient_multipliers, dict): + raise ValueError('`gradient_multipliers` must be a dict.') + + multiplied_grads_and_vars = [] + for grad, var in grads_and_vars: + if var in gradient_multipliers or var.op.name in gradient_multipliers: + key = var if var in gradient_multipliers else var.op.name + if grad is None: + raise ValueError('Requested multiple of `None` gradient.') + + if isinstance(grad, ops.IndexedSlices): + tmp = grad.values * constant_op.constant( + gradient_multipliers[key], dtype=grad.dtype) + grad = ops.IndexedSlices(tmp, grad.indices, grad.dense_shape) + else: + grad *= constant_op.constant( + gradient_multipliers[key], dtype=grad.dtype) + multiplied_grads_and_vars.append((grad, var)) + return multiplied_grads_and_vars + + +def create_train_op(total_loss, + optimizer, + global_step=None, + update_ops=None, + variables_to_train=None, + transform_grads_fn=None, + summarize_gradients=False, + gate_gradients=tf_optimizer.Optimizer.GATE_OP, + aggregation_method=None, + colocate_gradients_with_ops=False): + """Creates an `Operation` that evaluates the gradients and returns the loss. + + Args: + total_loss: A `Tensor` representing the total loss. + optimizer: A tf.Optimizer to use for computing the gradients. + global_step: A `Tensor` representing the global step variable. If left as + `None`, then slim.variables.global_step() is used. + update_ops: An optional list of updates to execute. If `update_ops` is + `None`, then the update ops are set to the contents of the + `tf.GraphKeys.UPDATE_OPS` collection. 
If `update_ops` is not `None`, but + it doesn't contain all of the update ops in `tf.GraphKeys.UPDATE_OPS`, + a warning will be displayed. + variables_to_train: An optional list of variables to train. If None, it will + default to all tf.trainable_variables(). + transform_grads_fn: A function which takes a single argument, a list of + gradient to variable pairs (tuples), performs any requested gradient + updates, such as gradient clipping or multipliers, and returns the updated + list. + summarize_gradients: Whether or not to add summaries for each gradient. + gate_gradients: How to gate the computation of gradients. See tf.Optimizer. + aggregation_method: Specifies the method used to combine gradient terms. + Valid values are defined in the class `AggregationMethod`. + colocate_gradients_with_ops: Whether or not to try colocating the gradients + with the ops that generated them. + + Returns: + A `Tensor` that, when evaluated, computes the gradients and returns the total + loss value. + """ + if global_step is None: + global_step = variables.get_or_create_global_step() + + # Update ops use GraphKeys.UPDATE_OPS collection if update_ops is None. + global_update_ops = set(ops.get_collection(ops.GraphKeys.UPDATE_OPS)) + if update_ops is None: + update_ops = global_update_ops + else: + update_ops = set(update_ops) + if not global_update_ops.issubset(update_ops): + logging.warning('update_ops in create_train_op does not contain all the ' + 'update_ops in GraphKeys.UPDATE_OPS') + + # Make sure update_ops are computed before total_loss. + if update_ops: + with ops.control_dependencies(update_ops): + barrier = control_flow_ops.no_op(name='update_barrier') + total_loss = control_flow_ops.with_dependencies([barrier], total_loss) + + if variables_to_train is None: + # Default to tf.trainable_variables() + variables_to_train = tf_variables.trainable_variables() + else: + # Make sure that variables_to_train are in tf.trainable_variables() + for v in variables_to_train: + assert v in tf_variables.trainable_variables() + + assert variables_to_train + + # Create the gradients. Note that compute_gradients adds the gradient + # computation to the current graph. + grads = optimizer.compute_gradients( + total_loss, + variables_to_train, + gate_gradients=gate_gradients, + aggregation_method=aggregation_method, + colocate_gradients_with_ops=colocate_gradients_with_ops) + + if transform_grads_fn: + grads = transform_grads_fn(grads) + + # Summarize gradients. + if summarize_gradients: + with ops.name_scope('summarize_grads'): + add_gradients_summaries(grads) + + # Create gradient updates. + grad_updates = optimizer.apply_gradients(grads, global_step=global_step) + + with ops.name_scope('train_op'): + # Make sure total_loss is valid. + total_loss = array_ops.check_numerics(total_loss, + 'LossTensor is inf or nan') + + # Ensure the train_tensor computes grad_updates. + return control_flow_ops.with_dependencies([grad_updates], total_loss) + + +def train( + train_op, + logdir, + master='', + is_chief=True, + scaffold=None, + hooks=None, + chief_only_hooks=None, + save_checkpoint_secs=600, + save_summaries_steps=100, + config=None): + """Runs the training loop. + + Args: + train_op: A `Tensor` that, when executed, will apply the gradients and + return the loss value. + logdir: The directory where the graph and checkpoints are saved. + master: The URL of the master. + is_chief: Specifies whether or not the training is being run by the primary + replica during replica training. + scaffold: A tf.train.Scaffold instance.
+ hooks: List of `tf.train.SessionRunHook` callbacks which are run inside the + training loop. + chief_only_hooks: List of `tf.train.SessionRunHook` instances which are run + inside the training loop for the chief trainer only. + save_checkpoint_secs: The frequency, in seconds, that a checkpoint is saved + using a default checkpoint saver. If `save_checkpoint_secs` is set to + `None`, then the default checkpoint saver isn't used. + save_summaries_steps: The frequency, in number of global steps, that the + summaries are written to disk using a default summary saver. If + `save_summaries_steps` is set to `None`, then the default summary saver + isn't used. + config: An instance of `tf.ConfigProto`. + + Returns: + The value of the loss function after training. + + Raises: + ValueError: if `logdir` is `None` and either `save_checkpoint_secs` or + `save_summaries_steps` is not `None`. + """ + # TODO(nsilberman): move this logic into monitored_session.py + scaffold = scaffold or monitored_session.Scaffold() + + hooks = hooks or [] + + if is_chief: + session_creator = monitored_session.ChiefSessionCreator( + scaffold=scaffold, + checkpoint_dir=logdir, + master=master, + config=config) + + if chief_only_hooks: + hooks.extend(chief_only_hooks) + + hooks.append(basic_session_run_hooks.StepCounterHook( + output_dir=logdir)) + + if save_summaries_steps: + if logdir is None: + raise ValueError( + 'logdir cannot be None when save_summaries_steps is not None') + hooks.append(basic_session_run_hooks.SummarySaverHook( + scaffold=scaffold, + save_steps=save_summaries_steps, + output_dir=logdir)) + + if save_checkpoint_secs: + if logdir is None: + raise ValueError( + 'logdir cannot be None when save_checkpoint_secs is not None') + hooks.append(basic_session_run_hooks.CheckpointSaverHook( + logdir, save_secs=save_checkpoint_secs, scaffold=scaffold)) + else: + session_creator = monitored_session.WorkerSessionCreator( + scaffold=scaffold, master=master, config=config) + + with monitored_session.MonitoredSession( + session_creator=session_creator, hooks=hooks) as session: + loss = None + while not session.should_stop(): + loss = session.run(train_op) + return loss diff --git a/tensorflow/contrib/training/python/training/training_test.py b/tensorflow/contrib/training/python/training/training_test.py new file mode 100644 index 00000000000..81de828a803 --- /dev/null +++ b/tensorflow/contrib/training/python/training/training_test.py @@ -0,0 +1,514 @@ +# Copyright 2016 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License.
+# ============================================================================== +"""Tests for tf.contrib.training.training.""" + +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import os + +import numpy as np +import tensorflow as tf + + +def logistic_classifier(inputs): + return tf.contrib.layers.fully_connected( + inputs, 1, activation_fn=tf.sigmoid) + + +def batchnorm_classifier(inputs): + inputs = tf.contrib.layers.batch_norm(inputs, decay=0.1) + return tf.contrib.layers.fully_connected(inputs, 1, activation_fn=tf.sigmoid) + + +class CreateTrainOpTest(tf.test.TestCase): + + def setUp(self): + np.random.seed(0) + + # Create an easy training set: + self._inputs = np.random.rand(16, 4).astype(np.float32) + self._labels = np.random.randint(0, 2, size=(16, 1)).astype(np.float32) + + def testUseUpdateOps(self): + with tf.Graph().as_default(): + tf.set_random_seed(0) + tf_inputs = tf.constant(self._inputs, dtype=tf.float32) + tf_labels = tf.constant(self._labels, dtype=tf.float32) + + expected_mean = np.mean(self._inputs, axis=(0)) + expected_var = np.var(self._inputs, axis=(0)) + + tf_predictions = batchnorm_classifier(tf_inputs) + tf.contrib.losses.log_loss(tf_predictions, tf_labels) + total_loss = tf.contrib.losses.get_total_loss() + optimizer = tf.train.GradientDescentOptimizer(learning_rate=1.0) + + train_op = tf.contrib.training.create_train_op(total_loss, optimizer) + + moving_mean = tf.contrib.framework.get_variables_by_name('moving_mean')[0] + moving_variance = tf.contrib.framework.get_variables_by_name( + 'moving_variance')[0] + + with tf.Session() as sess: + # Initialize all variables + sess.run(tf.initialize_all_variables()) + mean, variance = sess.run([moving_mean, moving_variance]) + # After initialization moving_mean == 0 and moving_variance == 1. + self.assertAllClose(mean, [0] * 4) + self.assertAllClose(variance, [1] * 4) + + for _ in range(10): + sess.run([train_op]) + mean = moving_mean.eval() + variance = moving_variance.eval() + # After 10 updates with decay 0.1 moving_mean == expected_mean and + # moving_variance == expected_var. + self.assertAllClose(mean, expected_mean) + self.assertAllClose(variance, expected_var) + + def testEmptyUpdateOps(self): + with tf.Graph().as_default(): + tf.set_random_seed(0) + tf_inputs = tf.constant(self._inputs, dtype=tf.float32) + tf_labels = tf.constant(self._labels, dtype=tf.float32) + + tf_predictions = batchnorm_classifier(tf_inputs) + tf.contrib.losses.log_loss(tf_predictions, tf_labels) + total_loss = tf.contrib.losses.get_total_loss() + optimizer = tf.train.GradientDescentOptimizer(learning_rate=1.0) + + train_op = tf.contrib.training.create_train_op( + total_loss, optimizer, update_ops=[]) + + moving_mean = tf.contrib.framework.get_variables_by_name('moving_mean')[0] + moving_variance = tf.contrib.framework.get_variables_by_name( + 'moving_variance')[0] + + with tf.Session() as sess: + # Initialize all variables + sess.run(tf.initialize_all_variables()) + mean, variance = sess.run([moving_mean, moving_variance]) + # After initialization moving_mean == 0 and moving_variance == 1. + self.assertAllClose(mean, [0] * 4) + self.assertAllClose(variance, [1] * 4) + + for _ in range(10): + sess.run([train_op]) + mean = moving_mean.eval() + variance = moving_variance.eval() + + # Since we skip update_ops the moving_vars are not updated. 
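The contract these two tests pin down comes from the `update_ops` barrier in `create_train_op`. An equivalent standalone pattern (a sketch only; it uses `tf.identity` where the implementation uses the internal `with_dependencies` helper):

```python
import tensorflow as tf

inputs = tf.placeholder(tf.float32, [None, 4])
net = tf.contrib.layers.batch_norm(inputs, decay=0.1)
total_loss = tf.reduce_mean(net)

update_ops = tf.get_collection(tf.GraphKeys.UPDATE_OPS)
if update_ops:
    # Force the batch-norm moving-average updates to run whenever the loss
    # is evaluated; passing update_ops=[] skips this, freezing the stats.
    with tf.control_dependencies(update_ops):
        total_loss = tf.identity(total_loss, name='update_barrier')
```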
+ self.assertAllClose(mean, [0] * 4) + self.assertAllClose(variance, [1] * 4) + + +class TrainBNClassifierTest(tf.test.TestCase): + + def setUp(self): + # Create an easy training set: + np.random.seed(0) + + self._inputs = np.zeros((16, 4)) + self._labels = np.random.randint(0, 2, size=(16, 1)).astype(np.float32) + self._logdir = os.path.join(self.get_temp_dir(), 'tmp_bnlogs/') + + for i in range(16): + j = int(2 * self._labels[i] + np.random.randint(0, 2)) + self._inputs[i, j] = 1 + + def testTrainWithNoInitAssignCanAchieveZeroLoss(self): + g = tf.Graph() + with g.as_default(): + tf.set_random_seed(0) + tf_inputs = tf.constant(self._inputs, dtype=tf.float32) + tf_labels = tf.constant(self._labels, dtype=tf.float32) + + tf_predictions = batchnorm_classifier(tf_inputs) + tf.contrib.losses.log_loss(tf_predictions, tf_labels) + total_loss = tf.contrib.losses.get_total_loss() + + optimizer = tf.train.GradientDescentOptimizer(learning_rate=1.0) + + train_op = tf.contrib.training.create_train_op( + total_loss, optimizer) + + loss = tf.contrib.training.train( + train_op, self._logdir, hooks=[ + tf.train.StopAtStepHook(num_steps=300) + ]) + self.assertLess(loss, .1) + + +class TrainTest(tf.test.TestCase): + + def setUp(self): + # Create an easy training set: + np.random.seed(0) + + self._inputs = np.zeros((16, 4)) + self._labels = np.random.randint(0, 2, size=(16, 1)).astype(np.float32) + + for i in range(16): + j = int(2 * self._labels[i] + np.random.randint(0, 2)) + self._inputs[i, j] = 1 + + def testCanAchieveZeroLoss(self): + logdir = os.path.join(self.get_temp_dir(), 'can_achieve_zero_loss') + + with tf.Graph().as_default(): + tf.set_random_seed(0) + tf_inputs = tf.constant(self._inputs, dtype=tf.float32) + tf_labels = tf.constant(self._labels, dtype=tf.float32) + + tf_predictions = logistic_classifier(tf_inputs) + tf.contrib.losses.log_loss(tf_predictions, tf_labels) + total_loss = tf.contrib.losses.get_total_loss() + + optimizer = tf.train.GradientDescentOptimizer(learning_rate=1.0) + + train_op = tf.contrib.training.create_train_op(total_loss, optimizer) + + loss = tf.contrib.training.train( + train_op, logdir, hooks=[ + tf.train.StopAtStepHook(num_steps=300) + ]) + self.assertIsNotNone(loss) + self.assertLess(loss, .015) + + def testTrainWithLocalVariable(self): + logdir = os.path.join(self.get_temp_dir(), 'train_with_local_variable') + + with tf.Graph().as_default(): + tf.set_random_seed(0) + tf_inputs = tf.constant(self._inputs, dtype=tf.float32) + tf_labels = tf.constant(self._labels, dtype=tf.float32) + + local_multiplier = tf.contrib.framework.local_variable(1.0) + + tf_predictions = logistic_classifier(tf_inputs) * local_multiplier + tf.contrib.losses.log_loss(tf_predictions, tf_labels) + total_loss = tf.contrib.losses.get_total_loss() + + optimizer = tf.train.GradientDescentOptimizer(learning_rate=1.0) + + train_op = tf.contrib.training.create_train_op( + total_loss, optimizer) + + loss = tf.contrib.training.train( + train_op, logdir, hooks=[ + tf.train.StopAtStepHook(num_steps=300) + ]) + self.assertIsNotNone(loss) + self.assertLess(loss, .015) + + def testResumeTrainAchievesRoughlyTheSameLoss(self): + number_of_steps = [300, 1, 5] + logdir = os.path.join(self.get_temp_dir(), 'resume_train_same_loss') + + for i in range(len(number_of_steps)): + with tf.Graph().as_default(): + tf.set_random_seed(i) + tf_inputs = tf.constant(self._inputs, dtype=tf.float32) + tf_labels = tf.constant(self._labels, dtype=tf.float32) + + tf_predictions = logistic_classifier(tf_inputs) + 
tf.contrib.losses.log_loss(tf_predictions, tf_labels) + total_loss = tf.contrib.losses.get_total_loss() + + optimizer = tf.train.GradientDescentOptimizer(learning_rate=1.0) + + train_op = tf.contrib.training.create_train_op( + total_loss, optimizer) + + saver = tf.train.Saver() + + loss = tf.contrib.training.train( + train_op, logdir, hooks=[ + tf.train.StopAtStepHook(num_steps=number_of_steps[i]), + tf.train.CheckpointSaverHook( + logdir, save_steps=50, saver=saver), + ]) + self.assertIsNotNone(loss) + self.assertLess(loss, .015) + + def create_train_op(self, learning_rate=1.0, gradient_multiplier=1.0): + tf_inputs = tf.constant(self._inputs, dtype=tf.float32) + tf_labels = tf.constant(self._labels, dtype=tf.float32) + + tf_predictions = logistic_classifier(tf_inputs) + tf.contrib.losses.log_loss(tf_predictions, tf_labels) + total_loss = tf.contrib.losses.get_total_loss() + + optimizer = tf.train.GradientDescentOptimizer( + learning_rate=learning_rate) + + def transform_grads_fn(grads): + if gradient_multiplier != 1.0: + variables = tf.trainable_variables() + gradient_multipliers = {var: gradient_multiplier for var in variables} + + with tf.name_scope('multiply_grads'): + return tf.contrib.training.multiply_gradients( + grads, gradient_multipliers) + else: + return grads + + return tf.contrib.training.create_train_op( + total_loss, optimizer, transform_grads_fn=transform_grads_fn) + + def testTrainWithInitFromCheckpoint(self): + logdir1 = os.path.join(self.get_temp_dir(), 'tmp_logs1/') + logdir2 = os.path.join(self.get_temp_dir(), 'tmp_logs2/') + + if tf.gfile.Exists(logdir1): # For running on jenkins. + tf.gfile.DeleteRecursively(logdir1) + if tf.gfile.Exists(logdir2): # For running on jenkins. + tf.gfile.DeleteRecursively(logdir2) + + # First, train the model one step (make sure the error is high). + with tf.Graph().as_default(): + tf.set_random_seed(0) + train_op = self.create_train_op() + saver = tf.train.Saver() + loss = tf.contrib.training.train( + train_op, logdir1, hooks=[ + tf.train.CheckpointSaverHook(logdir1, save_steps=1, saver=saver), + tf.train.StopAtStepHook(num_steps=1), + ], save_checkpoint_secs=None) + self.assertGreater(loss, .5) + + # Next, train the model to convergence. + with tf.Graph().as_default(): + tf.set_random_seed(1) + train_op = self.create_train_op() + saver = tf.train.Saver() + loss = tf.contrib.training.train( + train_op, logdir1, hooks=[ + tf.train.CheckpointSaverHook(logdir1, save_steps=1, saver=saver), + tf.train.StopAtStepHook(num_steps=300), + ], save_checkpoint_secs=None) + self.assertIsNotNone(loss) + self.assertLess(loss, .02) + + # Finally, advance the model a single step and validate that the loss is + # still low. 
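The `transform_grads_fn` hook in the helper above is the intended plug-in point for gradient rewrites. A self-contained sketch (variable and scale values illustrative) of wiring `multiply_gradients` through it:

```python
import tensorflow as tf

var = tf.Variable(1.0, name='w')
loss = tf.square(var - 3.0)
optimizer = tf.train.GradientDescentOptimizer(learning_rate=0.1)

def transform_grads_fn(grads):
    # Keys may be Variables or their op names; scale w's gradient by 10.
    return tf.contrib.training.multiply_gradients(grads, {var: 10.0})

train_op = tf.contrib.training.create_train_op(
    loss, optimizer, transform_grads_fn=transform_grads_fn)
```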
+ with tf.Graph().as_default(): + tf.set_random_seed(2) + train_op = self.create_train_op() + + model_variables = tf.all_variables() + model_path = os.path.join(logdir1, 'model.ckpt-300') + + assign_fn = tf.contrib.framework.assign_from_checkpoint_fn( + model_path, model_variables) + def init_fn(_, session): + assign_fn(session) + + loss = tf.contrib.training.train( + train_op, + logdir2, + scaffold=tf.train.Scaffold(init_fn=init_fn), + hooks=[tf.train.StopAtStepHook(num_steps=1)]) + + self.assertIsNotNone(loss) + self.assertLess(loss, .02) + + def ModelLoss(self): + tf_inputs = tf.constant(self._inputs, dtype=tf.float32) + tf_labels = tf.constant(self._labels, dtype=tf.float32) + + tf_predictions = logistic_classifier(tf_inputs) + tf.contrib.losses.log_loss(tf_predictions, tf_labels) + return tf.contrib.losses.get_total_loss() + + def testTrainAllVarsHasLowerLossThanTrainSubsetOfVars(self): + logdir = os.path.join(self.get_temp_dir(), 'tmp_logs3/') + if tf.gfile.Exists(logdir): # For running on jenkins. + tf.gfile.DeleteRecursively(logdir) + + # First, train only the weights of the model. + with tf.Graph().as_default(): + tf.set_random_seed(0) + total_loss = self.ModelLoss() + optimizer = tf.train.GradientDescentOptimizer(learning_rate=1.0) + weights = tf.contrib.framework.get_variables_by_name('weights') + + train_op = tf.contrib.training.create_train_op( + total_loss, + optimizer, + variables_to_train=weights) + + saver = tf.train.Saver() + loss = tf.contrib.training.train( + train_op, logdir, hooks=[ + tf.train.CheckpointSaverHook(logdir, save_steps=1, saver=saver), + tf.train.StopAtStepHook(num_steps=200), + ]) + self.assertGreater(loss, .015) + self.assertLess(loss, .05) + + # Next, train the biases of the model. + with tf.Graph().as_default(): + tf.set_random_seed(1) + total_loss = self.ModelLoss() + optimizer = tf.train.GradientDescentOptimizer(learning_rate=1.0) + biases = tf.contrib.framework.get_variables_by_name('biases') + + train_op = tf.contrib.training.create_train_op( + total_loss, + optimizer, + variables_to_train=biases) + + saver = tf.train.Saver() + loss = tf.contrib.training.train( + train_op, logdir, hooks=[ + tf.train.CheckpointSaverHook(logdir, save_steps=1, saver=saver), + tf.train.StopAtStepHook(num_steps=300), + ]) + self.assertGreater(loss, .015) + self.assertLess(loss, .05) + + # Finally, train both weights and bias to get lower loss. + with tf.Graph().as_default(): + tf.set_random_seed(2) + total_loss = self.ModelLoss() + optimizer = tf.train.GradientDescentOptimizer(learning_rate=1.0) + + train_op = tf.contrib.training.create_train_op(total_loss, optimizer) + saver = tf.train.Saver() + loss = tf.contrib.training.train( + train_op, logdir, hooks=[ + tf.train.CheckpointSaverHook(logdir, save_steps=1, saver=saver), + tf.train.StopAtStepHook(num_steps=400), + ]) + self.assertIsNotNone(loss) + self.assertLess(loss, .015) + + def testTrainingSubsetsOfVariablesOnlyUpdatesThoseVariables(self): + # First, train only the weights of the model. 
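Before the weights-only and biases-only runs below, it is worth isolating the warm-start recipe from testTrainWithInitFromCheckpoint above: restoration happens through the scaffold's `init_fn`, not through a hook. A sketch (checkpoint path illustrative):

```python
import tensorflow as tf

assign_fn = tf.contrib.framework.assign_from_checkpoint_fn(
    '/tmp/logs1/model.ckpt-300', tf.all_variables())

def init_fn(scaffold, session):  # Scaffold calls init_fn(scaffold, session).
    assign_fn(session)

scaffold = tf.train.Scaffold(init_fn=init_fn)
# Then: tf.contrib.training.train(train_op, logdir, scaffold=scaffold, ...)
```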
+ with tf.Graph().as_default(): + tf.set_random_seed(0) + total_loss = self.ModelLoss() + optimizer = tf.train.GradientDescentOptimizer(learning_rate=1.0) + weights, biases = tf.contrib.framework.get_variables() + + train_op = tf.contrib.training.create_train_op(total_loss, optimizer) + train_weights = tf.contrib.training.create_train_op( + total_loss, optimizer, variables_to_train=[weights]) + train_biases = tf.contrib.training.create_train_op( + total_loss, optimizer, variables_to_train=[biases]) + + with tf.Session() as sess: + # Initialize the variables. + sess.run(tf.initialize_all_variables()) + + # Get the initial weights and biases values. + weights_values, biases_values = sess.run([weights, biases]) + self.assertGreater(np.linalg.norm(weights_values), 0) + self.assertAlmostEqual(np.linalg.norm(biases_values), 0) + + # Update weights and biases. + loss = sess.run(train_op) + self.assertGreater(loss, .5) + new_weights, new_biases = sess.run([weights, biases]) + + # Check that the weights and biases have been updated. + self.assertGreater(np.linalg.norm(weights_values - new_weights), 0) + self.assertGreater(np.linalg.norm(biases_values - new_biases), 0) + + weights_values, biases_values = new_weights, new_biases + + # Update only weights. + loss = sess.run(train_weights) + self.assertGreater(loss, .5) + new_weights, new_biases = sess.run([weights, biases]) + + # Check that the weights have been updated, but biases have not. + self.assertGreater(np.linalg.norm(weights_values - new_weights), 0) + self.assertAlmostEqual(np.linalg.norm(biases_values - new_biases), 0) + weights_values = new_weights + + # Update only biases. + loss = sess.run(train_biases) + self.assertGreater(loss, .5) + new_weights, new_biases = sess.run([weights, biases]) + + # Check that the biases have been updated, but weights have not. + self.assertAlmostEqual(np.linalg.norm(weights_values - new_weights), 0) + self.assertGreater(np.linalg.norm(biases_values - new_biases), 0) + + def testTrainWithAlteredGradients(self): + # Use the same learning rate but different gradient multipliers + # to train two models. The model with the equivalently larger + # learning rate (i.e., learning_rate * gradient_multiplier) has smaller + # training loss. + logdir1 = os.path.join(self.get_temp_dir(), 'tmp_logs6/') + logdir2 = os.path.join(self.get_temp_dir(), 'tmp_logs7/') + + if tf.gfile.Exists(logdir1): + tf.gfile.DeleteRecursively(logdir1) + if tf.gfile.Exists(logdir2): + tf.gfile.DeleteRecursively(logdir2) + + multipliers = [1., 1000.] + number_of_steps = 10 + losses = [] + learning_rate = 0.001 + + # First, train the model with equivalently smaller learning rate. + with tf.Graph().as_default(): + tf.set_random_seed(0) + train_op = self.create_train_op( + learning_rate=learning_rate, + gradient_multiplier=multipliers[0]) + + saver = tf.train.Saver() + + loss = tf.contrib.training.train( + train_op, logdir1, hooks=[ + tf.train.StopAtStepHook(num_steps=number_of_steps), + tf.train.CheckpointSaverHook(logdir1, save_steps=50, saver=saver), + ]) + + losses.append(loss) + self.assertGreater(loss, .5) + + # Second, train the model with equivalently larger learning rate.
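The comparison the second run below sets up reduces to simple arithmetic: for gradient descent, scaling every gradient by m is equivalent to scaling the learning rate by m, so the two runs behave like learning rates of 0.001 and 1.0.

```python
learning_rate = 0.001
multipliers = [1., 1000.]
# Effective step size of each run: lr * multiplier.
print([learning_rate * m for m in multipliers])  # [0.001, 1.0]
```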
+ with tf.Graph().as_default(): + tf.set_random_seed(0) + train_op = self.create_train_op( + learning_rate=learning_rate, + gradient_multiplier=multipliers[1]) + saver = tf.train.Saver() + + loss = tf.contrib.training.train( + train_op, logdir2, hooks=[ + tf.train.StopAtStepHook(num_steps=number_of_steps), + tf.train.CheckpointSaverHook(logdir2, save_steps=50, saver=saver), + ]) + + losses.append(loss) + self.assertIsNotNone(loss) + self.assertLess(loss, .5) + + # The loss of the model trained with larger learning rate should + # be smaller. + self.assertGreater(losses[0], losses[1]) + + +if __name__ == '__main__': + tf.test.main() diff --git a/tensorflow/core/BUILD b/tensorflow/core/BUILD index 6c2fec6412a..065a7c7b489 100644 --- a/tensorflow/core/BUILD +++ b/tensorflow/core/BUILD @@ -221,13 +221,6 @@ cc_library( ], ) -cc_library( - name = "jpeg", - hdrs = ["lib/jpeg/jpeg_mem.h"], - visibility = ["//visibility:public"], - deps = [":jpeg_internal"], -) - # Test support library needed for all tests # This is currently public, but may be made internal in the # future. Try to avoid depending on it. @@ -700,9 +693,9 @@ filegroup( "platform/cuda.h", "platform/google/**/*", "platform/hadoop/**/*", - "platform/jpeg.*", - "platform/png.*", - "platform/gif.*", + "platform/gif.h", + "platform/jpeg.h", + "platform/png.h", "platform/stream_executor.*", "platform/windows/**/*", "user_ops/**/*.cu.cc", @@ -982,7 +975,10 @@ cc_library( ], exclude = [ "**/*test*", + "lib/gif/**/*", "lib/jpeg/**/*", + "platform/gif.h", + "platform/jpeg.h", "platform/**/cuda.h", "platform/**/stream_executor.h", "platform/load_library.cc", @@ -999,7 +995,10 @@ cc_library( ], exclude = [ "**/*test*", + "lib/gif/**/*", "lib/jpeg/**/*", + "platform/gif.h", + "platform/jpeg.h", "platform/**/cuda.h", "platform/**/stream_executor.h", ], @@ -1017,7 +1016,6 @@ cc_library( hdrs = tf_additional_lib_hdrs() + [ "lib/core/blocking_counter.h", "lib/core/refcount.h", - "lib/gif/gif_io.h", "lib/gtl/edit_distance.h", "lib/gtl/int_type.h", "lib/gtl/iterator_range.h", @@ -1061,18 +1059,32 @@ cc_library( ], ) +cc_library( + name = "gif_internal", + srcs = [ + "lib/gif/gif_io.cc", + "platform/gif.h", + ], + hdrs = ["lib/gif/gif_io.h"], + copts = tf_copts(), + linkopts = ["-ldl"], + deps = [ + ":lib", + "//tensorflow/core/platform/default/build_config:gif", + ], +) + cc_library( name = "jpeg_internal", - srcs = glob( - [ - "lib/jpeg/*h", - "lib/jpeg/*.cc", - ], - exclude = [ - "**/*test*", - ], - ), - hdrs = ["lib/jpeg/jpeg_handle.h"], + srcs = [ + "lib/jpeg/jpeg_handle.cc", + "lib/jpeg/jpeg_mem.cc", + "platform/jpeg.h", + ], + hdrs = [ + "lib/jpeg/jpeg_handle.h", + "lib/jpeg/jpeg_mem.h", + ], copts = tf_copts(), linkopts = ["-ldl"], deps = [ @@ -1569,7 +1581,6 @@ cc_test( srcs = ["lib/jpeg/jpeg_mem_unittest.cc"], data = glob(["lib/jpeg/testdata/*.jpg"]), deps = [ - ":jpeg", ":jpeg_internal", ":lib", ":lib_internal", diff --git a/tensorflow/core/common_runtime/device_factory.cc b/tensorflow/core/common_runtime/device_factory.cc index 84362d4b8ab..efbdf6bbb19 100644 --- a/tensorflow/core/common_runtime/device_factory.cc +++ b/tensorflow/core/common_runtime/device_factory.cc @@ -78,7 +78,7 @@ DeviceFactory* DeviceFactory::GetFactory(const string& device_type) { Status DeviceFactory::AddDevices(const SessionOptions& options, const string& name_prefix, std::vector* devices) { - // CPU first. + // CPU first. A CPU device is required. 
auto cpu_factory = GetFactory("CPU"); if (!cpu_factory) { return errors::NotFound( @@ -90,7 +90,7 @@ Status DeviceFactory::AddDevices(const SessionOptions& options, return errors::NotFound("No CPU devices are available in this process"); } - // Then the rest. + // Then the rest (including GPU). mutex_lock l(*get_device_factory_lock()); for (auto& p : device_factories()) { auto factory = p.second.factory.get(); diff --git a/tensorflow/core/common_runtime/gpu/gpu_device.cc b/tensorflow/core/common_runtime/gpu/gpu_device.cc index e9c48a36e0f..37ab43d90b0 100644 --- a/tensorflow/core/common_runtime/gpu/gpu_device.cc +++ b/tensorflow/core/common_runtime/gpu/gpu_device.cc @@ -72,56 +72,6 @@ namespace tensorflow { // corresponding stream have completed. The following two classes // serve this purpose in two different compilation environments. -#if defined(__GCUDACC__) || defined(__GCUDACC_HOST__) -class EigenAllocator : public ::Eigen::Allocator { - public: - EigenAllocator() {} - - void Reinitialize(OpKernelContext* context, gpu::Stream* stream, - ::tensorflow::Allocator* alloc, EventMgr* em) { - if (LogMemory::IsEnabled()) { - operation_ = context->op_kernel().name() + "/EigenAllocator"; - step_id_ = context->step_id(); - } - stream_ = stream; - allocator_ = alloc; - em_ = em; - } - - void* allocate(size_t num_bytes) const override { - void* ret = allocator_->AllocateRaw(32 /* alignment */, num_bytes); - // Eigen doesn't typically check the return pointer from allocate, - // so we do it here and die with a more helpful error message. - if (ret == nullptr) { - LOG(FATAL) << "EigenAllocator for GPU ran out of memory when allocating " - << num_bytes << ". See error logs for more detailed info."; - } - if (LogMemory::IsEnabled()) { - LogMemory::RecordRawAllocation(operation_, step_id_, num_bytes, ret, - allocator_); - } - return ret; - } - - void deallocate(void* buffer) const override { - if (LogMemory::IsEnabled()) { - LogMemory::RecordRawDeallocation(operation_, step_id_, buffer, allocator_, - true); - } - em_->ThenDeleteBuffer(stream_, {allocator_, buffer, operation_, step_id_}); - } - - private: - string operation_; - int64 step_id_; - gpu::Stream* stream_; // Not owned. - ::tensorflow::Allocator* allocator_; // Not owned. - ::tensorflow::EventMgr* em_; // Not owned. 
- - TF_DISALLOW_COPY_AND_ASSIGN(EigenAllocator); -}; - -#else class EigenCudaStreamDevice : public ::Eigen::StreamInterface { public: EigenCudaStreamDevice() : scratch_(nullptr), semaphore_(nullptr) { @@ -216,8 +166,6 @@ class EigenCudaStreamDevice : public ::Eigen::StreamInterface { TF_DISALLOW_COPY_AND_ASSIGN(EigenCudaStreamDevice); }; -#endif - BaseGPUDevice::BaseGPUDevice(const SessionOptions& options, const string& name, Bytes memory_limit, const DeviceLocality& locality, int gpu_id, const string& physical_device_desc, @@ -515,24 +463,6 @@ Status BaseGPUDevice::MakeTensorFromProto(const TensorProto& tensor_proto, } namespace { -#if defined(__GCUDACC__) || defined(__GCUDACC_HOST__) -class ConcretePerOpGpuDevice : public PerOpGpuDevice { - public: - ConcretePerOpGpuDevice() : device_(nullptr) {} - void Reinitialize(OpKernelContext* context, gpu::Stream* stream, - Allocator* base_allocator, ::tensorflow::EventMgr* em, - char* scratch) { - allocator_.Reinitialize(context, stream, base_allocator, em); - device_.Reinitialize(stream, &allocator_, scratch); - } - - const Eigen::GpuDevice& device() const override { return device_; } - - private: - EigenAllocator allocator_; - Eigen::GpuDevice device_; -}; -#else class ConcretePerOpGpuDevice : public PerOpGpuDevice { public: ConcretePerOpGpuDevice() : device_(&stream_device_) {} @@ -549,7 +479,6 @@ class ConcretePerOpGpuDevice : public PerOpGpuDevice { EigenCudaStreamDevice stream_device_; Eigen::GpuDevice device_; }; -#endif } // namespace void BaseGPUDevice::ReinitializeDevice(OpKernelContext* context, @@ -558,15 +487,10 @@ void BaseGPUDevice::ReinitializeDevice(OpKernelContext* context, ConcretePerOpGpuDevice* concrete_device = static_cast(device); DCHECK(concrete_device); -#if defined(__GCUDACC__) || defined(__GCUDACC_HOST__) - concrete_device->Reinitialize(context, streams_[stream_id].compute, allocator, - em_.get(), scratch_[stream_id]); -#else const cudaStream_t* cuda_stream = reinterpret_cast( streams_[stream_id].compute->implementation()->CudaStreamMemberHack()); concrete_device->Reinitialize(context, cuda_stream, gpu_id_, allocator, scratch_[stream_id]); -#endif } PerOpGpuDevice* BaseGPUDevice::MakeGpuDevice() { diff --git a/tensorflow/core/common_runtime/graph_runner.cc b/tensorflow/core/common_runtime/graph_runner.cc index 81cedf57d54..c93ff1cdde8 100644 --- a/tensorflow/core/common_runtime/graph_runner.cc +++ b/tensorflow/core/common_runtime/graph_runner.cc @@ -46,12 +46,6 @@ std::unique_ptr GetCPUDevice(Env* env) { return nullptr; } -thread::ThreadPool* GetThreadPool(Env* env) { - static thread::ThreadPool* thread_pool = - new thread::ThreadPool(env, "GraphRunnerCompute", 1); - return thread_pool; -} - // A simple rendezvous class. // Assumes a single sender and a single receiver, no duplicate sends, and no // sends of dead tensors. @@ -113,10 +107,8 @@ Status GraphRunner::Run(Graph* graph, FunctionLibraryRuntime* function_library, CopyGraph(*graph, graph_to_run.get()); std::unique_ptr device = GetCPUDevice(env); - thread::ThreadPool* thread_pool = GetThreadPool(env); - if (!device || !thread_pool) { - return errors::NotFound( - "Cannot find a device and/or a thread pool for GraphRunner."); + if (!device) { + return errors::NotFound("Cannot find a device for GraphRunner."); } SimpleRendezvous* rendez = new SimpleRendezvous; @@ -142,9 +134,10 @@ Status GraphRunner::Run(Graph* graph, FunctionLibraryRuntime* function_library, // Create the local executor and the Rendezvous for fetching back the // constants. 
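In Python terms, the GraphRunner change that follows swaps a dedicated one-thread pool for inline execution on the caller's thread; a sketch of the idea, not the C++:

```python
# GraphRunner only evaluates small constant-folding subgraphs, so running
# each closure directly is simpler and no slower than a one-thread pool.
def runner(closure):
    closure()
```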
- auto runner = [thread_pool](Executor::Args::Closure c) { - thread_pool->Schedule(c); - }; + + // Run operators on the local thread. We should not need concurrency here; we + // should not be running expensive operators. + auto runner = [](Executor::Args::Closure c) { c(); }; // Take ownership and pass to NewLocalExecutor Graph* g = graph_to_run.release(); diff --git a/tensorflow/core/common_runtime/simple_placer.cc b/tensorflow/core/common_runtime/simple_placer.cc index fda429b52a0..721e73898b7 100644 --- a/tensorflow/core/common_runtime/simple_placer.cc +++ b/tensorflow/core/common_runtime/simple_placer.cc @@ -815,9 +815,11 @@ void SimplePlacer::AssignAndLog(const string& assigned_device, node->set_assigned_device_name(assigned_device); // Log placement if log_device_placement is set. if (options_ && options_->config.log_device_placement()) { - printf("%s: %s\n", node->name().c_str(), + printf("%s: (%s): %s\n", node->name().c_str(), + node->type_string().c_str(), node->assigned_device_name().c_str()); - LOG(INFO) << node->name() << ": " << node->assigned_device_name(); + LOG(INFO) << node->name() << ": " << "(" << node->type_string() << ")" + << node->assigned_device_name(); } } diff --git a/tensorflow/core/distributed_runtime/master.cc b/tensorflow/core/distributed_runtime/master.cc index cf9deaabd8c..741282be31b 100644 --- a/tensorflow/core/distributed_runtime/master.cc +++ b/tensorflow/core/distributed_runtime/master.cc @@ -282,6 +282,7 @@ void Master::ExtendSession(const ExtendSessionRequest* req, done(errors::Aborted("Session ", req->session_handle(), " is not found.")); return; } + mu_.unlock(); SchedClosure([session, req, resp, done]() { Status status = ValidateExternalGraphDefSyntax(req->graph_def()); @@ -290,7 +291,22 @@ void Master::ExtendSession(const ExtendSessionRequest* req, } done(status); }); +} + +void Master::PartialRunSetup(const PartialRunSetupRequest* req, + PartialRunSetupResponse* resp, MyClosure done) { + mu_.lock(); + MasterSession* session = gtl::FindPtrOrNull(sessions_, req->session_handle()); + if (session == nullptr) { + mu_.unlock(); + done(errors::Aborted("Session ", req->session_handle(), " is not found.")); + return; + } mu_.unlock(); + + SchedClosure([this, session, req, resp, done]() { + done(session->PartialRunSetup(req, resp)); + }); } void Master::RunStep(CallOptions* opts, const RunStepRequest* req, @@ -303,6 +319,7 @@ void Master::RunStep(CallOptions* opts, const RunStepRequest* req, done(errors::Aborted("Session ", req->session_handle(), " is not found.")); return; } + mu_.unlock(); SchedClosure([this, start_time, session, opts, req, resp, done]() { Status status = session->Run(opts, req, resp); @@ -312,7 +329,6 @@ void Master::RunStep(CallOptions* opts, const RunStepRequest* req, last_1000_steps_.AddValue((done_time - start_time) / 1e9); ++step_count_; }); - mu_.unlock(); } void Master::CloseSession(const CloseSessionRequest* req, diff --git a/tensorflow/core/distributed_runtime/master.h b/tensorflow/core/distributed_runtime/master.h index a44ee6352a4..10875d80d40 100644 --- a/tensorflow/core/distributed_runtime/master.h +++ b/tensorflow/core/distributed_runtime/master.h @@ -46,6 +46,9 @@ class Master { void ExtendSession(const ExtendSessionRequest* req, ExtendSessionResponse* resp, MyClosure done); + void PartialRunSetup(const PartialRunSetupRequest* req, + PartialRunSetupResponse* resp, MyClosure done); + void RunStep(CallOptions* opts, const RunStepRequest* req, RunStepResponse* resp, MyClosure done); diff --git 
a/tensorflow/core/distributed_runtime/master_interface.h b/tensorflow/core/distributed_runtime/master_interface.h index ec9218e2133..6b405f8eaa5 100644 --- a/tensorflow/core/distributed_runtime/master_interface.h +++ b/tensorflow/core/distributed_runtime/master_interface.h @@ -17,6 +17,7 @@ limitations under the License. #define TENSORFLOW_CORE_DISTRIBUTED_RUNTIME_MASTER_INTERFACE_H_ #include "tensorflow/core/distributed_runtime/call_options.h" +#include "tensorflow/core/lib/core/errors.h" #include "tensorflow/core/lib/core/status.h" #include "tensorflow/core/protobuf/master.pb.h" @@ -37,6 +38,12 @@ class MasterInterface { const ExtendSessionRequest* request, ExtendSessionResponse* response) = 0; + virtual Status PartialRunSetup(CallOptions* call_options, + const PartialRunSetupRequest* request, + PartialRunSetupResponse* response) { + return errors::Unimplemented("Partial run not implemented for this master"); + } + virtual Status RunStep(CallOptions* call_options, const RunStepRequest* request, RunStepResponse* response) = 0; diff --git a/tensorflow/core/distributed_runtime/master_session.cc b/tensorflow/core/distributed_runtime/master_session.cc index 6f3b7841785..cacaf838165 100644 --- a/tensorflow/core/distributed_runtime/master_session.cc +++ b/tensorflow/core/distributed_runtime/master_session.cc @@ -50,18 +50,6 @@ limitations under the License. namespace tensorflow { -// A little bit of per-step state. -struct PerStepState { - bool collect_costs = false; - bool collect_timeline = false; - bool collect_rpcs = false; - Microseconds start_micros = Microseconds(0); - Microseconds end_micros = Microseconds(0); - std::vector<StepStats> step_stats; // per partition - StepStats rpc_stats; // for RPC layer - CostGraphDef cost_graph; -}; - // MasterSession wraps SimpleClientGraph in a reference counted object. // This way, MasterSession can clear up the cache mapping Run requests to // compiled graphs while the compiled graph is still being used. @@ -72,15 +60,38 @@ class MasterSession::ReffedClientGraph : public core::RefCounted { ReffedClientGraph(const string& handle, const BuildGraphOptions& bopts, std::unique_ptr<SimpleClientGraph> cg, const SessionOptions& session_opts, - StatsPublisherFactory stats_publisher_factory) + StatsPublisherFactory stats_publisher_factory, + SimpleGraphExecutionState* execution_state, bool is_partial) : session_handle_(handle), client_graph_(std::move(cg)), bopts_(bopts), - session_opts_(session_opts) { + session_opts_(session_opts), + is_partial_(is_partial) { VLOG(1) << "Created ReffedClientGraph for node with " << client_graph_->graph.num_node_ids(); stats_publisher_ = stats_publisher_factory(handle, bopts, session_opts); + + // If this is a partial run we need to initialize a name to node map for + // testing that fetches are reachable. + if (is_partial) { + std::unordered_set names; + for (const string& input : bopts.feed_endpoints) { + TensorId id(ParseTensorName(input)); + names.emplace(id.first); + } + for (const string& output : bopts.fetch_endpoints) { + TensorId id(ParseTensorName(output)); + names.emplace(id.first); + } + // We use the graph from the execution_state because we want the graph + // nodes before they are rewritten by the rewriter.
+ for (Node* n : execution_state->full_graph()->nodes()) { + if (names.count(n->name()) > 0) { + name_to_node_.insert({n->name(), n}); + } + } + } } ~ReffedClientGraph() override { DeregisterPartitions(); } @@ -171,7 +182,7 @@ class MasterSession::ReffedClientGraph : public core::RefCounted { SimpleGraphExecutionState* execution_state, PerStepState* pss, CallOptions* opts, const RunStepRequest& req, RunStepResponse* resp, - CancellationManager* cm); + CancellationManager* cm, const bool is_last_partial_run); // Calls workers to cleanup states for the step "step_id". Calls // `done` when all cleanup RPCs have completed. @@ -185,6 +196,9 @@ class MasterSession::ReffedClientGraph : public core::RefCounted { void ProcessDeviceStats(ProfileHandler* ph, const SimpleGraphExecutionState* execution_state, const DeviceStepStats& ds, bool is_rpc); + // Checks that the requested fetches can be computed from the provided feeds. + Status CheckFetches(const RunStepRequest& req, const RunState* run_state, + SimpleGraphExecutionState* execution_state); string DetailText(const NodeDef& def, const NodeExecStats& ns) { int64 tot = 0; @@ -209,6 +223,8 @@ class MasterSession::ReffedClientGraph : public core::RefCounted { std::unordered_set nodes_needing_input_mapping_; BuildGraphOptions bopts_; const SessionOptions session_opts_; + const bool is_partial_; + std::unordered_map name_to_node_; // Graph partitioned into per-location subgraphs. struct Part { @@ -483,15 +499,14 @@ class RunManyGraphs { TF_DISALLOW_COPY_AND_ASSIGN(RunManyGraphs); }; - Status MasterSession::ReffedClientGraph::RunPartitions( const MasterEnv* env, int64 step_id, int64 execution_count, SimpleGraphExecutionState* execution_state, PerStepState* pss, CallOptions* call_opts, const RunStepRequest& req, RunStepResponse* resp, - CancellationManager* cm) { + CancellationManager* cm, const bool is_last_partial_run) { VLOG(2) << "RunPartitions step_id " << step_id << " execution_count " << execution_count; - // Builds an index for feeds provided by the client. + // Build an index for feeds provided by the client. std::unordered_map feeds(3); @@ -524,26 +539,64 @@ Status MasterSession::ReffedClientGraph::RunPartitions( for (int i = 0; i < num; ++i) { const Part& part = partitions_[i]; RunManyGraphs::Call* c = calls.get(i); + if (is_partial_) { + c->req.set_is_partial(is_partial_); + c->req.set_is_last_partial_run(is_last_partial_run); + } c->req.set_graph_handle(part.graph_handle); c->req.set_step_id(step_id); *c->req.mutable_exec_opts() = exec_opts; // If any feeds are provided, send the feed values together // in the RunGraph request. - for (const auto& feed_key : part.feed_key) { - const string& feed = feed_key.first; - const string& key = feed_key.second; - const TensorProto* val = feeds[feed]; - if (val == nullptr) { - return errors::InvalidArgument("No feed is provided for feed=", feed, - ", key=", key); + // In the partial case, we only want to include feeds provided in the req. + // In the non-partial case, all feeds in the request are in the part. + // We keep these as separate paths for now, to ensure we aren't + // inadvertently slowing down the normal run path. + if (is_partial_) { + for (const auto& feed : req.feed()) { + const string& name = feed.name(); + auto iter = part.feed_key.find(name); + if (iter == part.feed_key.end()) { + // The provided feed must be for a different partition. 
+        continue;
+      }
+      const string& key = iter->second;
+      const TensorProto* val = feeds[name];
+      if (val == nullptr) {
+        return errors::InvalidArgument("No feed is provided for feed=", name,
+                                       ", key=", key);
+      }
+      auto* send = c->req.add_send();
+      send->set_key(key);
+      *(send->mutable_val()) = *val;  // TODO(mrry): make it faster if needed.
+    }
+    // TODO(suharshs): Make a map from feed to fetch_key to make this faster.
+    // For now, we just iterate through partitions to find the matching key.
+    for (const auto& req_fetch : req.fetch()) {
+      for (const auto& key_fetch : part.key_fetch) {
+        if (key_fetch.second == req_fetch) {
+          c->req.add_recv_key(key_fetch.first);
+          break;
+        }
+      }
+    }
+  } else {
+    for (const auto& feed_key : part.feed_key) {
+      const string& feed = feed_key.first;
+      const string& key = feed_key.second;
+      const TensorProto* val = feeds[feed];
+      if (val == nullptr) {
+        return errors::InvalidArgument("No feed is provided for feed=", feed,
+                                       ", key=", key);
+      }
+      auto* send = c->req.add_send();
+      send->set_key(key);
+      *(send->mutable_val()) = *val;  // TODO(mrry): make it faster if needed.
+    }
+    for (const auto& key_fetch : part.key_fetch) {
+      const string& key = key_fetch.first;
+      c->req.add_recv_key(key);
     }
-    auto* send = c->req.add_send();
-    send->set_key(key);
-    *(send->mutable_val()) = *val;  // TODO(mrry): make it faster if needed.
-  }
-  for (const auto& key_fetch : part.key_fetch) {
-    const string& key = key_fetch.first;
-    c->req.add_recv_key(key);
   }
 }
@@ -762,6 +815,64 @@ void MasterSession::ReffedClientGraph::ProcessDeviceStats(
   }
 }
 
+// TODO(suharshs): Merge with CheckFetches in DirectSession.
+// TODO(suharsh,mrry): Build a map from fetch target to set of feeds it depends
+// on once at setup time to prevent us from computing the dependencies
+// every time.
+Status MasterSession::ReffedClientGraph::CheckFetches(
+    const RunStepRequest& req, const RunState* run_state,
+    SimpleGraphExecutionState* execution_state) {
+  // Build the set of pending feeds that we haven't seen.
+  std::unordered_set<TensorId, TensorId::Hasher> pending_feeds;
+  for (const string& feed : run_state->pending_inputs) {
+    TensorId id(ParseTensorName(feed));
+    auto it = name_to_node_.find(id.first);
+    if (it == name_to_node_.end()) {
+      return errors::NotFound("Feed ", feed, ": not found");
+    }
+    pending_feeds.insert(id);
+  }
+  for (const auto& feed : req.feed()) {
+    TensorId id(ParseTensorName(feed.name()));
+    pending_feeds.erase(id);
+  }
+
+  // Initialize the stack with the fetch nodes.
+  std::vector<const Node*> stack;
+  for (const string& fetch : req.fetch()) {
+    TensorId id(ParseTensorName(fetch));
+    auto it = name_to_node_.find(id.first);
+    if (it == name_to_node_.end()) {
+      return errors::NotFound("Fetch ", fetch, ": not found");
+    }
+    stack.push_back(it->second);
+  }
+
+  // Any tensor needed for fetches can't be in pending_feeds.
+  // We need to use the original full graph from execution state.
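+  // Worked example on a hypothetical chain a -> b -> c: if "a:0" is still a
+  // pending feed, fetching "c:0" must fail, because the reverse traversal
+  // below reaches node "a" before its value has been fed.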
+ const Graph* graph = execution_state->full_graph(); + std::vector visited(graph->num_node_ids(), false); + while (!stack.empty()) { + const Node* n = stack.back(); + stack.pop_back(); + + for (const Edge* in_edge : n->in_edges()) { + const Node* in_node = in_edge->src(); + if (pending_feeds.count({in_node->name(), in_edge->src_output()}) > 0) { + return errors::InvalidArgument("Fetch ", in_node->name(), ":", + in_edge->src_output(), + " can't be computed from the feeds" + " that have been fed so far."); + } + if (!visited[in_node->id()]) { + visited[in_node->id()] = true; + stack.push_back(in_node); + } + } + } + return Status::OK(); +} + // Asynchronously deregisters subgraphs on the workers, without waiting for the // result. void MasterSession::ReffedClientGraph::DeregisterPartitions() { @@ -803,6 +914,23 @@ void BuildBuildGraphOptions(const RunStepRequest& req, std::sort(opts->fetch_endpoints.begin(), opts->fetch_endpoints.end()); } +void BuildBuildGraphOptions(const PartialRunSetupRequest& req, + BuildGraphOptions* opts) { + for (const auto& feed : req.feed()) { + opts->feed_endpoints.push_back(feed); + } + for (const auto& fetch : req.fetch()) { + opts->fetch_endpoints.push_back(fetch); + } + for (const auto& target : req.target()) { + opts->target_nodes.push_back(target); + } + + std::sort(opts->feed_endpoints.begin(), opts->feed_endpoints.end()); + std::sort(opts->target_nodes.begin(), opts->target_nodes.end()); + std::sort(opts->fetch_endpoints.begin(), opts->fetch_endpoints.end()); +} + uint64 HashBuildGraphOptions(const BuildGraphOptions& opts) { uint64 h = 0x2b992ddfa23249d6ull; for (const string& name : opts.feed_endpoints) { @@ -927,11 +1055,9 @@ Status MasterSession::Extend(const ExtendSessionRequest* req, return Status::OK(); } -Status MasterSession::StartStep(const RunStepRequest& req, - BuildGraphOptions* opts, int64* count, - ReffedClientGraph** rcg) { - BuildBuildGraphOptions(req, opts); - const uint64 hash = HashBuildGraphOptions(*opts); +Status MasterSession::StartStep(const BuildGraphOptions& opts, int64* count, + ReffedClientGraph** rcg, bool is_partial) { + const uint64 hash = HashBuildGraphOptions(opts); ReffedClientGraph* to_unref = nullptr; { mutex_lock l(mu_); @@ -944,12 +1070,12 @@ Status MasterSession::StartStep(const RunStepRequest& req, // We have not seen this subgraph before. Build the subgraph and // cache it. 
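  // (The cache key is HashBuildGraphOptions(opts) over the sorted feed,
  // fetch, and target endpoints, so two RunStep calls naming the same
  // endpoints share one compiled ReffedClientGraph.)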
VLOG(1) << "Unseen hash " << hash << " for " - << BuildGraphOptionsString(*opts); + << BuildGraphOptionsString(opts); std::unique_ptr client_graph; - TF_RETURN_IF_ERROR(execution_state_->BuildGraph(*opts, &client_graph)); - auto entry = - new ReffedClientGraph(handle_, *opts, std::move(client_graph), - session_opts_, stats_publisher_factory_); + TF_RETURN_IF_ERROR(execution_state_->BuildGraph(opts, &client_graph)); + auto entry = new ReffedClientGraph( + handle_, opts, std::move(client_graph), session_opts_, + stats_publisher_factory_, execution_state_.get(), is_partial); iter = runs_.insert({hash, entry}).first; auto obs_iter = obsolete_.find(hash); if (obs_iter != obsolete_.end()) { @@ -979,6 +1105,47 @@ void MasterSession::ClearRunsTable(std::vector* to_unref, rcg_map->clear(); } +Status MasterSession::PartialRunSetup(const PartialRunSetupRequest* req, + PartialRunSetupResponse* resp) { + std::vector inputs, outputs, targets; + for (const auto& feed : req->feed()) { + inputs.push_back(feed); + } + for (const auto& fetch : req->fetch()) { + outputs.push_back(fetch); + } + for (const auto& target : req->target()) { + targets.push_back(target); + } + + string handle = std::to_string(partial_run_handle_counter_.fetch_add(1)); + + ReffedClientGraph* rcg = nullptr; + int64 count = 0; + + // Prepare. + BuildGraphOptions opts; + BuildBuildGraphOptions(*req, &opts); + TF_RETURN_IF_ERROR(StartStep(opts, &count, &rcg, true)); + // Keeps the highest 8 bits 0x01: we reserve some bits of the + // step_id for future use. + uint64 step_id = (random::New64() & ((1uLL << 56) - 1)) | (1uLL << 56); + TRACEPRINTF("stepid %llu", step_id); + + rcg->Ref(); + RunState* run_state = new RunState(inputs, outputs, rcg, step_id, count); + { + mutex_lock l(mu_); + partial_runs_.emplace( + std::make_pair(handle, std::unique_ptr(run_state))); + } + + TF_RETURN_IF_ERROR(BuildAndRegisterPartitions(rcg)); + + resp->set_partial_run_handle(handle); + return Status::OK(); +} + Status MasterSession::Run(CallOptions* opts, const RunStepRequest* req, RunStepResponse* resp) { UpdateLastAccessTime(); @@ -986,7 +1153,12 @@ Status MasterSession::Run(CallOptions* opts, const RunStepRequest* req, mutex_lock l(mu_); ++num_running_; } - Status status = DoRunWithLocalExecution(opts, req, resp); + Status status; + if (!req->partial_run_handle().empty()) { + status = DoPartialRun(opts, req, resp); + } else { + status = DoRunWithLocalExecution(opts, req, resp); + } { mutex_lock l(mu_); --num_running_; @@ -997,23 +1169,7 @@ Status MasterSession::Run(CallOptions* opts, const RunStepRequest* req, return status; } -Status MasterSession::DoRunWithLocalExecution(CallOptions* opts, - const RunStepRequest* req, - RunStepResponse* resp) { - VLOG(2) << "DoRunWithLocalExecution " - << "req: " << req->DebugString(); - PerStepState pss; - pss.start_micros = Env::Default()->NowMicros(); - - // Prepare. - BuildGraphOptions bgopts; - ReffedClientGraph* rcg = nullptr; - int64 count = 0; - TF_RETURN_IF_ERROR(StartStep(*req, &bgopts, &count, &rcg)); - - // Unref "rcg" when out of scope. - core::ScopedUnref unref(rcg); - +Status MasterSession::BuildAndRegisterPartitions(ReffedClientGraph* rcg) { // Registers subgraphs if haven't done so. 
 PartitionOptions popts;
 popts.node_to_loc = SplitByWorker;
@@ -1051,12 +1207,136 @@ Status MasterSession::DoRunWithLocalExecution(CallOptions* opts,
   TF_RETURN_IF_ERROR(rcg->RegisterPartitions(
       env_, popts, rcg->client_graph()->flib_def->ToProto()));
 
+  return Status::OK();
+}
+
+Status MasterSession::DoPartialRun(CallOptions* opts, const RunStepRequest* req,
+                                   RunStepResponse* resp) {
+  const string& prun_handle = req->partial_run_handle();
+  RunState* run_state = nullptr;
+  {
+    mutex_lock l(mu_);
+    auto it = partial_runs_.find(prun_handle);
+    if (it == partial_runs_.end()) {
+      return errors::InvalidArgument(
+          "Must run PartialRunSetup before performing partial runs");
+    }
+    run_state = it->second.get();
+  }
+
+  // If this is the first partial run, initialize the PerStepState.
+  if (!run_state->step_started) {
+    run_state->step_started = true;
+    PerStepState pss;
+
+    auto count = run_state->count;
+    pss.collect_timeline =
+        req->options().trace_level() == RunOptions::FULL_TRACE;
+
+    // Build the cost model every 'build_cost_model_every' steps after skipping
+    // an initial 'build_cost_model_after' steps.
+    const int64 build_cost_model_after =
+        session_opts_.config.graph_options().build_cost_model_after();
+    const int64 build_cost_model_every =
+        session_opts_.config.graph_options().build_cost_model();
+    pss.collect_costs =
+        build_cost_model_every > 0 &&
+        ((count + 1 - build_cost_model_after) % build_cost_model_every == 0);
+
+    std::unique_ptr<ProfileHandler> ph = run_state->rcg->GetProfileHandler(
+        run_state->step_id, count, req->options());
+    if (ph) {
+      pss.collect_timeline = true;
+      pss.collect_rpcs = ph->should_collect_rpcs();
+    }
+
+    run_state->pss = std::move(pss);
+    run_state->ph = std::move(ph);
+  }
+
+  // Make sure that this is a new set of feeds that are still pending.
+  for (const auto& feed : req->feed()) {
+    auto it = run_state->pending_inputs.find(feed.name());
+    if (it == run_state->pending_inputs.end()) {
+      return errors::InvalidArgument("The feed ", feed.name(),
+                                     " had already been fed.");
+    }
+  }
+  // Check that this is a new set of fetches that are still pending.
+  for (const auto& fetch : req->fetch()) {
+    auto it = run_state->pending_outputs.find(fetch);
+    if (it == run_state->pending_outputs.end()) {
+      return errors::InvalidArgument("The fetch ", fetch,
+                                     " had already been fetched.");
+    }
+  }
+
+  // Ensure that the requested fetches can be computed from the provided feeds.
+  TF_RETURN_IF_ERROR(
+      run_state->rcg->CheckFetches(*req, run_state, execution_state_.get()));
+
+  // Determine if this partial run satisfies all the pending inputs and outputs.
+  for (const auto& feed : req->feed()) {
+    run_state->pending_inputs.erase(feed.name());
+  }
+  for (const auto& fetch : req->fetch()) {
+    run_state->pending_outputs.erase(fetch);
+  }
+  bool is_last_partial_run =
+      (run_state->pending_inputs.empty() && run_state->pending_outputs.empty());
+
+  Status s = run_state->rcg->RunPartitions(
+      env_, run_state->step_id, run_state->count, execution_state_.get(),
+      &run_state->pss, opts, *req, resp, cancellation_manager_,
+      is_last_partial_run);
+
+  // Delete the run state if there is an error or all fetches are done.
+  if (!s.ok() || is_last_partial_run) {
+    ReffedClientGraph* rcg = run_state->rcg;
+    run_state->pss.end_micros = Env::Default()->NowMicros();
+    // Schedule post-processing and cleanup to be done asynchronously.
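+    // (The Ref() below keeps rcg alive until the cleanup callback has run;
+    // the callback Unrefs it and erases the handle from partial_runs_.)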
+    rcg->Ref();
+    rcg->ProcessStats(env_, run_state->step_id, &run_state->pss,
+                      execution_state_.get(), run_state->ph.get(), *req, resp);
+    rcg->CleanupPartitionsAsync(
+        run_state->step_id, [this, rcg, prun_handle](const Status& s) {
+          if (!s.ok()) {
+            LOG(ERROR) << "Cleanup partition error: " << s;
+          }
+          rcg->Unref();
+          mutex_lock l(mu_);
+          partial_runs_.erase(prun_handle);
+        });
+  }
+  return s;
+}
+
+Status MasterSession::DoRunWithLocalExecution(CallOptions* opts,
+                                              const RunStepRequest* req,
+                                              RunStepResponse* resp) {
+  VLOG(2) << "DoRunWithLocalExecution "
+          << "req: " << req->DebugString();
+  PerStepState pss;
+  pss.start_micros = Env::Default()->NowMicros();
+
+  // Prepare.
+  BuildGraphOptions bgopts;
+  BuildBuildGraphOptions(*req, &bgopts);
+  ReffedClientGraph* rcg = nullptr;
+  int64 count = 0;
+  TF_RETURN_IF_ERROR(StartStep(bgopts, &count, &rcg, false));
+
+  // Unref "rcg" when out of scope.
+  core::ScopedUnref unref(rcg);
+
+  TF_RETURN_IF_ERROR(BuildAndRegisterPartitions(rcg));
+
   // Keeps the highest 8 bits 0x01: we reserve some bits of the
   // step_id for future use.
   const uint64 step_id = (random::New64() & ((1uLL << 56) - 1)) | (1uLL << 56);
   TRACEPRINTF("stepid %llu", step_id);
 
-  std::unique_ptr<ProfileHandler> ph;
   pss.collect_timeline = req->options().trace_level() == RunOptions::FULL_TRACE;
 
   // Build the cost model every 'build_cost_model_every' steps after skipping an
@@ -1069,15 +1349,16 @@ Status MasterSession::DoRunWithLocalExecution(CallOptions* opts,
       build_cost_model_every > 0 &&
       ((count + 1 - build_cost_model_after) % build_cost_model_every == 0);
 
-  ph = rcg->GetProfileHandler(step_id, count, req->options());
+  std::unique_ptr<ProfileHandler> ph =
+      rcg->GetProfileHandler(step_id, count, req->options());
   if (ph) {
     pss.collect_timeline = true;
     pss.collect_rpcs = ph->should_collect_rpcs();
   }
 
-  TF_RETURN_IF_ERROR(rcg->RunPartitions(env_, step_id, count,
-                                        execution_state_.get(), &pss, opts,
-                                        *req, resp, cancellation_manager_));
+  TF_RETURN_IF_ERROR(
+      rcg->RunPartitions(env_, step_id, count, execution_state_.get(), &pss,
+                         opts, *req, resp, cancellation_manager_, false));
 
   pss.end_micros = Env::Default()->NowMicros();
@@ -1110,4 +1391,22 @@ Status MasterSession::Close() {
   return Status::OK();
 }
 
+MasterSession::RunState::RunState(const std::vector<string>& input_names,
+                                  const std::vector<string>& output_names,
+                                  ReffedClientGraph* rcg, const uint64 step_id,
+                                  const int64 count)
+    : rcg(rcg), step_id(step_id), count(count) {
+  // Initially all the feeds and fetches are pending.
+  for (auto& name : input_names) {
+    pending_inputs.emplace(name);
+  }
+  for (auto& name : output_names) {
+    pending_outputs.emplace(name);
+  }
+}
+
+MasterSession::RunState::~RunState() {
+  if (rcg) rcg->Unref();
+}
+
 }  // end namespace tensorflow
diff --git a/tensorflow/core/distributed_runtime/master_session.h b/tensorflow/core/distributed_runtime/master_session.h
index e17614c819d..96d759d9c8d 100644
--- a/tensorflow/core/distributed_runtime/master_session.h
+++ b/tensorflow/core/distributed_runtime/master_session.h
@@ -16,6 +16,7 @@ limitations under the License.
 #ifndef TENSORFLOW_CORE_DISTRIBUTED_RUNTIME_MASTER_SESSION_H_
 #define TENSORFLOW_CORE_DISTRIBUTED_RUNTIME_MASTER_SESSION_H_
 
+#include <atomic>
 #include <vector>
 
 #include "tensorflow/core/common_runtime/device_set.h"
@@ -72,6 +73,10 @@ class MasterSession {
   // Extend() may block the caller thread for a long time.
   Status Extend(const ExtendSessionRequest* req, ExtendSessionResponse* resp);
 
+  // Sets up a partial run call.
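+  // A typical client sequence (hypothetical tensor names):
+  //   PartialRunSetup(feeds={"a", "b"}, fetches={"c"})  -> handle
+  //   Run(handle, feed "a")             // first partial step
+  //   Run(handle, feed "b", fetch "c")  // last step; state is torn down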
+ Status PartialRunSetup(const PartialRunSetupRequest* req, + PartialRunSetupResponse* resp); + // Run one step. Status Run(CallOptions* opts, const RunStepRequest* req, RunStepResponse* resp); @@ -101,6 +106,8 @@ class MasterSession { std::atomic_ulong last_access_time_usec_; + std::atomic partial_run_handle_counter_ = {0}; + mutex mu_; std::unique_ptr execution_state_; int64 graph_version_; @@ -115,6 +122,36 @@ class MasterSession { RCGMap runs_ GUARDED_BY(mu_); RCGMap obsolete_ GUARDED_BY(mu_); + struct PerStepState { + bool collect_costs = false; + bool collect_timeline = false; + bool collect_rpcs = false; + Microseconds start_micros = Microseconds(0); + Microseconds end_micros = Microseconds(0); + std::vector step_stats; // per partition + StepStats rpc_stats; // for RPC layer + CostGraphDef cost_graph; + }; + + struct RunState { + std::unordered_set pending_inputs; + std::unordered_set pending_outputs; + ReffedClientGraph* rcg = nullptr; + uint64 step_id; + int64 count = 0; + PerStepState pss; + std::unique_ptr ph; + bool step_started = false; + + RunState(const std::vector& input_names, + const std::vector& output_names, ReffedClientGraph* rcg, + const uint64 step_id, const int64 count); + + ~RunState(); + }; + std::unordered_map> partial_runs_ + GUARDED_BY(mu_); + // Active RunStep calls. condition_variable num_running_is_zero_; int32 num_running_ GUARDED_BY(mu_) = 0; @@ -131,14 +168,18 @@ class MasterSession { // Private dtor. The client must call Close(). virtual ~MasterSession(); - Status StartStep(const RunStepRequest& req, BuildGraphOptions* opts, - int64* count, ReffedClientGraph** graph); + Status StartStep(const BuildGraphOptions& opts, int64* count, + ReffedClientGraph** graph, bool is_partial); void ClearRunsTable(std::vector* to_unref, RCGMap* rcg_map) EXCLUSIVE_LOCKS_REQUIRED(mu_); Status DoRunWithLocalExecution(CallOptions* opts, const RunStepRequest* req, RunStepResponse* resp); + Status DoPartialRun(CallOptions* opts, const RunStepRequest* req, + RunStepResponse* resp); void UpdateLastAccessTime(); + Status BuildAndRegisterPartitions(ReffedClientGraph* rcg); + TF_DISALLOW_COPY_AND_ASSIGN(MasterSession); }; diff --git a/tensorflow/core/framework/common_shape_fns.cc b/tensorflow/core/framework/common_shape_fns.cc index f3a71a73f7e..cc6cd10a084 100644 --- a/tensorflow/core/framework/common_shape_fns.cc +++ b/tensorflow/core/framework/common_shape_fns.cc @@ -70,8 +70,6 @@ Status Get3dOutputSize(const std::array& input, namespace shape_inference { -namespace { - Status GetWindowedOutputSizeFromDims( shape_inference::InferenceContext* c, shape_inference::DimensionHandle input_size, @@ -97,7 +95,6 @@ Status GetWindowedOutputSizeFromDims( } return Status::OK(); } -} // namespace Status UnchangedShape(shape_inference::InferenceContext* c) { c->set_output(0, c->input(0)); diff --git a/tensorflow/core/framework/common_shape_fns.h b/tensorflow/core/framework/common_shape_fns.h index 2e711f5277b..176ea3519d8 100644 --- a/tensorflow/core/framework/common_shape_fns.h +++ b/tensorflow/core/framework/common_shape_fns.h @@ -96,6 +96,13 @@ Status Get3dOutputSize(const std::array& input, namespace shape_inference { +// Like GetWindowedOutputSize, but deals with DimensionHandles. +Status GetWindowedOutputSizeFromDims(InferenceContext* c, + DimensionHandle input_size, + DimensionOrConstant filter_size, + int64 stride, Padding padding_type, + DimensionHandle* output_size); + // Transfers shape of input(0) to output(0). 
Status UnchangedShape(shape_inference::InferenceContext* c); diff --git a/tensorflow/core/framework/op_kernel.h b/tensorflow/core/framework/op_kernel.h index 432e2ad2f6e..4a66d43e505 100644 --- a/tensorflow/core/framework/op_kernel.h +++ b/tensorflow/core/framework/op_kernel.h @@ -132,7 +132,7 @@ class OpKernel { // We allow legacy scalars within Google up until GraphDef version 6. // TODO(irving): Remove when we can drop support for GraphDef version 5. bool allow_legacy_scalars() const { -#if defined(PLATFORM_GOOGLE) +#if defined(PLATFORM_GOOGLE) || defined(PLATFORM_GOOGLE_ANDROID) return graph_def_version_ < 6; #else return false; diff --git a/tensorflow/core/framework/shape_inference.cc b/tensorflow/core/framework/shape_inference.cc index 4aa32f6a841..f6475e07366 100644 --- a/tensorflow/core/framework/shape_inference.cc +++ b/tensorflow/core/framework/shape_inference.cc @@ -31,11 +31,20 @@ InferenceContext::InferenceContext( const NodeDef* node_def, const OpDef& op_def, const std::vector& input_shapes, const std::vector& input_tensors, - const std::vector& input_tensors_as_shapes, + const std::vector& input_tensors_as_shapes, const std::vector& input_handle_shapes, const std::vector& input_handle_dtypes) : node_def_(*CHECK_NOTNULL(node_def)) { - PreInputInit(op_def, input_tensors, input_tensors_as_shapes); + std::vector input_tensors_as_shape_handles; + for (const TensorShapeProto& p : input_tensors_as_shapes) { + ShapeHandle shape; + construction_status_.Update(MakeShapeFromShapeProto(p, &shape)); + if (!construction_status_.ok()) { + return; + } + input_tensors_as_shape_handles.push_back(shape); + } + PreInputInit(op_def, input_tensors, input_tensors_as_shape_handles); if (!construction_status_.ok()) return; for (const TensorShapeProto& p : input_shapes) { ShapeHandle shape; diff --git a/tensorflow/core/framework/shape_inference.h b/tensorflow/core/framework/shape_inference.h index e02490efd92..1a8107ef00d 100644 --- a/tensorflow/core/framework/shape_inference.h +++ b/tensorflow/core/framework/shape_inference.h @@ -164,7 +164,7 @@ class InferenceContext { InferenceContext(const NodeDef* node_def, const OpDef& op_def, const std::vector& input_shapes, const std::vector& input_tensors, - const std::vector& input_tensors_as_shapes, + const std::vector& input_tensors_as_shapes, const std::vector& input_handle_shapes, const std::vector& input_handle_dtypes); diff --git a/tensorflow/core/framework/tensor.h b/tensorflow/core/framework/tensor.h index 47d74d4defc..43e44e7a96e 100644 --- a/tensorflow/core/framework/tensor.h +++ b/tensorflow/core/framework/tensor.h @@ -435,6 +435,7 @@ class Tensor { friend class VariableOp; // For access to set_shape friend class AutoReloadVariableOp; // For access to set_shape friend class TensorTestHelper; // For access to set_shape + template friend class CreateVariableOp; // Creates a tensor with the input datatype, shape and buf. 
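A minimal sketch of how a shape function might use the newly exported
GetWindowedOutputSizeFromDims declared in the common_shape_fns.h hunk above
(the op, the NHWC layout, and the window/stride constants here are assumptions
for illustration only, not part of this patch):

    #include "tensorflow/core/framework/common_shape_fns.h"
    #include "tensorflow/core/lib/core/errors.h"

    namespace tensorflow {

    // Hypothetical pooling-style shape function: the output row count follows
    // from the input rows, a window of 3, a stride of 2, and SAME padding.
    Status ExampleWindowedShapeFn(shape_inference::InferenceContext* c) {
      shape_inference::ShapeHandle input;
      TF_RETURN_IF_ERROR(c->WithRank(c->input(0), 4, &input));  // assume NHWC
      shape_inference::DimensionHandle out_rows;
      TF_RETURN_IF_ERROR(shape_inference::GetWindowedOutputSizeFromDims(
          c, c->Dim(input, 1), 3 /* filter_size */, 2 /* stride */, SAME,
          &out_rows));
      shape_inference::ShapeHandle output;
      TF_RETURN_IF_ERROR(c->ReplaceDim(input, 1, out_rows, &output));
      c->set_output(0, output);
      return Status::OK();
    }

    }  // namespace tensorflow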
diff --git a/tensorflow/core/kernels/BUILD b/tensorflow/core/kernels/BUILD index 1954ebdc108..a84eaad3152 100644 --- a/tensorflow/core/kernels/BUILD +++ b/tensorflow/core/kernels/BUILD @@ -389,16 +389,11 @@ cc_header_only_library( # OpKernel libraries ---------------------------------------------------------- ARRAY_DEPS = [ - ":batch_space_ops", ":bounds_check", ":concat_lib", - ":cuda_device_array", - ":depth_space_ops", - ":extract_image_patches_op", ":fill_functor", ":gather_functor", ":ops_util", - ":split_lib", ":strided_slice_op", ":transpose_functor", "//tensorflow/core:array_grad", @@ -426,6 +421,13 @@ tf_kernel_libraries( tf_kernel_libraries( name = "array", + libs = [ + ":batch_space_ops", + ":depth_space_ops", + ":extract_image_patches_op", + ":split_op", + ":unpack_op", + ], prefixes = [ "bcast_ops", "bitcast_op", @@ -450,16 +452,27 @@ tf_kernel_libraries( "reverse_sequence_op", "shape_ops", "slice_op", - "split_op", "tile_ops", "transpose_op", "unique_op", - "unpack_op", "where_op", ], deps = ARRAY_DEPS, ) +tf_kernel_library( + name = "split_op", + gpu_srcs = ["cuda_device_array.h"], + prefix = "split_op", + deps = ARRAY_DEPS + [":split_lib"], +) + +tf_kernel_library( + name = "unpack_op", + prefix = "unpack_op", + deps = ARRAY_DEPS + [":split_lib"], +) + tf_cc_test( name = "batch_norm_op_test", size = "small", @@ -886,16 +899,16 @@ tf_cc_test( tf_kernel_libraries( name = "data_flow", + libs = [ + ":dynamic", + ":lookup", + ], prefixes = [ - "dynamic_partition_op", - "dynamic_stitch_op", "conditional_accumulator_base_op", "conditional_accumulator_op", "barrier_ops", "fifo_queue_op", "priority_queue_op", - "lookup_table_init_op", - "lookup_table_op", "padding_fifo_queue_op", "queue_ops", "random_shuffle_queue_op", @@ -930,6 +943,40 @@ tf_kernel_libraries( ], ) +tf_kernel_libraries( + name = "dynamic", + prefixes = [ + "dynamic_partition_op", + "dynamic_stitch_op", + ], + deps = [ + ":bounds_check", + "//tensorflow/core:core_cpu", + "//tensorflow/core:data_flow_ops_op_lib", + "//tensorflow/core:framework", + "//tensorflow/core:lib", + "//tensorflow/core:lib_internal", + ], +) + +tf_kernel_libraries( + name = "lookup", + prefixes = [ + "lookup_table_init_op", + "lookup_table_op", + ], + deps = [ + ":bounds_check", + ":initializable_lookup_table", + ":lookup_util", + "//tensorflow/core:core_cpu", + "//tensorflow/core:data_flow_ops_op_lib", + "//tensorflow/core:framework", + "//tensorflow/core:lib", + "//tensorflow/core:lib_internal", + ], +) + tf_cc_tests( size = "small", srcs = [ @@ -1089,8 +1136,9 @@ tf_kernel_libraries( ":eigen_helpers", ":image_resizer_state", "//tensorflow/core:framework", + "//tensorflow/core:gif_internal", "//tensorflow/core:image_ops_op_lib", - "//tensorflow/core:jpeg", + "//tensorflow/core:jpeg_internal", "//tensorflow/core:lib", "//tensorflow/core:lib_internal", "//tensorflow/core:protos_all_cc", @@ -1607,12 +1655,14 @@ tf_kernel_library( tf_kernel_libraries( name = "nn", + libs = [ + ":l2loss_op", + ], prefixes = [ "batch_norm_op", "bias_op", "fused_batch_norm_op", "in_topk_op", - "l2loss_op", "lrn_op", "relu_op", "softmax_op", @@ -1641,6 +1691,19 @@ tf_kernel_libraries( ]), ) +tf_kernel_library( + name = "l2loss_op", + prefix = "l2loss_op", + deps = [ + "//tensorflow/core:framework", + "//tensorflow/core:lib", + "//tensorflow/core:lib_internal", + "//tensorflow/core:nn_grad", + "//tensorflow/core:nn_ops_op_lib", + "//third_party/eigen3", + ], +) + tf_cuda_cc_test( name = "lrn_op_test", srcs = ["lrn_op_test.cc"], @@ -2037,11 +2100,13 @@ 
tf_kernel_libraries( "count_up_to_op", "dense_update_ops", "scatter_op", + "scatter_nd_op", "variable_ops", ], deps = [ ":assign_op", ":bounds_check", + ":fill_functor", ":scatter_functor", "//tensorflow/core:framework", "//tensorflow/core:lib", @@ -2055,6 +2120,7 @@ tf_cc_test( size = "small", srcs = ["scatter_op_test.cc"], deps = [ + ":fill_functor", ":ops_testutil", ":ops_util", ":scatter_op", @@ -2067,6 +2133,23 @@ tf_cc_test( ], ) +tf_cc_test( + name = "scatter_nd_op_test", + size = "small", + srcs = ["scatter_nd_op_test.cc"], + deps = [ + ":ops_testutil", + ":ops_util", + ":scatter_nd_op", + "//tensorflow/core:framework", + "//tensorflow/core:lib", + "//tensorflow/core:protos_all_cc", + "//tensorflow/core:test", + "//tensorflow/core:test_main", + "//tensorflow/core:testlib", + ], +) + tf_kernel_libraries( name = "string", prefixes = [ @@ -2509,6 +2592,7 @@ filegroup( "debug_ops.*", # Ops excluded because they do not build correctly for Android. # See b/29213790 + "scatter_nd_op*", "sparse_matmul_op.*", ], ), diff --git a/tensorflow/core/kernels/conv_ops_gpu_3.cu.cc b/tensorflow/core/kernels/conv_ops_gpu_3.cu.cc index d9882764fb6..dca0073a9ab 100644 --- a/tensorflow/core/kernels/conv_ops_gpu_3.cu.cc +++ b/tensorflow/core/kernels/conv_ops_gpu_3.cu.cc @@ -221,9 +221,16 @@ __global__ void SwapDimension1And2InTensor3UsingTiles(const T* input, tile_height = input_dims[1] - (input_dims_in_tiles[1] - 1) * TileSize; } + int input_flat_index = input_origin_flat_index + x; + // Load the data from input memory to the shared memory tile. - if (x < tile_width) { - int input_flat_index = input_origin_flat_index + x; + if (TF_PREDICT_TRUE(tile_height == TileSize && tile_width == TileSize)) { +#pragma unroll + for (int y = 0; y < TileSize; y++) { + shared_memory_tile[y][x] = input[input_flat_index]; + input_flat_index += input_dims[2]; + } + } else if (x < tile_width) { for (int y = 0; y < tile_height; y++) { shared_memory_tile[y][x] = input[input_flat_index]; input_flat_index += input_dims[2]; @@ -247,7 +254,13 @@ __global__ void SwapDimension1And2InTensor3UsingTiles(const T* input, int output_flat_index = output_origin_flat_index + x; // Load the data from the shared memory tile to the output memory. - if (x < tile_height) { + if (TF_PREDICT_TRUE(tile_height == TileSize && tile_width == TileSize)) { +#pragma unroll + for (int y = 0; y < TileSize; y++) { + output[output_flat_index] = shared_memory_tile[x][y]; + output_flat_index += output_dims[2]; + } + } else if (x < tile_height) { for (int y = 0; y < tile_width; y++) { output[output_flat_index] = shared_memory_tile[x][y]; output_flat_index += output_dims[2]; diff --git a/tensorflow/core/kernels/cwise_op_gpu_log1p.cu.cc b/tensorflow/core/kernels/cwise_op_gpu_log1p.cu.cc new file mode 100644 index 00000000000..d09224c70e0 --- /dev/null +++ b/tensorflow/core/kernels/cwise_op_gpu_log1p.cu.cc @@ -0,0 +1,26 @@ +/* Copyright 2016 The TensorFlow Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. 
+==============================================================================*/ + +#if GOOGLE_CUDA + +#include "tensorflow/core/kernels/cwise_ops_gpu_common.cu.h" + +namespace tensorflow { +namespace functor { +DEFINE_UNARY3(log1p, Eigen::half, float, double); +} // namespace functor +} // namespace tensorflow + +#endif // GOOGLE_CUDA diff --git a/tensorflow/core/kernels/cwise_op_log1p.cc b/tensorflow/core/kernels/cwise_op_log1p.cc new file mode 100644 index 00000000000..91a14989e64 --- /dev/null +++ b/tensorflow/core/kernels/cwise_op_log1p.cc @@ -0,0 +1,24 @@ +/* Copyright 2016 The TensorFlow Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +==============================================================================*/ + +#include "tensorflow/core/kernels/cwise_ops_common.h" + +namespace tensorflow { +REGISTER5(UnaryOp, CPU, "Log1p", functor::log1p, float, Eigen::half, double, + complex64, complex128); +#if GOOGLE_CUDA +REGISTER3(UnaryOp, GPU, "Log1p", functor::log1p, float, Eigen::half, double); +#endif +} // namespace tensorflow diff --git a/tensorflow/core/kernels/cwise_ops.h b/tensorflow/core/kernels/cwise_ops.h index 572a729b34b..b038d73e171 100644 --- a/tensorflow/core/kernels/cwise_ops.h +++ b/tensorflow/core/kernels/cwise_ops.h @@ -454,6 +454,9 @@ struct exp : base > {}; template struct log : base > {}; +template +struct log1p : base > {}; + template struct sign : base > {}; diff --git a/tensorflow/core/kernels/hexagon/BUILD b/tensorflow/core/kernels/hexagon/BUILD index 869728c06f9..2ca2210d1f2 100644 --- a/tensorflow/core/kernels/hexagon/BUILD +++ b/tensorflow/core/kernels/hexagon/BUILD @@ -30,6 +30,7 @@ tf_cc_test( name = "quantized_matmul_op_for_hexagon_test", size = "small", srcs = ["quantized_matmul_op_for_hexagon_test.cc"], + tags = ["nomsan"], # http://b/32242946 deps = [ "//tensorflow/core:framework", "//tensorflow/core:protos_all_cc", diff --git a/tensorflow/core/kernels/hexagon/graph_transferer.cc b/tensorflow/core/kernels/hexagon/graph_transferer.cc index bf91c7678f7..6836cc88ef7 100644 --- a/tensorflow/core/kernels/hexagon/graph_transferer.cc +++ b/tensorflow/core/kernels/hexagon/graph_transferer.cc @@ -27,6 +27,13 @@ static constexpr bool DBG = false; static constexpr const char* const INPUTS_NODE_PREFIX = "inputs_for_"; static constexpr const char* const OUTPUTS_NODE_PREFIX = "outputs_for_"; static constexpr const char* const DATA_NODE_PREFIX = "data_for_op_"; +static constexpr const char* const CONST_SHAPE_PREFIX = "const_shape_"; +static constexpr const char* const PADDING_PREFIX = "NN_PAD_"; +static constexpr const char* const PADDING_ATTR_NAME = "padding"; +static constexpr const char* const STRIDES_ATTR_NAME = "strides"; +static constexpr const char* const KSIZE_ATTR_NAME = "ksize"; +static constexpr const char* const PADDING_VALID_STR = "VALID"; +static constexpr const char* const PADDING_SAME_STR = "SAME"; void GraphTransferer::LoadGraphFromProto(const GraphDef& graph_def) { ImportGraphDefOptions opts; @@ -63,6 +70,11 @@ 
GraphTransferer::GetConstNodeParams() const { return const_node_transfer_params_list_; } +const std::vector& +GraphTransferer::GetOpNodeParams() const { + return node_transfer_params_list_; +} + int GraphTransferer::CacheNode(const Node& node) { if (node_name_to_id_cache_map_.count(node.name()) > 0) { if (DBG) { @@ -107,6 +119,8 @@ void GraphTransferer::RegisterNode(const ShapeRefiner& shape_refiner, } } else if (node.IsConstant()) { RegisterConstantNode(shape_refiner, node); + } else if (HasPaddingAndStrides(node)) { + RegisterNodeWithPaddingAndStrides(shape_refiner, node); } else { // TODO(satok): register params for nodes which are supported by SOC if (DBG) { @@ -134,8 +148,6 @@ void GraphTransferer::RegisterConstantNode(const ShapeRefiner& shape_refiner, CHECK(context->ValueKnown(num_elements_dim)); const int64 num_output_elements = context->Value(num_elements_dim); const int data_size = max_bytes_per_data * num_output_elements; - const int rank = context->Rank(shape_handle); - CHECK(rank == 0); const std::array shape = BuildShapeArray(shape_handle, context); const_node_transfer_params_list_.emplace_back( @@ -146,6 +158,52 @@ void GraphTransferer::RegisterConstantNode(const ShapeRefiner& shape_refiner, data_size}); } +int GraphTransferer::RegisterConstantShape(const std::vector& shape) { + // TODO(satok): Handle non-4dim strides + CHECK(shape.size() == 4); + const string shape_name = + std::string(CONST_SHAPE_PREFIX) + std::to_string(shape.at(0)) + 'x' + + std::to_string(shape.at(1)) + 'x' + std::to_string(shape.at(2)) + 'x' + + std::to_string(shape.at(3)); + if (node_name_to_id_cache_map_.count(shape_name) <= 0) { + node_name_cache_list_.emplace_back(nullptr); + const int id = node_name_cache_list_.size() - 1; + node_name_to_id_cache_map_.emplace(shape_name, id); + const_node_transfer_params_list_.emplace_back(ConstNodeTransferParams{ + shape_name, id, {{shape[0], shape[1], shape[2], shape[3]}}, "", 0}); + } + return node_name_to_id_cache_map_[shape_name]; +} + +bool GraphTransferer::HasPaddingAndStrides(const Node& node) { + return node.def().attr().count(PADDING_ATTR_NAME) > 0 && + node.def().attr().count(STRIDES_ATTR_NAME) > 0; +} + +void GraphTransferer::RegisterNodeWithPaddingAndStrides( + const ShapeRefiner& shape_refiner, const Node& node) { + CHECK(node_name_to_id_cache_map_.count(node.name()) == 1); + const int id = node_name_to_id_cache_map_[node.name()]; + shape_inference::InferenceContext* context = shape_refiner.GetContext(&node); + CHECK(node.def().attr().count(PADDING_ATTR_NAME) > 0); + // TODO(satok): Use context->GetAttr(...) instead? 
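+  // (The GetAttr calls below ignore the returned Status; the CHECKs above and
+  // below verify that the attributes exist before each call.)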
+ Padding padding; + context->GetAttr(PADDING_ATTR_NAME, &padding); + CHECK(node.def().attr().count(STRIDES_ATTR_NAME) > 0); + std::vector strides; + context->GetAttr(STRIDES_ATTR_NAME, &strides); + const int stride_id = RegisterConstantShape(strides); + std::vector extra_inputs{stride_id}; + if (node.def().attr().count(KSIZE_ATTR_NAME) > 0) { + std::vector kernel_sizes; + context->GetAttr(KSIZE_ATTR_NAME, &kernel_sizes); + const int ksize_id = RegisterConstantShape(kernel_sizes); + extra_inputs.push_back(ksize_id); + } + AppendNodeParams(node.name(), id, node.type_string(), padding, + node.num_inputs(), extra_inputs, node.num_outputs()); +} + bool GraphTransferer::RegisterNodeIfAllInputsAreCached( const ShapeRefiner& shape_refiner, const Node& node, const bool only_register_const_node) { @@ -161,14 +219,21 @@ bool GraphTransferer::RegisterNodeIfAllInputsAreCached( void GraphTransferer::AppendNodeParams(const string& name, const int id, const string& type, - const string& padding, + const Padding& padding, const int inputs_size, + const std::vector& extra_inputs, const int outputs_size) { + // TODO(satok): register inputs + // TODO(satok): register outputs + // TODO(satok): store padding as Padding? node_transfer_params_list_.emplace_back(NodeTransferParams{ - name, id, type, padding, - string(INPUTS_NODE_PREFIX) + std::to_string(inputs_size), inputs_size, - string(OUTPUTS_NODE_PREFIX) + std::to_string(outputs_size), - outputs_size}); + name, id, type, + string(PADDING_PREFIX) + + string(padding == VALID ? PADDING_VALID_STR : PADDING_SAME_STR), + string(INPUTS_NODE_PREFIX) + std::to_string(id), + inputs_size + static_cast(extra_inputs.size()), + string(OUTPUTS_NODE_PREFIX) + std::to_string(id), + static_cast(outputs_size)}); } /* static */ std::array @@ -205,6 +270,7 @@ GraphTransferer::BuildShapeArray( void GraphTransferer::DumpNodeTransferParams() const { // TODO(satok): Dump all params + LOG(INFO) << "*** Const Nodes ***"; for (const ConstNodeTransferParams& params : const_node_transfer_params_list_) { LOG(INFO) << "[ " << params.id << " \"" << params.name << "\" (Const)"; @@ -214,6 +280,18 @@ void GraphTransferer::DumpNodeTransferParams() const { LOG(INFO) << " data_size: " << params.data_size << " bytes" << " ]"; } + LOG(INFO) << "******"; + LOG(INFO) << "*** Op Nodes ***"; + for (const NodeTransferParams& params : node_transfer_params_list_) { + LOG(INFO) << "[ " << params.id << " \"" << params.name; + LOG(INFO) << " type: " << params.type; + LOG(INFO) << " padding: " << params.padding; + LOG(INFO) << " inputs: " << params.inputs_name + << ", size = " << params.inputs_size; + LOG(INFO) << " outputs: " << params.outputs_name + << ", size = " << params.outputs_size << " ]"; + } + LOG(INFO) << "******"; } } // namespace tensorflow diff --git a/tensorflow/core/kernels/hexagon/graph_transferer.h b/tensorflow/core/kernels/hexagon/graph_transferer.h index 3e3ee3d49ba..99e1952f607 100644 --- a/tensorflow/core/kernels/hexagon/graph_transferer.h +++ b/tensorflow/core/kernels/hexagon/graph_transferer.h @@ -25,6 +25,7 @@ limitations under the License. 
#include "tensorflow/core/graph/graph.h" #include "tensorflow/core/platform/macros.h" #include "tensorflow/core/platform/protobuf.h" +#include "tensorflow/core/util/padding.h" namespace tensorflow { @@ -67,17 +68,25 @@ class GraphTransferer { // Return const node parameters for transfer const std::vector& GetConstNodeParams() const; + // Return op node parameters for transfer + const std::vector& GetOpNodeParams() const; + private: int CacheNode(const Node& node); bool AreAllInputsCached(const Node& node) const; void RegisterConstantNode(const ShapeRefiner& shape_refiner, const Node& node); + int RegisterConstantShape(const std::vector& shape); + bool HasPaddingAndStrides(const Node& node); + void RegisterNodeWithPaddingAndStrides(const ShapeRefiner& shape_refiner, + const Node& node); void RegisterNode(const ShapeRefiner& shape_refiner, const Node& node); bool RegisterNodeIfAllInputsAreCached(const ShapeRefiner& shape_refiner, const Node& node, const bool only_register_const_node); void AppendNodeParams(const string& name, const int id, const string& type, - const string& padding, const int inputs_size, + const Padding& padding, const int inputs_size, + const std::vector& extra_inputs, const int outputs_size); static std::array BuildShapeArray( const shape_inference::ShapeHandle& shape_handle, diff --git a/tensorflow/core/kernels/hexagon/graph_transferer_test.cc b/tensorflow/core/kernels/hexagon/graph_transferer_test.cc index 4c386f4a623..99771f56282 100644 --- a/tensorflow/core/kernels/hexagon/graph_transferer_test.cc +++ b/tensorflow/core/kernels/hexagon/graph_transferer_test.cc @@ -16,7 +16,9 @@ limitations under the License. #include #include "tensorflow/cc/ops/const_op.h" +#include "tensorflow/cc/ops/nn_ops.h" #include "tensorflow/cc/ops/standard_ops.h" +#include "tensorflow/core/framework/tensor_testutil.h" #include "tensorflow/core/graph/graph_def_builder.h" #include "tensorflow/core/kernels/hexagon/graph_transferer.h" #include "tensorflow/core/lib/core/status.h" @@ -40,12 +42,49 @@ class GraphTransfererTest : public ::testing::Test { std::unique_ptr _session; }; -static GraphDef CreateSmallGraphDef() { +static GraphDef CreateAddGraphDef() { Scope root = Scope::NewRootScope(); ops::Output node_a = ops::Const(root.WithOpName(NAME_A), 1); ops::Output node_b = ops::Const(root.WithOpName(NAME_B), 2); - ops::Add(root.WithOpName("a_plus_b"), node_a, node_b); + ops::Output node_add = ops::Add(root.WithOpName("a_plus_b"), node_a, node_b); + GraphDef def; + TF_CHECK_OK(root.ToGraphDef(&def)); + return def; +} +static GraphDef CreateConvGraphDef() { + Scope root = Scope::NewRootScope(); + Tensor input_data(DT_FLOAT, TensorShape({1, 1, 1, 1})); + test::FillIota(&input_data, 1.0f); + ops::Output input = + ops::Const(root.WithOpName("input"), ops::Input::Initializer(input_data)); + Tensor filter_data(DT_FLOAT, TensorShape({1, 1, 1, 1})); + test::FillIota(&filter_data, 1.0f); + ops::Output filter = ops::Const(root.WithOpName("filter"), + ops::Input::Initializer(filter_data)); + const std::vector strides{1, 1, 1, 1}; + ops::Output conv = + ops::Conv2D(root.WithOpName("conv"), input, filter, strides, "SAME"); + GraphDef def; + TF_CHECK_OK(root.ToGraphDef(&def)); + return def; +} + +static GraphDef CreatePoolGraphDef() { + Scope root = Scope::NewRootScope(); + Tensor input_data(DT_FLOAT, TensorShape({1, 1, 1, 1})); + test::FillIota(&input_data, 1.0f); + ops::Output input = + ops::Const(root.WithOpName("input"), ops::Input::Initializer(input_data)); + Tensor filter_data(DT_FLOAT, TensorShape({1, 1, 
1, 1})); + test::FillIota(&filter_data, 1.0f); + ops::Output filter = ops::Const(root.WithOpName("filter"), + ops::Input::Initializer(filter_data)); + const std::vector ksize{1, 1, 1, 1}; + const std::vector padding{0, 0, 0, 0}; + const std::vector strides{1, 1, 1, 1}; + ops::Output max_pool = + ops::MaxPool(root.WithOpName("maxpool"), input, ksize, strides, "SAME"); GraphDef def; TF_CHECK_OK(root.ToGraphDef(&def)); return def; @@ -62,17 +101,29 @@ static const GraphTransferer::ConstNodeTransferParams* FindConstNodeParams( return nullptr; } -TEST_F(GraphTransfererTest, LoadGraph) { - GraphDef def = CreateSmallGraphDef(); +static const GraphTransferer::NodeTransferParams* FindOpNodeParams( + const GraphTransferer& gt, const string& name) { + for (const GraphTransferer::NodeTransferParams& params : + gt.GetOpNodeParams()) { + if (params.name == name) { + return ¶ms; + } + } + return nullptr; +} + +TEST_F(GraphTransfererTest, LoadAddGraph) { + GraphDef def = CreateAddGraphDef(); _session->Create(def); GraphTransferer gt; gt.LoadGraphFromProto(def); - ASSERT_EQ(2, gt.GetConstNodeParams().size()); + const int const_node_count = gt.GetConstNodeParams().size(); + ASSERT_EQ(2, const_node_count); const GraphTransferer::ConstNodeTransferParams* params_a = FindConstNodeParams(gt, NAME_A); ASSERT_TRUE(params_a != nullptr); - EXPECT_TRUE(params_a->id > 0 && params_a->id <= 2); + EXPECT_TRUE(params_a->id > 0 && params_a->id <= const_node_count); EXPECT_EQ(NAME_A, params_a->name); EXPECT_EQ(1, params_a->shape[0]); EXPECT_EQ(1, params_a->shape[1]); @@ -83,7 +134,7 @@ TEST_F(GraphTransfererTest, LoadGraph) { const GraphTransferer::ConstNodeTransferParams* params_b = FindConstNodeParams(gt, NAME_B); ASSERT_TRUE(params_b != nullptr); - EXPECT_TRUE(params_b->id > 0 && params_b->id <= 2); + EXPECT_TRUE(params_b->id > 0 && params_b->id <= const_node_count); EXPECT_EQ(1, params_b->shape[0]); EXPECT_EQ(1, params_b->shape[1]); EXPECT_EQ(1, params_b->shape[2]); @@ -91,4 +142,45 @@ TEST_F(GraphTransfererTest, LoadGraph) { EXPECT_EQ(10, params_b->data_size); } +TEST_F(GraphTransfererTest, LoadConvGraph) { + GraphDef def = CreateConvGraphDef(); + _session->Create(def); + + GraphTransferer gt; + gt.LoadGraphFromProto(def); + const int const_node_count = gt.GetConstNodeParams().size(); + ASSERT_EQ(3, const_node_count); + const int op_node_count = gt.GetOpNodeParams().size(); + ASSERT_EQ(1, op_node_count); + const GraphTransferer::NodeTransferParams* params_conv = + FindOpNodeParams(gt, "conv"); + ASSERT_TRUE(params_conv != nullptr); + const int id = params_conv->id; + EXPECT_TRUE(id > 0 && id <= (const_node_count + op_node_count)); + EXPECT_EQ("Conv2D", params_conv->type); + EXPECT_EQ(3, params_conv->inputs_size); + EXPECT_EQ(1, params_conv->outputs_size); + EXPECT_EQ("NN_PAD_SAME", params_conv->padding); +} + +TEST_F(GraphTransfererTest, LoadMaxPoolGraph) { + GraphDef def = CreatePoolGraphDef(); + _session->Create(def); + + GraphTransferer gt; + gt.LoadGraphFromProto(def); + const int const_node_count = gt.GetConstNodeParams().size(); + ASSERT_EQ(3, const_node_count); + const int op_node_count = gt.GetOpNodeParams().size(); + ASSERT_EQ(1, op_node_count); + const GraphTransferer::NodeTransferParams* params_max_pool = + FindOpNodeParams(gt, "maxpool"); + ASSERT_TRUE(params_max_pool != nullptr); + const int id = params_max_pool->id; + EXPECT_TRUE(id > 0 && id <= (const_node_count + op_node_count)); + EXPECT_EQ("MaxPool", params_max_pool->type); + EXPECT_EQ(3, params_max_pool->inputs_size); + EXPECT_EQ(1, 
params_max_pool->outputs_size); + EXPECT_EQ("NN_PAD_SAME", params_max_pool->padding); +} } // namespace tensorflow diff --git a/tensorflow/core/kernels/immutable_constant_op_test.cc b/tensorflow/core/kernels/immutable_constant_op_test.cc index 93d726a64d4..d822e316ead 100644 --- a/tensorflow/core/kernels/immutable_constant_op_test.cc +++ b/tensorflow/core/kernels/immutable_constant_op_test.cc @@ -64,7 +64,7 @@ class TestFileSystem : public NullFileSystem { std::unique_ptr* result) override { float val = 0; StringPiece scheme, host, path; - ParseURI(fname, &scheme, &host, &path); + io::ParseURI(fname, &scheme, &host, &path); // For the tests create in-memory regions with float values equal to the // region name. if (path == "/2") { diff --git a/tensorflow/core/kernels/parameterized_truncated_normal_op.cc b/tensorflow/core/kernels/parameterized_truncated_normal_op.cc index 4d31edbb1a9..77c4b7a7299 100644 --- a/tensorflow/core/kernels/parameterized_truncated_normal_op.cc +++ b/tensorflow/core/kernels/parameterized_truncated_normal_op.cc @@ -46,25 +46,6 @@ namespace functor { using random::PhiloxRandom; using random::SingleSampleAdapter; -// Sample a truncated normal random variable, with mean, stddev, minval, and -// maxval parameters for each batch. Uses two rejection sampling algorithms -// described in http://rd.springer.com/article/10.1007/BF00143942. -// -// Either minval may be -infinity, or maxval may be +infinity. If the interval -// (minval, maxval) is empty, the result is NaN. Large intervals which include -// both tails may have reduced accuracy. -template -struct TruncatedNormalFunctor { - void operator()(OpKernelContext* ctx, const Device& d, int64 num_batches, - int64 samples_per_batch, int64 num_elements, - typename TTypes::ConstFlat means, - typename TTypes::ConstFlat stddevs, - typename TTypes::ConstFlat minvals, - typename TTypes::ConstFlat maxvals, - const random::PhiloxRandom& gen, - typename TTypes::Flat output); -}; - template struct TruncatedNormalFunctor { static const int kMaxIterations = 100; @@ -96,8 +77,8 @@ struct TruncatedNormalFunctor { // Vectorized intermediate calculations for uniform rejection sampling. // We always generate at most 4 samples. - tensorflow::random::Array z; - tensorflow::random::Array g; + Eigen::array z; + Eigen::array g; for (int64 b = start_batch; b < limit_batch; ++b) { // We are passed a flat array for each of the parameter tensors. @@ -145,13 +126,7 @@ struct TruncatedNormalFunctor { if (diff < cutoff) { // Sample from a uniform distribution on [normMin, normMax]. - T plusFactor; - if (normMin < T(0)) { - // normMax > 0 because it is flipped otherwise. - plusFactor = T(0); - } else { - plusFactor = normMin * normMin; - } + const T plusFactor = (normMin < T(0)) ? 
T(0) : normMin * normMin; while (sample < limit_sample) { const auto rand = dist(&gen_copy); @@ -395,4 +370,21 @@ TF_CALL_double(REGISTER); #undef REGISTER +#if GOOGLE_CUDA + +#define REGISTER(TYPE) \ + REGISTER_KERNEL_BUILDER(Name("ParameterizedTruncatedNormal") \ + .Device(DEVICE_GPU) \ + .HostMemory("shape") \ + .TypeConstraint("dtype"), \ + ParameterizedTruncatedNormalOp) + +TF_CALL_half(REGISTER); +TF_CALL_float(REGISTER); +TF_CALL_double(REGISTER); + +#undef REGISTER + +#endif // GOOGLE_CUDA + } // end namespace tensorflow diff --git a/tensorflow/core/kernels/parameterized_truncated_normal_op.h b/tensorflow/core/kernels/parameterized_truncated_normal_op.h index a46bb1c9fa6..cc801eb8109 100644 --- a/tensorflow/core/kernels/parameterized_truncated_normal_op.h +++ b/tensorflow/core/kernels/parameterized_truncated_normal_op.h @@ -16,14 +16,35 @@ limitations under the License. #ifndef TENSORFLOW_KERNELS_PARAMETERIZED_TRUNCATED_NORMAL_OP_H_ #define TENSORFLOW_KERNELS_PARAMETERIZED_TRUNCATED_NORMAL_OP_H_ +#include "tensorflow/core/framework/tensor_types.h" +#include "tensorflow/core/lib/random/random_distributions.h" + namespace tensorflow { class OpKernelContext; namespace functor { +// Sample a truncated normal random variable, with mean, stddev, minval, and +// maxval parameters for each batch. Uses two rejection sampling algorithms +// described in http://rd.springer.com/article/10.1007/BF00143942. +// +// Either minval may be -infinity, or maxval may be +infinity. If the interval +// (minval, maxval) is empty, the result is NaN. Large intervals which include +// both tails may have reduced accuracy. template -struct TruncatedNormalFunctor; +struct TruncatedNormalFunctor { + void operator()(OpKernelContext* ctx, const Device& d, int64 num_batches, + int64 samples_per_batch, int64 num_elements, + typename TTypes::ConstFlat means, + typename TTypes::ConstFlat stddevs, + typename TTypes::ConstFlat minvals, + typename TTypes::ConstFlat maxvals, + const random::PhiloxRandom& gen, + typename TTypes::Flat output); + + static const int kMaxIterations = 100; +}; } // namespace functor } // namespace tensorflow diff --git a/tensorflow/core/kernels/parameterized_truncated_normal_op_gpu.cu.cc b/tensorflow/core/kernels/parameterized_truncated_normal_op_gpu.cu.cc new file mode 100644 index 00000000000..42d47440690 --- /dev/null +++ b/tensorflow/core/kernels/parameterized_truncated_normal_op_gpu.cu.cc @@ -0,0 +1,214 @@ +/* Copyright 2015 The TensorFlow Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. 
+==============================================================================*/ + +#if GOOGLE_CUDA + +#define EIGEN_USE_GPU + +#include "tensorflow/core/kernels/parameterized_truncated_normal_op.h" + +#include +#include +#include + +#include "third_party/eigen3/unsupported/Eigen/CXX11/Tensor" +#include "tensorflow/core/framework/tensor_types.h" +#include "tensorflow/core/lib/random/philox_random.h" +#include "tensorflow/core/lib/random/random_distributions.h" +#include "tensorflow/core/util/cuda_kernel_helper.h" + +#define UNROLL _Pragma("unroll") + +namespace tensorflow { + +class OpKernelContext; + +namespace functor { + +typedef Eigen::GpuDevice GPUDevice; + +template +__global__ void __launch_bounds__(1024) + TruncatedNormalKernel(random::PhiloxRandom gen, T* data, int64 num_batches, + int64 samples_per_batch, int64 num_elements, + const T* means, bool single_mean, const T* stddevs, + bool single_stddev, const T* minvals, + bool single_minval, const T* maxvals, + bool single_maxval, int64 kMaxIterations) { + const int32 max_samples_per_item = 2 * kMaxIterations; + // Initial offset as given by CUDA_1D_KERNEL_LOOP. + const int32 initial_offset = blockIdx.x * blockDim.x + threadIdx.x; + gen.Skip(max_samples_per_item * initial_offset); + typedef random::UniformDistribution Uniform; + Uniform dist; + const int kDistSize = Uniform::kResultElementCount; + const T quietNaN = Eigen::NumTraits::quiet_NaN(); + + // We skip the total number of threads to get to the next element. To produce + // deterministic results between devices, each element in the output array + // skips max_samples_per_item in the generator. Then after generating this + // item, we need to skip the samples for one element for every thread to get + // to the next element that we actually process. + const int32 samples_between_processed_elements = + max_samples_per_item * (gridDim.x * blockDim.x); + + CUDA_1D_KERNEL_LOOP(offset, num_elements) { + // Track how many more samples we need to skip before we process the next + // element. + int32 remaining_samples = samples_between_processed_elements; + + const int64 batch_id = offset / samples_per_batch; + T mean = means[single_mean ? 0 : batch_id]; + const T input_stddev = stddevs[single_stddev ? 0 : batch_id]; + T minval = minvals[single_minval ? 0 : batch_id]; + T maxval = maxvals[single_maxval ? 0 : batch_id]; + + // Flip the distribution if we can make the lower bound positive. + T stddev; + if (Eigen::numext::isinf(minval) || maxval < mean) { + // Reverse all calculations. normMin and normMax will be flipped. + // std::swap is a host function (not available in CUDA). + T temp = minval; + minval = maxval; + maxval = temp; + stddev = -input_stddev; + } else { + stddev = input_stddev; + } + + // Calculate normalized samples, then scale them. + const T normMin = (minval - mean) / stddev; + const T normMax = (maxval - mean) / stddev; + + // Determine the method to use. + const T sqrtFactor = Eigen::numext::sqrt((normMin * normMin) + T(4)); + const T cutoff = + T(2) * + Eigen::numext::exp(T(0.5) + (normMin * (normMin - sqrtFactor)) / T(4)) / + (normMin + sqrtFactor); + const T diff = normMax - normMin; + + // Validate the normalized min and max, because the originals may have been + // flipped already. + if (!(input_stddev > T(0) && normMin < normMax && + (Eigen::numext::isfinite(normMin) || + Eigen::numext::isfinite(normMax)))) { + data[offset] = quietNaN; + } else if (diff < cutoff) { + // Sample from a uniform distribution on [normMin, normMax]. 
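+      // (Sketch of the acceptance rule implemented below: draw
+      // z ~ Uniform[normMin, normMax] and accept with probability
+      // exp((plusFactor - z*z) / 2); the branch condition diff < cutoff
+      // keeps that probability high for narrow intervals.)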
+
+      // Vectorized intermediate calculations for uniform rejection sampling.
+      // We always generate at most 4 samples.
+      Eigen::array<T, 4> z;
+      Eigen::array<T, 4> g;
+
+      const T plusFactor = (normMin < T(0)) ? T(0) : normMin * normMin;
+
+      int numIterations = 0;
+      while (numIterations < kMaxIterations) {
+        const auto rand = dist(&gen);
+        remaining_samples -= gen.kResultElementCount;
+        UNROLL for (int i = 0; i < kDistSize; i++) {
+          z[i] = rand[i] * diff + normMin;
+        }
+        UNROLL for (int i = 0; i < kDistSize; i++) {
+          g[i] = (plusFactor - z[i] * z[i]) / 2.0;
+        }
+
+        const auto u = dist(&gen);
+        remaining_samples -= gen.kResultElementCount;
+        UNROLL for (int i = 0; i < kDistSize; i++) {
+          if (u[i] <= Eigen::numext::exp(g[i]) ||
+              numIterations + 1 >= kMaxIterations) {
+            // Accept the sample z.
+            // If we run out of iterations, just use the current uniform
+            // sample. Empirically, the probability of accepting each sample
+            // is at least 50% for typical inputs, so we will always accept
+            // by 100 iterations.
+            // This introduces a slight inaccuracy when at least one bound
+            // is large, minval is negative and maxval is positive.
+            data[offset] = z[i] * stddev + mean;
+            // Break out of the nested loop by updating numIterations.
+            numIterations = kMaxIterations;
+            break;
+          } else {
+            numIterations++;
+          }
+        }
+      }
+    } else {
+      // Sample from an exponential distribution with alpha maximizing
+      // acceptance probability, offset by normMin from the origin.
+      // Accept only if less than normMax.
+      const T alpha =
+          (normMin + Eigen::numext::sqrt((normMin * normMin) + T(4))) / T(2);
+      int numIterations = 0;
+      while (numIterations < kMaxIterations) {
+        auto rand = dist(&gen);
+        remaining_samples -= gen.kResultElementCount;
+        UNROLL for (int i = 0; i < kDistSize; i += 2) {
+          const T z = -Eigen::numext::log(rand[i]) / alpha + normMin;
+          const T x = normMin < alpha ? alpha - z : normMin - alpha;
+          const T g = Eigen::numext::exp(-x * x / 2.0);
+          const T u = rand[i + 1];
+          if ((u <= g && z < normMax) || numIterations + 1 >= kMaxIterations) {
+            data[offset] = z * stddev + mean;
+            // Break out of the nested loop by updating numIterations.
+            numIterations = kMaxIterations;
+            break;
+          } else {
+            numIterations++;
+          }
+        }
+      }
+    }
+
+    gen.Skip(remaining_samples);
+  }
+}
+
+// Partial specialization for GPU
+template <typename T>
+struct TruncatedNormalFunctor<GPUDevice, T> {
+  static const int kMaxIterations = 100;
+
+  void operator()(OpKernelContext* ctx, const GPUDevice& d, int64 num_batches,
+                  int64 samples_per_batch, int64 num_elements,
+                  typename TTypes<T>::ConstFlat means,
+                  typename TTypes<T>::ConstFlat stddevs,
+                  typename TTypes<T>::ConstFlat minvals,
+                  typename TTypes<T>::ConstFlat maxvals,
+                  const random::PhiloxRandom& gen,
+                  typename TTypes<T>::Flat output) {
+    const auto config = GetCudaLaunchConfig(num_elements, d);
+
+    TruncatedNormalKernel<
+        T><<<config.block_count, config.thread_per_block, 0, d.stream()>>>(
+        gen, output.data(), num_batches, samples_per_batch, num_elements,
+        means.data(), means.dimension(0) == 1, stddevs.data(),
+        stddevs.dimension(0) == 1, minvals.data(), minvals.dimension(0) == 1,
+        maxvals.data(), maxvals.dimension(0) == 1, kMaxIterations);
+  };
+};
+
+// Explicit instantiation of the GPU distributions functors
+template struct TruncatedNormalFunctor<GPUDevice, Eigen::half>;
+template struct TruncatedNormalFunctor<GPUDevice, float>;
+template struct TruncatedNormalFunctor<GPUDevice, double>;
+
+}  // namespace functor
+}  // namespace tensorflow
+
+#endif  // GOOGLE_CUDA
diff --git a/tensorflow/core/kernels/parameterized_truncated_normal_op_test.cc b/tensorflow/core/kernels/parameterized_truncated_normal_op_test.cc
index 13d1187f926..07f2f75ca5a 100644
--- a/tensorflow/core/kernels/parameterized_truncated_normal_op_test.cc
+++ b/tensorflow/core/kernels/parameterized_truncated_normal_op_test.cc
@@ -131,5 +131,8 @@ static Graph* PTruncatedNormalOneTail(int num_batches, int samples_per_batch) {
 BM_PTruncatedNormalDev(cpu, 1000, 1000);
 BM_PTruncatedNormalDev_2SD(cpu, 10000, 100);
 BM_PTruncatedNormalDev_OneTail(cpu, 10000, 100);
+BM_PTruncatedNormalDev(gpu, 1000, 1000);
+BM_PTruncatedNormalDev_2SD(gpu, 10000, 100);
+BM_PTruncatedNormalDev_OneTail(gpu, 10000, 100);
 
 }  // namespace tensorflow
diff --git a/tensorflow/core/kernels/quantized_reshape_op.cc b/tensorflow/core/kernels/quantized_reshape_op.cc
index d49edd3feb4..bd76c94edee 100644
--- a/tensorflow/core/kernels/quantized_reshape_op.cc
+++ b/tensorflow/core/kernels/quantized_reshape_op.cc
@@ -50,8 +50,8 @@ class QuantizedReshapeOp : public ReshapeOp {
                               .TypeConstraint<type>("T"), \
                           QuantizedReshapeOp<type>)
 
-TF_CALL_quint8(REGISTER_CPU_KERNEL);
-TF_CALL_qint32(REGISTER_CPU_KERNEL);
+REGISTER_CPU_KERNEL(::tensorflow::quint8);
+REGISTER_CPU_KERNEL(::tensorflow::qint32);
 
 #undef REGISTER_CPU_KERNEL
diff --git a/tensorflow/core/kernels/resource_variable_ops.cc b/tensorflow/core/kernels/resource_variable_ops.cc
index fbe66e83860..8809cba41d5 100644
--- a/tensorflow/core/kernels/resource_variable_ops.cc
+++ b/tensorflow/core/kernels/resource_variable_ops.cc
@@ -13,9 +13,12 @@ See the License for the specific language governing permissions and
 limitations under the License.
 ==============================================================================*/
 
+#define EIGEN_USE_THREADS
+
 #include "tensorflow/core/framework/op_kernel.h"
 #include "tensorflow/core/framework/register_types.h"
 #include "tensorflow/core/framework/resource_mgr.h"
+#include "tensorflow/core/framework/tensor_types.h"
 #include "tensorflow/core/kernels/variable_ops.h"
 #include "tensorflow/core/lib/core/errors.h"
 #include "tensorflow/core/platform/mutex.h"
@@ -25,25 +28,160 @@ namespace tensorflow {
 
 REGISTER_RESOURCE_HANDLE_KERNEL(Var);
 
+template <typename Device, typename T>
 class CreateVariableOp : public OpKernel {
  public:
   CreateVariableOp(OpKernelConstruction* c) : OpKernel(c) {
     OP_REQUIRES_OK(c, c->GetAttr("dtype", &dtype_));
+    OP_REQUIRES(c, DataTypeToEnum<T>::value == dtype_,
+                errors::InvalidArgument(
+                    "Dtypes don't match; expected ", DataTypeString(dtype_),
+                    " got ", DataTypeString(DataTypeToEnum<T>::value)));
   }
 
-  void Compute(OpKernelContext* c) override {
+  void Compute(OpKernelContext* context) override {
     Var* var = new Var(dtype_);
-    var->Ref();
-    core::ScopedUnref ur(var);
-    OP_REQUIRES_OK(c, CreateResource<Var>(c, HandleFromInput(c, 0), var));
-    // TODO(apassos): this currently does not initialize the tensor, so it's
-    // pointless, other than checking construction in tests. Fix this.
+    AllocatorAttributes attr;
+    attr.set_gpu_compatible(true);
+    attr.set_nic_compatible(true);
+    PersistentTensor copy;
+    Tensor value = context->input(1);
+
+    // TODO(apassos): allocating and copying is unnecessary if we are the last
+    // user of the value tensor. This should essentially always be the case, yet
+    // the refcount is usually 2 instead of 1. Figure out what needs to change
+    // in the code to make this not be the case, so we can safely take
+    // ownership.
+    Tensor* tmp_copy = nullptr;
+    OP_REQUIRES_OK(context, context->allocate_persistent(
+                                dtype_, value.shape(), &copy, &tmp_copy, attr));
+    *var->tensor() = *tmp_copy;
+    var->tensor()->flat<T>().device(context->eigen_device<Device>()) =
+        value.flat<T>();
+    OP_REQUIRES_OK(context, CreateResource<Var>(
+                                context, HandleFromInput(context, 0), var));
   }
 
  private:
   DataType dtype_;
 };
-REGISTER_KERNEL_BUILDER(Name("CreateVariableOp").Device(DEVICE_CPU),
-                        CreateVariableOp);
+
+// TODO(apassos) register for the GPU as well.
+#define REGISTER_KERNELS(type)                                \
+  REGISTER_KERNEL_BUILDER(Name("CreateVariableOp")            \
+                              .Device(DEVICE_CPU)             \
+                              .TypeConstraint<type>("dtype"), \
+                          CreateVariableOp<Eigen::ThreadPoolDevice, type>);
+
+TF_CALL_ALL_TYPES(REGISTER_KERNELS);
+TF_CALL_QUANTIZED_TYPES(REGISTER_KERNELS);
+#undef REGISTER_KERNELS
+
+template <typename Device, typename T>
+class ReadVariableOp : public OpKernel {
+ public:
+  ReadVariableOp(OpKernelConstruction* c) : OpKernel(c) {}
+
+  void Compute(OpKernelContext* ctx) {
+    Var* variable = nullptr;
+    OP_REQUIRES_OK(ctx,
+                   LookupResource(ctx, HandleFromInput(ctx, 0), &variable));
+    core::ScopedUnref s(variable);
+    // TODO(apassos): It's possible to do copy-on-write here instead of always
+    // copying by coordinating with the writing code. Do this. This will also
+    // obviate the need to hold a lock here.
+    mutex_lock ml(*variable->mu());
+    Tensor* out = nullptr;
+    OP_REQUIRES_OK(ctx,
+                   ctx->allocate_output(0, variable->tensor()->shape(), &out));
+    out->flat<T>().device(ctx->eigen_device<Device>()) =
+        variable->tensor()->flat<T>();
+  }
+};
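Aside: `LookupResource` hands back an owned reference, and the `core::ScopedUnref` right after it is what guarantees the matching `Unref` on every exit path, including early `OP_REQUIRES` returns. A toy, self-contained version of that discipline — stand-in types, not the TF classes (whose counter is atomic):

```
// Minimal stand-ins for tensorflow::core::RefCounted / ScopedUnref.
class RefCounted {
 public:
  void Ref() { ++count_; }
  void Unref() {
    if (--count_ == 0) delete this;
  }
 protected:
  virtual ~RefCounted() {}
 private:
  int count_ = 1;  // the creator owns one reference
};

class ScopedUnref {
 public:
  explicit ScopedUnref(RefCounted* r) : r_(r) {}
  ~ScopedUnref() {
    if (r_) r_->Unref();  // runs on every exit path of the enclosing scope
  }
 private:
  RefCounted* r_;
};

struct ToyVar : RefCounted {
  int value = 0;
};

int main() {
  ToyVar* v = new ToyVar;  // refcount 1, as after a successful lookup
  {
    ScopedUnref s(v);
    v->value = 42;
  }  // v is released (and deleted) here, even on early return
  return 0;
}
```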
+
+// TODO(apassos) register for the GPU as well.
+#define REGISTER_KERNELS(type)                                                 \
+  REGISTER_KERNEL_BUILDER(                                                     \
+      Name("ReadVariableOp").Device(DEVICE_CPU).TypeConstraint<type>("dtype"), \
+      ReadVariableOp<Eigen::ThreadPoolDevice, type>);
+
+TF_CALL_ALL_TYPES(REGISTER_KERNELS);
+TF_CALL_QUANTIZED_TYPES(REGISTER_KERNELS);
+#undef REGISTER_KERNELS
+
+template <typename Device, typename T>
+class AssignVariableOp : public OpKernel {
+ public:
+  AssignVariableOp(OpKernelConstruction* c) : OpKernel(c) {}
+
+  void Compute(OpKernelContext* context) override {
+    Var* variable = nullptr;
+    OP_REQUIRES_OK(context, LookupResource(context, HandleFromInput(context, 0),
+                                           &variable));
+    core::ScopedUnref s(variable);
+
+    // TODO(apassos): holding a lock and copying is unnecessary if we are the
+    // last user of the value tensor. This should essentially always be the
+    // case, yet the refcount is usually 2 instead of 1. Figure out what needs
+    // to change in the code to make this not be the case, so we can safely take
+    // ownership.
+    mutex_lock ml(*variable->mu());
+    Tensor value = context->input(1);
+    variable->tensor()->flat<T>().device(context->eigen_device<Device>()) =
+        value.flat<T>();
+  }
+};
+
+// TODO(apassos) register for the GPU as well.
+#define REGISTER_KERNELS(type)                                \
+  REGISTER_KERNEL_BUILDER(Name("AssignVariableOp")            \
+                              .Device(DEVICE_CPU)             \
+                              .TypeConstraint<type>("dtype"), \
+                          AssignVariableOp<Eigen::ThreadPoolDevice, type>);
+
+TF_CALL_ALL_TYPES(REGISTER_KERNELS);
+TF_CALL_QUANTIZED_TYPES(REGISTER_KERNELS);
+#undef REGISTER_KERNELS
+
+template <typename Device, typename T>
+class AssignAddVariableOp : public OpKernel {
+ public:
+  AssignAddVariableOp(OpKernelConstruction* c) : OpKernel(c) {}
+
+  void Compute(OpKernelContext* context) override {
+    Var* variable = nullptr;
+    OP_REQUIRES_OK(context, LookupResource(context, HandleFromInput(context, 0),
+                                           &variable));
+    core::ScopedUnref s(variable);
+
+    // TODO(apassos): holding a lock and copying is unnecessary if we are the
+    // last user of the value tensor. This should essentially always be the
+    // case, yet the refcount is usually 2 instead of 1. Figure out what needs
+    // to change in the code to make this not be the case, so we can safely take
+    // ownership.
+    mutex_lock ml(*variable->mu());
+    Tensor value = context->input(1);
+    variable->tensor()->flat<T>().device(context->eigen_device<Device>()) +=
+        value.flat<T>();
+
+    // TODO(apassos): this read can also be implemented efficiently so it is
+    // free if no one uses the resulting tensor.
+    Tensor* out = nullptr;
+    OP_REQUIRES_OK(context, context->allocate_output(
+                                0, variable->tensor()->shape(), &out));
+    out->flat<T>().device(context->eigen_device<Device>()) =
+        variable->tensor()->flat<T>();
+  }
+};
+
+// TODO(apassos) register for the GPU as well.
+#define REGISTER_KERNELS(type)                                \
+  REGISTER_KERNEL_BUILDER(Name("AssignAddVariableOp")         \
+                              .Device(DEVICE_CPU)             \
+                              .TypeConstraint<type>("dtype"), \
+                          AssignAddVariableOp<Eigen::ThreadPoolDevice, type>);
+
+TF_CALL_NUMBER_TYPES(REGISTER_KERNELS);
+#undef REGISTER_KERNELS
 
 }  // namespace tensorflow
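Aside: `AssignAddVariableOp` holds the variable's mutex across both the `+=` and the read-back into the output, so no concurrent writer can interleave between them. A minimal standalone model of that invariant (hypothetical `ToyVariable`, not a TF type):

```
#include <mutex>
#include <vector>

// Toy model of the assign-add kernel: the lock must cover the update *and*
// the snapshot that is returned, or a concurrent writer could slip between.
class ToyVariable {
 public:
  explicit ToyVariable(size_t n) : data_(n, 0.0f) {}

  std::vector<float> AssignAdd(const std::vector<float>& value) {
    std::lock_guard<std::mutex> lock(mu_);
    for (size_t i = 0; i < data_.size(); ++i) data_[i] += value[i];
    return data_;  // copy taken while still holding the lock
  }

 private:
  std::mutex mu_;
  std::vector<float> data_;
};

int main() {
  ToyVariable v(3);
  const std::vector<float> out = v.AssignAdd({1.0f, 2.0f, 3.0f});
  return out[2] == 3.0f ? 0 : 1;
}
```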
diff --git a/tensorflow/core/kernels/scatter_nd_op.cc b/tensorflow/core/kernels/scatter_nd_op.cc
new file mode 100644
index 00000000000..83b38d73381
--- /dev/null
+++ b/tensorflow/core/kernels/scatter_nd_op.cc
@@ -0,0 +1,402 @@
+/* Copyright 2015 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+// See docs in ../ops/state_ops.cc.
+#define EIGEN_USE_THREADS
+
+#include "tensorflow/core/kernels/scatter_nd_op.h"
+#include "tensorflow/core/framework/op_kernel.h"
+#include "tensorflow/core/framework/register_types.h"
+#include "tensorflow/core/framework/tensor.h"
+#include "tensorflow/core/framework/tensor_shape.h"
+#include "tensorflow/core/kernels/bounds_check.h"
+#include "tensorflow/core/kernels/fill_functor.h"
+#include "tensorflow/core/platform/mutex.h"
+#include "tensorflow/core/platform/types.h"
+#include "tensorflow/core/util/util.h"
+
+namespace tensorflow {
+
+typedef Eigen::ThreadPoolDevice CPUDevice;
+typedef Eigen::GpuDevice GPUDevice;
+
+// Check whether updates.shape = indices.shape[0] + params.shape[IXDIM:]
+static bool ValidUpdateShape(const TensorShape& params_shape,
+                             const Tensor& indices, const Tensor& updates) {
+  int64 indices_nd = 1;
+  if (indices.dims() > 1) {
+    indices_nd = indices.dim_size(1);
+  }
+  for (int d = indices_nd; d < params_shape.dims(); d++) {
+    if (updates.dim_size(d - indices_nd + 1) != params_shape.dim_size(d)) {
+      return false;
+    }
+  }
+  return true;
+}
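Aside: the shape contract being validated here is `updates.shape == indices.shape[:-1] + params_shape[K:]` with `K = indices.shape[-1]`. A tiny standalone helper that computes the expected shape under that assumption:

```
#include <vector>

// Expected updates shape for scatter_nd-style ops, assuming indices has
// shape [d_0, ..., d_{Q-2}, K]: keep the batch dims of indices, then append
// params_shape[K:].
std::vector<int> ExpectedUpdatesShape(const std::vector<int>& params_shape,
                                      const std::vector<int>& indices_shape) {
  const int k = indices_shape.back();
  std::vector<int> expected(indices_shape.begin(), indices_shape.end() - 1);
  expected.insert(expected.end(), params_shape.begin() + k,
                  params_shape.end());
  return expected;
}

int main() {
  // e.g. params_shape {4,4,4}, indices shape {2,1} (K = 1) -> updates {2,4,4},
  // matching the slice-insertion example in the ScatterNd docstring below.
  const std::vector<int> e = ExpectedUpdatesShape({4, 4, 4}, {2, 1});
  return (e == std::vector<int>{2, 4, 4}) ? 0 : 1;
}
```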
+
+template <typename Index>
+static void PrepareAndValidateInputs(OpKernelContext* c,
+                                     const TensorShape& params_shape,
+                                     const Tensor& indices,
+                                     const Tensor& updates, int64* indices_nd,
+                                     Index* num_updates, Index* slice_size) {
+  const TensorShape& indices_shape(indices.shape());
+  const TensorShape& updates_shape(updates.shape());
+
+  OP_REQUIRES(
+      c, TensorShapeUtils::IsVectorOrHigher(params_shape),
+      errors::InvalidArgument("Output must be at least 1-D, ", "got shape: ",
+                              params_shape.DebugString()));
+
+  OP_REQUIRES(c, params_shape.num_elements() >= 0 ||
+                     (indices.NumElements() == 0 && updates.NumElements() == 0),
+              errors::InvalidArgument(
+                  "Indices and updates specified for empty output", " shape"));
+
+  OP_REQUIRES(c, updates.dim_size(0) == indices.dim_size(0),
+              errors::InvalidArgument(
+                  "The outermost dimension of updates and indices ",
+                  "must match. Got indices.shape ", indices_shape.DebugString(),
+                  ", updates.shape ", updates_shape.DebugString()));
+  OP_REQUIRES(
+      c, ValidUpdateShape(params_shape, indices, updates),
+      errors::InvalidArgument(
+          "Must have updates.shape = indices.shape[0] + params_shape[IXDIM:], ",
+          "got updates.shape ", updates_shape.DebugString(), ", indices.shape ",
+          indices_shape.DebugString(), ", params_shape ",
+          params_shape.DebugString()));
+  // Check that we have enough index space
+  const int64 N_big = indices.NumElements();
+  OP_REQUIRES(c, N_big <= std::numeric_limits<Index>::max(),
+              errors::InvalidArgument(
+                  "indices has too many elements for ",
+                  DataTypeString(DataTypeToEnum<Index>::v()), " indexing: ",
+                  N_big, " > ", std::numeric_limits<Index>::max()));
+  OP_REQUIRES(
+      c, params_shape.dim_size(0) <= std::numeric_limits<Index>::max(),
+      errors::InvalidArgument("params_shape[0] too large for ",
+                              DataTypeString(DataTypeToEnum<Index>::v()),
+                              " indexing: ", params_shape.dim_size(0), " > ",
+                              std::numeric_limits<Index>::max()));
+
+  // Calculate the number of dimensions in indices
+  *indices_nd = 1;
+  if (indices_shape.dims() > 1) {
+    *indices_nd = indices_shape.dim_size(indices_shape.dims() - 1);
+  }
+
+  // Calculate the number of elements that make up each slice of our updated
+  // tensor. This allows us to work with flattened tensors and copy over whole
+  // slices at a time.
+  Index total_nd = params_shape.dims();
+
+  int64 slice_size_big = 1;
+  for (int64 i = *indices_nd; i < total_nd; ++i) {
+    slice_size_big *= params_shape.dim_size(i);
+  }
+
+  OP_REQUIRES(c, slice_size_big <= std::numeric_limits<Index>::max(),
+              errors::InvalidArgument("slice size is too large for indexing: ",
+                                      slice_size_big, " > ",
+                                      std::numeric_limits<Index>::max()));
+
+  *slice_size = static_cast<Index>(slice_size_big);
+
+  const int64 safe_indices_nd = (*indices_nd < 1) ? 1 : *indices_nd;
+  *num_updates = indices_shape.num_elements() / safe_indices_nd;
+}
+
+template <typename Device, typename T, typename Index>
+class ScatterNdOp : public OpKernel {
+ public:
+  explicit ScatterNdOp(OpKernelConstruction* c) : OpKernel(c) {
+    const DataType dt = DataTypeToEnum<T>::v();
+    const DataType index_t = DataTypeToEnum<Index>::v();
+    OP_REQUIRES_OK(c, c->MatchSignature({index_t, dt, index_t}, {dt}));
+  }
+
+  void Compute(OpKernelContext* c) override {
+    const Tensor& indices = c->input(0);
+    const Tensor& updates = c->input(1);
+    const Tensor& shape_input = c->input(2);
+
+    OP_REQUIRES(c, shape_input.dims() == 1,
+                errors::InvalidArgument("Shape must be a vector"));
+    auto vec = shape_input.flat<Index>();
+    TensorShape shape;
+    TensorShapeUtils::MakeShape(vec.data(), vec.size(), &shape);
+
+    int64 indices_nd;
+    Index num_updates;
+    Index slice_size;
+    PrepareAndValidateInputs<Index>(c, shape, indices, updates, &indices_nd,
+                                    &num_updates, &slice_size);
+    if (!c->status().ok()) return;
+
+    Tensor scratch;
+    OP_REQUIRES_OK(c, c->allocate_temp(DT_INT32, TensorShape(), &scratch));
+
+    auto scratch_scalar = scratch.scalar<int32>();
+    auto indices_flat = indices.flat_inner_dims<Index>();
+    auto updates_flat = updates.shaped<T, 2>({num_updates, slice_size});
+
+    Index bad_i = -1;
+    switch (indices_nd) {
+#define PARAMS_CASE(IXDIM)                                                   \
+  case IXDIM: {                                                              \
+    Tensor* out = nullptr;                                                   \
+    OP_REQUIRES_OK(c, c->allocate_output(0, shape, &out));                   \
+    functor::SetZeroFunctor<Device, T> fill;                                 \
+    fill(c->eigen_device<Device>(), out->flat<T>());                         \
+    if (shape.num_elements() > 0) {                                          \
+      auto output_flat = out->flat_outer_dims<T, IXDIM + 1>();               \
+      functor::ScatterNdFunctor<Device, T, Index,                            \
+                                scatter_nd_op::UpdateOp::ADD, IXDIM>         \
+          functor;                                                           \
+      bad_i = functor(c->eigen_device<Device>(), slice_size, scratch_scalar, \
+                      output_flat, indices_flat, updates_flat, output_flat); \
+    }                                                                        \
+  } break
+      PARAMS_CASE(0);
+      PARAMS_CASE(1);
+      PARAMS_CASE(2);
+      PARAMS_CASE(3);
+      PARAMS_CASE(4);
+      PARAMS_CASE(5);
+#undef PARAMS_CASE
+      default:
+        OP_REQUIRES(c, false,
+                    errors::InvalidArgument(
+                        "Only indices.shape[-1] values between 0 and 5 "
+                        "are currently supported. Requested rank: ",
+                        indices_nd));
+    }
+    OP_REQUIRES(
+        c, bad_i < 0,
+        errors::InvalidArgument(
+            "Invalid indices: ", SliceDebugString(indices.shape(), bad_i),
+            " = [", str_util::Join(gtl::ArraySlice<Index>(
+                        &indices_flat(bad_i, 0), indices_nd),
+                    ", "),
+            "] does not index into ", shape.DebugString()));
+  }
+};
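Aside: stripped of the functor and macro machinery, the op's semantics for `IXDIM == 1` reduce to the reference loop below. Duplicate indices are shown accumulating, matching the `UpdateOp::ADD` reconstruction used above (an assumption, since the template arguments were stripped from this diff by extraction):

```
#include <vector>

// Reference semantics for the IXDIM == 1 case: each indices[i] selects a
// slice of `slice_size` contiguous elements in a zero-initialized output.
std::vector<float> ScatterNdRef(const std::vector<int>& indices,
                                const std::vector<float>& updates,
                                int num_slices, int slice_size) {
  std::vector<float> out(num_slices * slice_size, 0.0f);
  for (size_t i = 0; i < indices.size(); ++i) {
    for (int j = 0; j < slice_size; ++j) {
      out[indices[i] * slice_size + j] += updates[i * slice_size + j];
    }
  }
  return out;
}

int main() {
  // ScatterNdRef({4, 3, 1, 7}, {9, 10, 11, 12}, 8, 1)
  //   -> {0, 11, 0, 10, 9, 0, 0, 12}, the docstring example later in this diff.
  const std::vector<float> out = ScatterNdRef({4, 3, 1, 7}, {9, 10, 11, 12}, 8, 1);
  return (out[1] == 11 && out[7] == 12) ? 0 : 1;
}
```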
+
+template <typename Device, typename T, typename Index,
+          scatter_nd_op::UpdateOp op>
+class ScatterNdUpdateOp : public OpKernel {
+ public:
+  explicit ScatterNdUpdateOp(OpKernelConstruction* c) : OpKernel(c) {
+    const DataType dt = DataTypeToEnum<T>::v();
+    const DataType dt_ref = DataTypeToEnum<T>::ref();
+    const DataType index_t = DataTypeToEnum<Index>::v();
+    OP_REQUIRES_OK(c, c->MatchSignature({dt_ref, index_t, dt}, {dt_ref}));
+    OP_REQUIRES_OK(c, c->GetAttr("use_locking", &use_exclusive_lock_));
+  }
+
+  void Compute(OpKernelContext* c) override {
+    if (use_exclusive_lock_) {
+      // Hold mutex while we apply updates
+      mutex_lock l(*c->input_ref_mutex(0));
+      DoCompute(c);
+    } else {
+      DoCompute(c);
+    }
+  }
+
+ private:
+  bool use_exclusive_lock_;
+
+  void DoCompute(OpKernelContext* c) {
+    Tensor params = c->mutable_input(0, use_exclusive_lock_);
+    const Tensor& indices = c->input(1);
+    const Tensor& updates = c->input(2);
+    const TensorShape& params_shape(params.shape());
+
+    int64 indices_nd;
+    Index num_updates;
+    Index slice_size;
+
+    OP_REQUIRES(c, params.IsInitialized(),
+                errors::FailedPrecondition("Null ref for params"));
+    PrepareAndValidateInputs<Index>(c, params_shape, indices, updates,
+                                    &indices_nd, &num_updates, &slice_size);
+    if (!c->status().ok()) return;
+
+    Tensor scratch;
+    OP_REQUIRES_OK(c, c->allocate_temp(DT_INT32, TensorShape(), &scratch));
+
+    auto scratch_scalar = scratch.scalar<int32>();
+    auto indices_flat = indices.flat_inner_dims<Index>();
+    auto updates_flat = updates.shaped<T, 2>({num_updates, slice_size});
+
+    Index bad_i = -1;
+    c->forward_ref_input_to_ref_output(0, 0);
+    switch (indices_nd) {
+#define PARAMS_CASE(IXDIM)                                                   \
+  case IXDIM: {                                                              \
+    auto params_flat = params.flat_outer_dims<T, IXDIM + 1>();               \
+    functor::ScatterNdFunctor<Device, T, Index, op, IXDIM> functor;          \
+    bad_i = functor(c->eigen_device<Device>(), slice_size, scratch_scalar,   \
+                    params_flat, indices_flat, updates_flat, params_flat);   \
+  } break
+      PARAMS_CASE(0);
+      PARAMS_CASE(1);
+      PARAMS_CASE(2);
+      PARAMS_CASE(3);
+      PARAMS_CASE(4);
+      PARAMS_CASE(5);
+#undef PARAMS_CASE
+      default:
+        OP_REQUIRES(c, false,
+                    errors::InvalidArgument(
+                        "Only indices.shape[-1] values between 1 and 5 "
+                        "are currently supported. Requested rank: ",
+                        indices_nd));
+    }
+    OP_REQUIRES(
+        c, bad_i < 0,
+        errors::InvalidArgument(
+            "Invalid indices: ", SliceDebugString(indices.shape(), bad_i),
+            " = [", str_util::Join(gtl::ArraySlice<Index>(
+                        &indices_flat(bad_i, 0), indices_nd),
+                    ", "),
+            "] is not in [0, ", params.dim_size(0), ")"));
+  }
+};
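Aside: the `use_locking` branch above is a recurring TF kernel pattern — take the ref-input mutex for the whole computation when exclusive access is requested, otherwise run lock-free and accept races between individual updates. Schematically, with toy types:

```
#include <mutex>

// Schematic of the use_locking dispatch (toy context type, not OpKernelContext).
struct Ctx {
  std::mutex* input_ref_mutex;
};

template <typename F>
void ComputeMaybeLocked(Ctx* c, bool use_exclusive_lock, F do_compute) {
  if (use_exclusive_lock) {
    std::lock_guard<std::mutex> l(*c->input_ref_mutex);  // held for all updates
    do_compute(c);
  } else {
    do_compute(c);  // callers accept races between individual updates
  }
}

int main() {
  std::mutex m;
  Ctx c{&m};
  int updates = 0;
  ComputeMaybeLocked(&c, true, [&](Ctx*) { ++updates; });
  return updates == 1 ? 0 : 1;
}
```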
+
+#define REGISTER_SCATTER_ND_KERNEL_INDEX(type, index_type, dev, name)  \
+  REGISTER_KERNEL_BUILDER(Name(name)                                   \
+                              .Device(DEVICE_##dev)                    \
+                              .TypeConstraint<type>("T")               \
+                              .TypeConstraint<index_type>("Tindices"), \
+                          ScatterNdOp<dev##Device, type, index_type>)
+
+#define REGISTER_SCATTER_ND_UPDATE_KERNEL_INDEX(type, index_type, dev, name, \
+                                                op)                          \
+  REGISTER_KERNEL_BUILDER(                                                   \
+      Name(name)                                                             \
+          .Device(DEVICE_##dev)                                              \
+          .TypeConstraint<type>("T")                                         \
+          .TypeConstraint<index_type>("Tindices"),                           \
+      ScatterNdUpdateOp<dev##Device, type, index_type, op>)
+
+#define REGISTER_SCATTER_ND_KERNEL(type, dev, name)         \
+  REGISTER_SCATTER_ND_KERNEL_INDEX(type, int32, dev, name); \
+  REGISTER_SCATTER_ND_KERNEL_INDEX(type, int64, dev, name)
+
+#define REGISTER_SCATTER_ND_UPDATE_KERNEL(type, dev, name, op)         \
+  REGISTER_SCATTER_ND_UPDATE_KERNEL_INDEX(type, int32, dev, name, op); \
+  REGISTER_SCATTER_ND_UPDATE_KERNEL_INDEX(type, int64, dev, name, op)
+
+#define REGISTER_SCATTER_ND_ADD_SUB(type, dev)                     \
+  REGISTER_SCATTER_ND_UPDATE_KERNEL(type, dev, "ScatterNdAdd",     \
+                                    scatter_nd_op::UpdateOp::ADD); \
+  REGISTER_SCATTER_ND_UPDATE_KERNEL(type, dev, "ScatterNdSub",     \
+                                    scatter_nd_op::UpdateOp::SUB); \
+  REGISTER_SCATTER_ND_UPDATE_KERNEL(type, dev, "ScatterNdMul",     \
+                                    scatter_nd_op::UpdateOp::MUL); \
+  REGISTER_SCATTER_ND_UPDATE_KERNEL(type, dev, "ScatterNdDiv",     \
+                                    scatter_nd_op::UpdateOp::DIV);
+
+#define REGISTER_SCATTER_ND(type, dev) \
+  REGISTER_SCATTER_ND_KERNEL(type, dev, "ScatterNd");
+
+#define REGISTER_SCATTER_ND_UPDATE(type, dev)                     \
+  REGISTER_SCATTER_ND_UPDATE_KERNEL(type, dev, "ScatterNdUpdate", \
+                                    scatter_nd_op::UpdateOp::ASSIGN);
+
+// Registers CPU kernels.
+#define REGISTER_SCATTER_ND_ADD_SUB_CPU(type) \
+  REGISTER_SCATTER_ND_ADD_SUB(type, CPU);
+
+#define REGISTER_SCATTER_ND_UPDATE_CPU(type) \
+  REGISTER_SCATTER_ND_UPDATE(type, CPU);
+
+#define REGISTER_SCATTER_ND_CPU(type) REGISTER_SCATTER_ND(type, CPU);
+
+TF_CALL_NUMBER_TYPES(REGISTER_SCATTER_ND_ADD_SUB_CPU);
+TF_CALL_ALL_TYPES(REGISTER_SCATTER_ND_UPDATE_CPU);
+TF_CALL_ALL_TYPES(REGISTER_SCATTER_ND_CPU);
+
+// Registers GPU kernels.
+#if GOOGLE_CUDA
+#define REGISTER_SCATTER_ND_ADD_SUB_GPU(type) \
+  REGISTER_SCATTER_ND_ADD_SUB(type, GPU);
+
+#define REGISTER_SCATTER_ND_UPDATE_GPU(type) \
+  REGISTER_SCATTER_ND_UPDATE(type, GPU);
+
+// TODO(simister): Re-enable when GPU support is working.
+// TF_CALL_GPU_NUMBER_TYPES_NO_HALF(REGISTER_SCATTER_ND_ADD_SUB_GPU);
+// TF_CALL_GPU_NUMBER_TYPES_NO_HALF(REGISTER_SCATTER_ND_UPDATE_GPU);
+
+#endif  // GOOGLE_CUDA
+
+#undef REGISTER_SCATTER_ND_ADD
+#undef REGISTER_SCATTER_ND_ADD_SUB
+#undef REGISTER_SCATTER_ND_ADD_SUB_CPU
+#undef REGISTER_SCATTER_ND_ADD_SUB_GPU
+#undef REGISTER_SCATTER_ND_UPDATE
+#undef REGISTER_SCATTER_ND_UPDATE_CPU
+#undef REGISTER_SCATTER_ND_UPDATE_GPU
+#undef REGISTER_SCATTER_ND_KERNEL
+#undef REGISTER_SCATTER_ND_KERNEL_INDEX
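Aside: these registration macros lean on token pasting — `DEVICE_##dev` and `dev##Device` turn the single argument `CPU` into both a builder constant and a device template argument. A minimal standalone illustration of that preprocessor trick (toy types, unrelated to TF):

```
#include <cstdio>

// Token-pasting pattern used by the registration macros above:
// dev##Device selects a device tag type per call site.
struct CPUDevice { static constexpr const char* name = "CPU"; };
struct GPUDevice { static constexpr const char* name = "GPU"; };

#define PRINT_DEVICE(dev) std::printf("%s\n", dev##Device::name)

int main() {
  PRINT_DEVICE(CPU);  // expands to CPUDevice::name
  PRINT_DEVICE(GPU);  // expands to GPUDevice::name
  return 0;
}
```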
+
+#if GOOGLE_CUDA
+// Forward declarations of the functor specializations for GPU.
+namespace functor {
+
+#define DECLARE_GPU_SPECS_OP(T, Index, op, NDIM)                     \
+  template <>                                                        \
+  Index ScatterNdFunctor<GPUDevice, T, Index, op, NDIM>::operator()( \
+      OpKernelContext* c, const GPUDevice& d,                        \
+      typename TTypes<T>::Tensor params,                             \
+      typename TTypes<Index>::ConstTensor indices,                   \
+      typename TTypes<T>::ConstTensor updates);                      \
+  extern template struct ScatterNdFunctor<GPUDevice, T, Index, op, NDIM>;
+
+#define DECLARE_GPU_SPECS_OPS(T, Index, op) \
+  DECLARE_GPU_SPECS_OP(T, Index, op, 0);    \
+  DECLARE_GPU_SPECS_OP(T, Index, op, 1);    \
+  DECLARE_GPU_SPECS_OP(T, Index, op, 2);    \
+  DECLARE_GPU_SPECS_OP(T, Index, op, 3);    \
+  DECLARE_GPU_SPECS_OP(T, Index, op, 4);    \
+  DECLARE_GPU_SPECS_OP(T, Index, op, 5)
+
+#define DECLARE_GPU_SPECS_INDEX(T, Index)                           \
+  DECLARE_GPU_SPECS_OPS(T, Index, scatter_nd_op::UpdateOp::ASSIGN); \
+  DECLARE_GPU_SPECS_OPS(T, Index, scatter_nd_op::UpdateOp::ADD);    \
+  DECLARE_GPU_SPECS_OPS(T, Index, scatter_nd_op::UpdateOp::SUB);    \
+  DECLARE_GPU_SPECS_OPS(T, Index, scatter_nd_op::UpdateOp::MUL);    \
+  DECLARE_GPU_SPECS_OPS(T, Index, scatter_nd_op::UpdateOp::DIV);
+
+#define DECLARE_GPU_SPECS(T)         \
+  DECLARE_GPU_SPECS_INDEX(T, int32); \
+  DECLARE_GPU_SPECS_INDEX(T, int64);
+
+// TODO(simister): Re-enable when GPU support is working.
+// TF_CALL_GPU_NUMBER_TYPES_NO_HALF(DECLARE_GPU_SPECS);
+
+#undef DECLARE_GPU_SPECS
+#undef DECLARE_GPU_SPECS_INDEX
+#undef DECLARE_GPU_SPECS_OPS
+#undef DECLARE_GPU_SPECS_OP
+
+}  // namespace functor
+#endif  // GOOGLE_CUDA
+
+}  // namespace tensorflow
diff --git a/tensorflow/core/kernels/scatter_nd_op.h b/tensorflow/core/kernels/scatter_nd_op.h
new file mode 100644
index 00000000000..51917b5a0de
--- /dev/null
+++ b/tensorflow/core/kernels/scatter_nd_op.h
@@ -0,0 +1,62 @@
+/* Copyright 2015 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#ifndef TENSORFLOW_KERNELS_SCATTER_ND_OP_H_
+#define TENSORFLOW_KERNELS_SCATTER_ND_OP_H_
+
+#include "third_party/eigen3/unsupported/Eigen/CXX11/Tensor"
+
+#include "tensorflow/core/framework/op_kernel.h"
+#include "tensorflow/core/framework/register_types.h"
+#include "tensorflow/core/framework/tensor.h"
+#include "tensorflow/core/framework/tensor_shape.h"
+#include "tensorflow/core/kernels/bounds_check.h"
+#include "tensorflow/core/kernels/fill_functor.h"
+#include "tensorflow/core/kernels/scatter_nd_op.h"
+#include "tensorflow/core/platform/mutex.h"
+#include "tensorflow/core/platform/types.h"
+#include "tensorflow/core/util/util.h"
+
+namespace tensorflow {
+
+typedef Eigen::ThreadPoolDevice CPUDevice;
+
+class OpKernelContext;
+
+namespace scatter_nd_op {
+
+enum class UpdateOp { ASSIGN, ADD, SUB, MUL, DIV };
+
+}  // namespace scatter_nd_op
+
+namespace functor {
+
+// Functor used by ScatterOp to do the computations.
+template <typename Device, typename T, typename Index,
+          scatter_nd_op::UpdateOp op, int IXDIM>
+struct ScatterNdFunctor {
+  // Returns -1 on success or a nonnegative i s.t. indices[i] is a bad index.
+  Index operator()(const Device& d, const Index slice_size,
+                   typename TTypes<int32>::Scalar Tscratch,
+                   typename TTypes<T, IXDIM + 1>::Tensor Tparams,
+                   typename TTypes<Index, 2>::ConstTensor Tindices,
+                   typename TTypes<T, 2>::ConstTensor Tupdates,
+                   typename TTypes<T, IXDIM + 1>::Tensor Toutput);
+};
+
+}  // namespace functor
+}  // namespace tensorflow
+
+#endif  // TENSORFLOW_KERNELS_SCATTER_ND_OP_H_
diff --git a/tensorflow/core/kernels/scatter_nd_op_cpu_impl.h b/tensorflow/core/kernels/scatter_nd_op_cpu_impl.h
new file mode 100644
index 00000000000..d2a7746c35e
--- /dev/null
+++ b/tensorflow/core/kernels/scatter_nd_op_cpu_impl.h
@@ -0,0 +1,224 @@
+/* Copyright 2015 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#ifndef THIRD_PARTY_TENSORFLOW_CORE_KERNELS_SCATTER_ND_OP_CPU_IMPL_H_
+#define THIRD_PARTY_TENSORFLOW_CORE_KERNELS_SCATTER_ND_OP_CPU_IMPL_H_
+
+// Functor definitions for ScatterND ops, must be compilable by nvcc.
+
+#define EIGEN_USE_THREADS
+
+#include <atomic>
+
+#include "third_party/eigen3/unsupported/Eigen/CXX11/Tensor"
+
+#include "tensorflow/core/framework/op_kernel.h"
+#include "tensorflow/core/framework/register_types.h"
+#include "tensorflow/core/framework/tensor.h"
+#include "tensorflow/core/framework/tensor_shape.h"
+#include "tensorflow/core/kernels/bounds_check.h"
+#include "tensorflow/core/kernels/fill_functor.h"
+#include "tensorflow/core/kernels/scatter_nd_op.h"
+#include "tensorflow/core/platform/mutex.h"
+#include "tensorflow/core/platform/types.h"
+#include "tensorflow/core/util/util.h"
+
+namespace tensorflow {
+
+typedef Eigen::ThreadPoolDevice CPUDevice;
+
+class OpKernelContext;
+
+// Specialization of UpdateExecutor to CPU
+namespace generator {
+
+template <typename T, typename Index, scatter_nd_op::UpdateOp op>
+class UpdateExecutor {
+ public:
+  static void Update(T* input, const T* updates, T* output, Index slice_size);
+};
+
+template <typename T, typename Index>
+class UpdateExecutor<T, Index, scatter_nd_op::UpdateOp::ASSIGN> {
+ public:
+  static void Update(T* /* unused */, const T* updates, T* output,
+                     Index slice_size) {
+    std::copy_n(updates, slice_size, output);
+  }
+};
+
+template <typename T, typename Index>
+class UpdateExecutor<T, Index, scatter_nd_op::UpdateOp::ADD> {
+ public:
+  static void Update(T* input, const T* updates, T* output, Index slice_size) {
+    std::transform(input, input + slice_size, updates, output, std::plus<T>());
+  }
+};
+
+template <typename T, typename Index>
+class UpdateExecutor<T, Index, scatter_nd_op::UpdateOp::SUB> {
+ public:
+  static void Update(T* input, const T* updates, T* output, Index slice_size) {
+    std::transform(input, input + slice_size, updates, output, std::minus<T>());
+  }
+};
+
+template <typename T, typename Index>
+class UpdateExecutor<T, Index, scatter_nd_op::UpdateOp::MUL> {
+ public:
+  static void Update(T* input, const T* updates, T* output, Index slice_size) {
+    std::transform(input, input + slice_size, updates, output,
+                   std::multiplies<T>());
+  }
+};
+
+template <typename T, typename Index>
+class UpdateExecutor<T, Index, scatter_nd_op::UpdateOp::DIV> {
+ public:
+  static void Update(T* input, const T* updates, T* output, Index slice_size) {
+    std::transform(input, input + slice_size, updates, output,
+                   std::divides<T>());
+  }
+};
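Aside: each specialization above is one STL algorithm applied to a contiguous slice. For instance, here is what the ADD executor does for a slice of length 4:

```
#include <algorithm>
#include <cstdio>
#include <functional>

int main() {
  // What UpdateExecutor<T, Index, ADD>::Update does for one slice of length 4.
  float input[4] = {1, 2, 3, 4};
  const float updates[4] = {10, 20, 30, 40};
  float output[4];
  std::transform(input, input + 4, updates, output, std::plus<float>());
  for (float v : output) std::printf("%g ", v);  // prints: 11 22 33 44
  std::printf("\n");
  return 0;
}
```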
+
+template <typename T, typename Index, scatter_nd_op::UpdateOp op, int IXDIM>
+class ScatterNdSliceGenerator {
+ public:
+  EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE ScatterNdSliceGenerator(
+      const Index slice_size, typename TTypes<T, IXDIM + 1>::Tensor Tparams,
+      typename TTypes<Index, 2>::ConstTensor Tindices,
+      typename TTypes<T, 2>::ConstTensor Tupdates,
+      typename TTypes<T, IXDIM + 1>::Tensor Toutput,
+      std::atomic<Index>* error_loc)
+      : slice_size_(slice_size),
+        Tparams_(Tparams),
+        Tindices_(Tindices),
+        Tupdates_(Tupdates),
+        Toutput_(Toutput),
+        error_loc_(error_loc) {}
+
+  EIGEN_DEVICE_FUNC bool GenerateIndices(
+      const Index loc, Eigen::array<Eigen::DenseIndex, IXDIM + 1>* ix) const {
+    (*ix)[IXDIM] = 0;
+    bool out_of_bounds = false;
+    for (int i = 0; i < IXDIM; ++i) {
+      const Index ix_i = internal::SubtleMustCopy(Tindices_(loc, i));
+      (*ix)[i] = ix_i;
+      out_of_bounds |= !FastBoundsCheck(ix_i, Tparams_.dimension(i));
+    }
+    return out_of_bounds;
+  }
+
+  EIGEN_DEVICE_FUNC EIGEN_ALWAYS_INLINE int32
+  operator()(const Eigen::array<Eigen::DenseIndex, 1>& loc_array) const {
+    auto loc = loc_array[0];
+    Eigen::array<Eigen::DenseIndex, IXDIM + 1> ix_params;
+    Eigen::array<Eigen::DenseIndex, 2> ix_updates;
+    ix_updates[0] = loc;
+    ix_updates[1] = 0;
+    const bool out_of_bounds = GenerateIndices(loc, &ix_params);
+    if (TF_PREDICT_FALSE(out_of_bounds)) {
+      error_loc_->store(loc);
+    } else {
+      UpdateExecutor<T, Index, op>::Update(&Tparams_(ix_params),
+                                           &Tupdates_(ix_updates),
+                                           &Toutput_(ix_params), slice_size_);
+    }
+    return static_cast<int32>(0);  // Return something...
+  }
+
+ protected:
+  const Index slice_size_;
+  mutable typename TTypes<T, IXDIM + 1>::Tensor Tparams_;
+  const typename TTypes<Index, 2>::ConstTensor Tindices_;
+  const typename TTypes<T, 2>::ConstTensor Tupdates_;
+  mutable typename TTypes<T, IXDIM + 1>::Tensor Toutput_;
+  std::atomic<Index>* error_loc_;
+};
+
+}  // namespace generator
+
+namespace functor {
+
+// Implementation of update functor for CPU.
+template <typename T, typename Index, scatter_nd_op::UpdateOp op, int IXDIM>
+struct ScatterNdFunctor<CPUDevice, T, Index, op, IXDIM> {
+  Index operator()(const CPUDevice& d, const Index slice_size,
+                   typename TTypes<int32>::Scalar Tscratch,
+                   typename TTypes<T, IXDIM + 1>::Tensor Tparams,
+                   typename TTypes<Index, 2>::ConstTensor Tindices,
+                   typename TTypes<T, 2>::ConstTensor Tupdates,
+                   typename TTypes<T, IXDIM + 1>::Tensor Toutput) {
+    std::atomic<Index> error_loc(-1);
+
+    const Eigen::DenseIndex batch_size = Tindices.dimension(0);
+#if !defined(EIGEN_HAS_INDEX_LIST)
+    Eigen::Tensor<Eigen::DenseIndex, 1>::Dimensions reshape_dims{{ 1 }};
+    Eigen::array<Eigen::DenseIndex, 1> broadcast_dims{{ batch_size }};
+#else
+    Eigen::IndexList<Eigen::type2index<1> > reshape_dims;
+    Eigen::IndexList<Eigen::DenseIndex> broadcast_dims;
+    broadcast_dims.set(0, batch_size);
+#endif
+
+    generator::ScatterNdSliceGenerator<T, Index, op, IXDIM> generator(
+        slice_size, Tparams, Tindices, Tupdates, Toutput, &error_loc);
+    Tscratch.device(d) = Tscratch.reshape(reshape_dims)
+                             .broadcast(broadcast_dims)
+                             .generate(generator)
+                             .sum();
+
+    // error_loc() returns -1 if there's no out-of-bounds index,
+    // otherwise it returns the location of an OOB index in Tindices.
+    return error_loc.load();
+  }
+};
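Aside: the `std::atomic<Index>` slot is how the parallel generator reports a bad index without locks — workers only ever store into it, and the caller reads it once after the expression runs. As in the functor, racing stores mean *some* offending location is reported, not necessarily the first. A minimal sketch of the same pattern with plain threads:

```
#include <atomic>
#include <cstdio>
#include <thread>
#include <vector>

int main() {
  const std::vector<int> indices = {0, 3, 97, 2};  // 97 is out of bounds
  const int limit = 8;
  std::atomic<int> error_loc(-1);

  std::vector<std::thread> workers;
  for (size_t i = 0; i < indices.size(); ++i) {
    workers.emplace_back([&, i] {
      if (indices[i] < 0 || indices[i] >= limit) {
        error_loc.store(static_cast<int>(i));  // report position, keep going
      }
      // ... otherwise apply the update for position i ...
    });
  }
  for (auto& t : workers) t.join();
  if (error_loc.load() >= 0) std::printf("bad index at %d\n", error_loc.load());
  return 0;
}
```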
+
+#define REGISTER_SCATTER_ND_FULL(T, Index, op)                               \
+  template Index                                                             \
+  ScatterNdFunctor<CPUDevice, T, Index, op, CPU_PROVIDED_IXDIM>::operator()( \
+      const CPUDevice& d, const Index slice_size,                            \
+      typename TTypes<int32>::Scalar Tscratch,                               \
+      typename TTypes<T, CPU_PROVIDED_IXDIM + 1>::Tensor Tparams,            \
+      typename TTypes<Index, 2>::ConstTensor Tindices,                       \
+      typename TTypes<T, 2>::ConstTensor Tupdates,                           \
+      typename TTypes<T, CPU_PROVIDED_IXDIM + 1>::Tensor Toutput)
+
+#define REGISTER_SCATTER_ND_INDEX(type, op)  \
+  REGISTER_SCATTER_ND_FULL(type, int32, op); \
+  REGISTER_SCATTER_ND_FULL(type, int64, op)
+
+#define REGISTER_SCATTER_ND_UPDATE(type) \
+  REGISTER_SCATTER_ND_INDEX(type, scatter_nd_op::UpdateOp::ASSIGN);
+
+#define REGISTER_SCATTER_ND_MATH(type)                           \
+  REGISTER_SCATTER_ND_INDEX(type, scatter_nd_op::UpdateOp::ADD); \
+  REGISTER_SCATTER_ND_INDEX(type, scatter_nd_op::UpdateOp::SUB); \
+  REGISTER_SCATTER_ND_INDEX(type, scatter_nd_op::UpdateOp::MUL); \
+  REGISTER_SCATTER_ND_INDEX(type, scatter_nd_op::UpdateOp::DIV);
+
+TF_CALL_ALL_TYPES(REGISTER_SCATTER_ND_UPDATE);
+TF_CALL_NUMBER_TYPES(REGISTER_SCATTER_ND_MATH)
+
+#undef REGISTER_SCATTER_ND_MATH
+#undef REGISTER_SCATTER_ND_UPDATE
+#undef REGISTER_SCATTER_ND_INDEX
+#undef REGISTER_SCATTER_ND_FULL
+
+}  // namespace functor
+
+}  // namespace tensorflow
+
+#endif  // THIRD_PARTY_TENSORFLOW_CORE_KERNELS_SCATTER_ND_OP_CPU_IMPL_H_
diff --git a/tensorflow/core/kernels/scatter_nd_op_cpu_impl_0.cc b/tensorflow/core/kernels/scatter_nd_op_cpu_impl_0.cc
new file mode 100644
index 00000000000..e978c5c348a
--- /dev/null
+++ b/tensorflow/core/kernels/scatter_nd_op_cpu_impl_0.cc
@@ -0,0 +1,18 @@
+/* Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#define CPU_PROVIDED_IXDIM 0
+#include "tensorflow/core/kernels/scatter_nd_op_cpu_impl.h"
+#undef CPU_PROVIDED_IXDIM
diff --git a/tensorflow/core/kernels/scatter_nd_op_cpu_impl_1.cc b/tensorflow/core/kernels/scatter_nd_op_cpu_impl_1.cc
new file mode 100644
index 00000000000..1c7867a1a2e
--- /dev/null
+++ b/tensorflow/core/kernels/scatter_nd_op_cpu_impl_1.cc
@@ -0,0 +1,18 @@
+/* Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#define CPU_PROVIDED_IXDIM 1
+#include "tensorflow/core/kernels/scatter_nd_op_cpu_impl.h"
+#undef CPU_PROVIDED_IXDIM
diff --git a/tensorflow/core/kernels/scatter_nd_op_cpu_impl_2.cc b/tensorflow/core/kernels/scatter_nd_op_cpu_impl_2.cc
new file mode 100644
index 00000000000..fe094c5e6b0
--- /dev/null
+++ b/tensorflow/core/kernels/scatter_nd_op_cpu_impl_2.cc
@@ -0,0 +1,18 @@
+/* Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#define CPU_PROVIDED_IXDIM 2
+#include "tensorflow/core/kernels/scatter_nd_op_cpu_impl.h"
+#undef CPU_PROVIDED_IXDIM
diff --git a/tensorflow/core/kernels/scatter_nd_op_cpu_impl_3.cc b/tensorflow/core/kernels/scatter_nd_op_cpu_impl_3.cc
new file mode 100644
index 00000000000..a8b0e32bda5
--- /dev/null
+++ b/tensorflow/core/kernels/scatter_nd_op_cpu_impl_3.cc
@@ -0,0 +1,18 @@
+/* Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#define CPU_PROVIDED_IXDIM 3
+#include "tensorflow/core/kernels/scatter_nd_op_cpu_impl.h"
+#undef CPU_PROVIDED_IXDIM
diff --git a/tensorflow/core/kernels/scatter_nd_op_cpu_impl_4.cc b/tensorflow/core/kernels/scatter_nd_op_cpu_impl_4.cc
new file mode 100644
index 00000000000..2cae469fcae
--- /dev/null
+++ b/tensorflow/core/kernels/scatter_nd_op_cpu_impl_4.cc
@@ -0,0 +1,18 @@
+/* Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#define CPU_PROVIDED_IXDIM 4
+#include "tensorflow/core/kernels/scatter_nd_op_cpu_impl.h"
+#undef CPU_PROVIDED_IXDIM
diff --git a/tensorflow/core/kernels/scatter_nd_op_cpu_impl_5.cc b/tensorflow/core/kernels/scatter_nd_op_cpu_impl_5.cc
new file mode 100644
index 00000000000..c6031fd7818
--- /dev/null
+++ b/tensorflow/core/kernels/scatter_nd_op_cpu_impl_5.cc
@@ -0,0 +1,19 @@
+
+/* Copyright 2016 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#define CPU_PROVIDED_IXDIM 5
+#include "tensorflow/core/kernels/scatter_nd_op_cpu_impl.h"
+#undef CPU_PROVIDED_IXDIM
diff --git a/tensorflow/core/kernels/scatter_nd_op_test.cc b/tensorflow/core/kernels/scatter_nd_op_test.cc
new file mode 100644
index 00000000000..d6743a68674
--- /dev/null
+++ b/tensorflow/core/kernels/scatter_nd_op_test.cc
@@ -0,0 +1,320 @@
+/* Copyright 2015 The TensorFlow Authors. All Rights Reserved.
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+==============================================================================*/
+
+#include <functional>
+#include <memory>
+#include <vector>
+
+#include "tensorflow/core/framework/allocator.h"
+#include "tensorflow/core/framework/fake_input.h"
+#include "tensorflow/core/framework/graph.pb.h"
+#include "tensorflow/core/framework/node_def_builder.h"
+#include "tensorflow/core/framework/op_kernel.h"
+#include "tensorflow/core/framework/tensor.h"
+#include "tensorflow/core/framework/types.h"
+#include "tensorflow/core/framework/types.pb.h"
+#include "tensorflow/core/kernels/ops_testutil.h"
+#include "tensorflow/core/kernels/ops_util.h"
+#include "tensorflow/core/lib/core/status_test_util.h"
+#include "tensorflow/core/lib/random/simple_philox.h"
+#include "tensorflow/core/platform/logging.h"
+#include "tensorflow/core/platform/test.h"
+#include "tensorflow/core/platform/test_benchmark.h"
+
+namespace tensorflow {
+namespace {
+
+class ScatterNdUpdateOpTest : public OpsTestBase {
+ protected:
+  void MakeOp(DataType variable_ref_type, DataType index_type) {
+    TF_ASSERT_OK(NodeDefBuilder("myop", "ScatterNdUpdate")
+                     .Input(FakeInput(variable_ref_type))
+                     .Input(FakeInput(index_type))
+                     .Input(FakeInput(RemoveRefType(variable_ref_type)))
+                     .Finalize(node_def()));
+    TF_ASSERT_OK(InitOp());
+  }
+};
+
+TEST_F(ScatterNdUpdateOpTest, Simple_StringType) {
+  MakeOp(DT_STRING_REF, DT_INT32);
+  AddInputFromArray<string>(TensorShape({1}), {"Brain"});
+  AddInputFromArray<int32>(TensorShape({1}), {0});
+  AddInputFromArray<string>(TensorShape({1}), {"TensorFlow"});
+  TF_ASSERT_OK(RunOpKernel());
+  // Check the new state of the input
+  Tensor params_tensor = *mutable_input(0).tensor;
+  Tensor expected(allocator(), DT_STRING, TensorShape({1}));
+  test::FillValues<string>(&expected, {"TensorFlow"});
+  test::ExpectTensorEqual<string>(expected, params_tensor);
+}
+
+TEST_F(ScatterNdUpdateOpTest, Simple_BoolType) {
+  MakeOp(DT_BOOL_REF, DT_INT32);
+  AddInputFromArray<bool>(TensorShape({1}), {false});
+  AddInputFromArray<int32>(TensorShape({1}), {0});
+  AddInputFromArray<bool>(TensorShape({1}), {true});
+  TF_ASSERT_OK(RunOpKernel());
+  // Check the new state of the input
+  Tensor params_tensor = *mutable_input(0).tensor;
+  Tensor expected(allocator(), DT_BOOL, TensorShape({1}));
+  test::FillValues<bool>(&expected, {true});
+  test::ExpectTensorEqual<bool>(expected, params_tensor);
+}
+
+TEST_F(ScatterNdUpdateOpTest, Simple_TwoD32) {
+  MakeOp(DT_FLOAT_REF, DT_INT32);
+
+  // Feed and run
+  AddInputFromArray<float>(TensorShape({5, 3}),
+                           {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0});
+  AddInputFromArray<int32>(TensorShape({3, 1}), {0, 4, 2});
+  AddInputFromArray<float>(TensorShape({3, 3}),
+                           {100, 101, 102, 777, 778, 779, 10000, 10001, 10002});
+  TF_ASSERT_OK(RunOpKernel());
+
+  // Check the new state of the input
+  Tensor params_tensor = *mutable_input(0).tensor;
+  Tensor expected(allocator(), DT_FLOAT, TensorShape({5, 3}));
+  test::FillValues<float>(&expected, {100, 101, 102, 0, 0, 0, 10000, 10001,
+                                      10002, 0, 0, 0, 777, 778, 779});
+  test::ExpectTensorEqual<float>(expected, params_tensor);
+}
+
+TEST_F(ScatterNdUpdateOpTest, Simple_Two64) {
+  MakeOp(DT_FLOAT_REF, DT_INT64);
+
+  // Feed and run
+  AddInputFromArray<float>(TensorShape({5, 3}),
+                           {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0});
+  AddInputFromArray<int64>(TensorShape({3, 1}), {0, 4, 2});
+  AddInputFromArray<float>(TensorShape({3, 3}),
+                           {100, 101, 102, 777, 778, 779, 10000, 10001, 10002});
+  TF_ASSERT_OK(RunOpKernel());
+
+  // Check the new state of the input
+  Tensor params_tensor = *mutable_input(0).tensor;
+  Tensor expected(allocator(), DT_FLOAT, TensorShape({5, 3}));
+  test::FillValues<float>(&expected, {100, 101, 102, 0, 0, 0, 10000, 10001,
+                                      10002, 0, 0, 0, 777, 778, 779});
+  test::ExpectTensorEqual<float>(expected, params_tensor);
+}
+/*TEST_F(ScatterNdUpdateOpTest, Simple_ZeroElements) {
+  MakeOp(DT_FLOAT_REF, DT_INT32);
+
+  // Feed and run
+  AddInputFromArray<float>(TensorShape({0}), {});
+  AddInputFromArray<int32>(TensorShape({0}), {});
+  AddInputFromArray<float>(TensorShape({0}), {});
+  Status s = RunOpKernel();
+  EXPECT_TRUE(StringPiece(s.ToString())
+                  .contains("Output must not have 0 elements, got shape: "))
+      << s;
+}*/
+
+TEST_F(ScatterNdUpdateOpTest, Simple_ZeroD) {
+  MakeOp(DT_FLOAT_REF, DT_INT32);
+
+  // Feed and run
+  AddInputFromArray<float>(TensorShape({5}), {0, 0, 0, 0, 0});
+  AddInputFromArray<int32>(TensorShape({1}), {3});
+  AddInputFromArray<float>(TensorShape({1}), {101});
+  TF_ASSERT_OK(RunOpKernel());
+
+  // Check the new state of the input
+  Tensor params_tensor = *mutable_input(0).tensor;
+  Tensor expected(allocator(), DT_FLOAT, TensorShape({5}));
+  test::FillValues<float>(&expected, {0, 0, 0, 101, 0});
+  test::ExpectTensorEqual<float>(expected, params_tensor);
+}
+
+TEST_F(ScatterNdUpdateOpTest, Simple_OneD) {
+  MakeOp(DT_FLOAT_REF, DT_INT32);
+
+  // Feed and run
+  AddInputFromArray<float>(TensorShape({5}), {0, 0, 0, 0, 0});
+  AddInputFromArray<int32>(TensorShape({3, 1}), {0, 4, 2});
+  AddInputFromArray<float>(TensorShape({3}), {100, 101, 102});
+  TF_ASSERT_OK(RunOpKernel());
+
+  // Check the new state of the input
+  Tensor params_tensor = *mutable_input(0).tensor;
+  Tensor expected(allocator(), DT_FLOAT, TensorShape({5}));
+  test::FillValues<float>(&expected, {100, 0, 102, 0, 101});
+  test::ExpectTensorEqual<float>(expected, params_tensor);
+}
+
+TEST_F(ScatterNdUpdateOpTest, HigherRank) {
+  MakeOp(DT_FLOAT_REF, DT_INT32);
+
+  // Feed and run
+  AddInputFromArray<float>(TensorShape({8}), {0, 0, 0, 0, 0, 0, 0, 0});
+  AddInputFromArray<int32>(TensorShape({2, 3, 1}), {0, 4, 2, 1, 3, 6});
+  AddInputFromArray<float>(TensorShape({2, 3}), {10, 20, 30, 40, 50, 60});
+  TF_ASSERT_OK(RunOpKernel());
+
+  // Check the new state of the input
+  Tensor params_tensor = *mutable_input(0).tensor;
+  Tensor expected(allocator(), DT_FLOAT, TensorShape({8}));
+  test::FillValues<float>(&expected, {10, 40, 30, 50, 20, 0, 60, 0});
+  test::ExpectTensorEqual<float>(expected, params_tensor);
+}
+
+TEST_F(ScatterNdUpdateOpTest, Error_IndexOutOfRange) {
+  MakeOp(DT_FLOAT_REF, DT_INT32);
+
+  // Feed and run
+  AddInputFromArray<float>(TensorShape({5, 3}),
+                           {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0});
+  AddInputFromArray<int32>(TensorShape({3, 1}), {0, 4, 99});
+  AddInputFromArray<float>(TensorShape({3, 3}),
+                           {100, 101, 102, 777, 778, 779, 10000, 10001, 10002});
+  Status s = RunOpKernel();
+  EXPECT_TRUE(StringPiece(s.ToString())
+                  .contains("Invalid indices: [2,0] = [99] is not in [0, 5)"))
+      << s;
+}
+
+TEST_F(ScatterNdUpdateOpTest, Error_WrongDimsIndices) {
+  MakeOp(DT_FLOAT_REF, DT_INT32);
+
+  // Feed and run
+  AddInputFromArray<float>(TensorShape({2, 3}), {0, 0, 0, 0, 0, 0});
+  AddInputFromArray<int32>(TensorShape({1, 3, 1}), {0, 4, 99});
+  AddInputFromArray<float>(TensorShape({3, 3}),
+                           {100, 101, 102, 777, 778, 779, 10000, 10001, 10002});
+  Status s = RunOpKernel();
+  EXPECT_TRUE(StringPiece(s.ToString())
+                  .contains("The outermost dimension of updates and indices "
+                            "must match. Got indices.shape [1,3,1], "
+                            "updates.shape [3,3]"))
+      << s;
+}
+
+TEST_F(ScatterNdUpdateOpTest, Error_MismatchedParamsAndUpdateDimensions) {
+  MakeOp(DT_FLOAT_REF, DT_INT32);
+
+  // Feed and run
+  AddInputFromArray<float>(TensorShape({5, 3}),
+                           {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0});
+  AddInputFromArray<int32>(TensorShape({3, 1}), {0, 4, 2});
+  AddInputFromArray<float>(
+      TensorShape({3, 4}),
+      {100, 101, 102, 103, 777, 778, 779, 780, 10000, 10001, 10002, 10004});
+  Status s = RunOpKernel();
+  EXPECT_TRUE(StringPiece(s.ToString())
+                  .contains("Must have updates.shape = indices.shape[0] + "
+                            "params_shape[IXDIM:], got"))
+
+      << s;
+}
+
+TEST_F(ScatterNdUpdateOpTest, Error_MismatchedIndicesAndUpdateDimensions) {
+  MakeOp(DT_FLOAT_REF, DT_INT32);
+
+  // Feed and run
+  AddInputFromArray<float>(TensorShape({5, 3}),
+                           {0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0});
+  AddInputFromArray<int32>(TensorShape({3, 1}), {0, 4, 2});
+  AddInputFromArray<float>(TensorShape({2, 3}),
+                           {100, 101, 102, 10000, 10001, 10002});
+  Status s = RunOpKernel();
+  EXPECT_TRUE(StringPiece(s.ToString())
+                  .contains("The outermost dimension of updates and indices "
+                            "must match. Got "))
+      << s;
+}
+
+class ScatterNdUpdateBM : public ScatterNdUpdateOpTest {
+ public:
+  virtual void TestBody() {}
+  void MakeBenchmarkOp(const char* op, DataType index_type) {
+    TF_ASSERT_OK(NodeDefBuilder("myop", op)
+                     .Input(FakeInput(DT_FLOAT_REF))
+                     .Input(FakeInput(index_type))
+                     .Input(FakeInput(DT_FLOAT))
+                     .Finalize(node_def()));
+    TF_CHECK_OK(InitOp());
+  }
+};
+
+template <typename Index>
+static void BM_ScatterNdHelper(int iters, int embedding_size, const char* op) {
+  testing::StopTiming();
+  const int kRows = 10000000 / embedding_size;
+  std::vector<float> values;
+  values.reserve(kRows);
+  for (int i = 0; i < kRows * embedding_size; i++) {
+    values.push_back(i);
+  }
+  const int kNumUpdates = 1000;
+  random::PhiloxRandom philox(301, 17);
+  random::SimplePhilox rnd(&philox);
+  std::vector<Index> indices;
+  std::vector<float> updates;
+  for (int i = 0; i < kNumUpdates; i++) {
+    indices.push_back(rnd.Uniform(kRows));
+    for (int j = 0; j < embedding_size; j++) {
+      updates.push_back(i * 10 + j);
+    }
+  }
+
+  ScatterNdUpdateBM bm;
+  bm.MakeBenchmarkOp(op, DataTypeToEnum<Index>::v());
+  bm.AddInputFromArray<float>(TensorShape({kRows, embedding_size}), values);
+  bm.AddInputFromArray<Index>(TensorShape({kNumUpdates}), indices);
+  bm.AddInputFromArray<float>(TensorShape({kNumUpdates, embedding_size}),
+                              updates);
+  testing::ItemsProcessed((static_cast<int64>(kNumUpdates) * embedding_size) *
+                          iters);
+  testing::StartTiming();
+  while (iters-- > 0) {
+    Status s = bm.RunOpKernel();
+  }
+  testing::StopTiming();
+}
+
+static void BM_ScatterNdUpdateInt32(int iters, int embedding_size) {
+  BM_ScatterNdHelper<int32>(iters, embedding_size, "ScatterNdUpdate");
+}
+static void BM_ScatterNdUpdateInt64(int iters, int embedding_size) {
+  BM_ScatterNdHelper<int64>(iters, embedding_size, "ScatterNdUpdate");
+}
+
+static void BM_ScatterNdAddInt32(int iters, int embedding_size) {
+  BM_ScatterNdHelper<int32>(iters, embedding_size, "ScatterNdAdd");
+}
+static void BM_ScatterNdAddInt64(int iters, int embedding_size) {
+  BM_ScatterNdHelper<int64>(iters, embedding_size, "ScatterNdAdd");
+}
+
+BENCHMARK(BM_ScatterNdUpdateInt32)
+    ->Arg(1)
+    ->Arg(10)
+    ->Arg(64)
+    ->Arg(256)
+    ->Arg(1024);
+BENCHMARK(BM_ScatterNdUpdateInt64)
+    ->Arg(1)
+    ->Arg(10)
+    ->Arg(64)
+    ->Arg(256)
+    ->Arg(1024);
+
+BENCHMARK(BM_ScatterNdAddInt32)->Arg(1)->Arg(10)->Arg(64)->Arg(256)->Arg(1024);
+BENCHMARK(BM_ScatterNdAddInt64)->Arg(1)->Arg(10)->Arg(64)->Arg(256)->Arg(1024);
+
+}  // namespace
+}  // namespace tensorflow
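Aside: one behavioral corner these tests do not pin down is duplicate indices. With ASSIGN the result depends on update order, while ADD commutes; a quick standalone check of the difference:

```
#include <cstdio>
#include <vector>

int main() {
  std::vector<float> assign_out(3, 0.0f), add_out(3, 0.0f);
  const int indices[] = {1, 1};                 // duplicate index
  const float updates[] = {5.0f, 7.0f};
  for (int i = 0; i < 2; ++i) {
    assign_out[indices[i]] = updates[i];        // last write wins: order-dependent
    add_out[indices[i]] += updates[i];          // commutative: always 12
  }
  std::printf("assign: %g, add: %g\n", assign_out[1], add_out[1]);
  return 0;
}
```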
diff --git a/tensorflow/core/kernels/sparse_tensor_dense_matmul_op.h b/tensorflow/core/kernels/sparse_tensor_dense_matmul_op.h
index 6106328e7ef..3bec4ce5f2d 100644
--- a/tensorflow/core/kernels/sparse_tensor_dense_matmul_op.h
+++ b/tensorflow/core/kernels/sparse_tensor_dense_matmul_op.h
@@ -55,34 +55,13 @@ EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE T MaybeConj(T v) {
   return v;
 }
 
-#ifdef __GCUDACC__
-// TODO(ebrevdo): remove this once a bugfix is in.
-#define MAYBE_CONJ(T)                                      \
-  template <>                                              \
-  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE T MaybeConj(T v) { \
-    assert(false && "Conjugation not supported");          \
-  }
-#else
-#define MAYBE_CONJ(T)                                      \
-  template <>                                              \
-  EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE T MaybeConj(T v) { \
-    return Eigen::numext::conj(v);                         \
-  }
-#endif
-
-MAYBE_CONJ(std::complex<float>);
-MAYBE_CONJ(std::complex<double>);
-MAYBE_CONJ(std::complex<long double>);
-
-#undef MAYBE_CONJ
-
 template <typename MATRIX>
 class MaybeAdjoint<MATRIX, true> {
  public:
   EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE MaybeAdjoint(MATRIX m) : m_(m) {}
   EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE typename MATRIX::Scalar operator()(
       const typename MATRIX::Index i, const typename MATRIX::Index j) const {
-    return MaybeConj(m_(j, i));
+    return Eigen::numext::conj(m_(j, i));
   }
 
  private:
diff --git a/tensorflow/core/kernels/whole_file_read_ops.cc b/tensorflow/core/kernels/whole_file_read_ops.cc
index e3d77b370bb..538e3bbc9eb 100644
--- a/tensorflow/core/kernels/whole_file_read_ops.cc
+++ b/tensorflow/core/kernels/whole_file_read_ops.cc
@@ -119,4 +119,28 @@ class ReadFileOp : public OpKernel {
 
 REGISTER_KERNEL_BUILDER(Name("ReadFile").Device(DEVICE_CPU), ReadFileOp);
 
+class WriteFileOp : public OpKernel {
+ public:
+  using OpKernel::OpKernel;
+  void Compute(OpKernelContext* context) override {
+    const Tensor* filename_input;
+    const Tensor* contents_input;
+    OP_REQUIRES_OK(context, context->input("filename", &filename_input));
+    OP_REQUIRES_OK(context, context->input("contents", &contents_input));
+    OP_REQUIRES(context, TensorShapeUtils::IsScalar(filename_input->shape()),
+                errors::InvalidArgument(
+                    "Input filename tensor must be scalar, but had shape: ",
+                    filename_input->shape().DebugString()));
+    OP_REQUIRES(context, TensorShapeUtils::IsScalar(contents_input->shape()),
+                errors::InvalidArgument(
+                    "Contents tensor must be scalar, but had shape: ",
+                    contents_input->shape().DebugString()));
+    OP_REQUIRES_OK(
+        context,
+        WriteStringToFile(context->env(), filename_input->scalar<string>()(),
+                          contents_input->scalar<string>()()));
+  }
+};
+
+REGISTER_KERNEL_BUILDER(Name("WriteFile").Device(DEVICE_CPU), WriteFileOp);
 }  // namespace tensorflow
diff --git a/tensorflow/core/lib/core/blocking_counter.h b/tensorflow/core/lib/core/blocking_counter.h
index b2411f5951f..5dab07dbef9 100644
--- a/tensorflow/core/lib/core/blocking_counter.h
+++ b/tensorflow/core/lib/core/blocking_counter.h
@@ -31,7 +31,7 @@ class BlockingCounter {
     DCHECK_EQ((initial_count << 1) >> 1, initial_count);
   }
 
-  ~BlockingCounter() { DCHECK_EQ(state_ >> 1, 0); }
+  ~BlockingCounter() {}
 
   inline void DecrementCount() {
     unsigned int v = state_.fetch_sub(2, std::memory_order_acq_rel) - 2;
@@ -53,6 +53,20 @@
       cond_var_.wait(l);
     }
   }
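Aside: the `WaitFor` added below is the standard timed variant of a condition-variable wait — re-check the predicate after every wake-up and convert `cv_status::timeout` into `false`. The same loop with plain standard-library types (the TF version uses its own `mutex`/`condition_variable` wrappers):

```
#include <chrono>
#include <condition_variable>
#include <mutex>

// Minimal timed-wait helper mirroring the loop in BlockingCounter::WaitFor.
// Standalone sketch with std types, not the TF wrappers.
bool WaitUntilNotified(std::mutex& mu, std::condition_variable& cv,
                       const bool& notified, std::chrono::milliseconds ms) {
  std::unique_lock<std::mutex> l(mu);
  while (!notified) {  // guard against spurious wake-ups
    if (cv.wait_for(l, ms) == std::cv_status::timeout) return false;
  }
  return true;
}
```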
+  // Wait for the specified time, return false iff the count has not dropped to
+  // zero before the timeout expired.
+  inline bool WaitFor(std::chrono::milliseconds ms) {
+    unsigned int v = state_.fetch_or(1, std::memory_order_acq_rel);
+    if ((v >> 1) == 0) return true;
+    mutex_lock l(mu_);
+    while (!notified_) {
+      const std::cv_status status = cond_var_.wait_for(l, ms);
+      if (status == std::cv_status::timeout) {
+        return false;
+      }
+    }
+    return true;
+  }
 
  private:
   mutex mu_;
diff --git a/tensorflow/core/lib/core/threadpool.cc b/tensorflow/core/lib/core/threadpool.cc
index c3704da0b12..534ef902fb9 100644
--- a/tensorflow/core/lib/core/threadpool.cc
+++ b/tensorflow/core/lib/core/threadpool.cc
@@ -88,16 +88,12 @@ struct ThreadPool::Impl : Eigen::ThreadPoolTempl<EigenEnvironment> {
 
   void ParallelFor(int64 total, int64 cost_per_unit,
                    std::function<void(int64, int64)> fn) {
-#ifdef EIGEN_USE_NONBLOCKING_THREAD_POOL
     CHECK_GE(total, 0);
     CHECK_EQ(total, (int64)(Eigen::Index)total);
     Eigen::ThreadPoolDevice device(this, this->NumThreads());
     device.parallelFor(
         total, Eigen::TensorOpCost(0, 0, cost_per_unit),
         [&fn](Eigen::Index first, Eigen::Index last) { fn(first, last); });
-#else
-    CHECK(0);  // should not be used with the old thread pool
-#endif
   }
 };
diff --git a/tensorflow/core/lib/core/threadpool_test.cc b/tensorflow/core/lib/core/threadpool_test.cc
index cf8926b54d1..c7d8db51364 100644
--- a/tensorflow/core/lib/core/threadpool_test.cc
+++ b/tensorflow/core/lib/core/threadpool_test.cc
@@ -57,7 +57,6 @@ TEST(ThreadPool, DoWork) {
   }
 }
 
-#ifdef EIGEN_USE_NONBLOCKING_THREAD_POOL
 TEST(ThreadPool, ParallelFor) {
   // Make ParallelFor use as many threads as possible.
   int64 kHugeCost = 1 << 30;
@@ -80,7 +79,6 @@ TEST(ThreadPool, ParallelFor) {
     }
   }
 }
-#endif
 
 static void BM_Sequential(int iters) {
   ThreadPool pool(Env::Default(), "test", kNumThreads);
diff --git a/tensorflow/core/lib/io/path.cc b/tensorflow/core/lib/io/path.cc
index de49d07d62b..31397722fe6 100644
--- a/tensorflow/core/lib/io/path.cc
+++ b/tensorflow/core/lib/io/path.cc
@@ -14,6 +14,7 @@ limitations under the License.
 ==============================================================================*/
 
 #include "tensorflow/core/lib/io/path.h"
+#include "tensorflow/core/lib/strings/scanner.h"
 #include "tensorflow/core/lib/strings/strcat.h"
 
 namespace tensorflow {
@@ -49,11 +50,14 @@ string JoinPathImpl(std::initializer_list<StringPiece> paths) {
   return result;
 }
 
-// Return the parts of the path, split on the final "/". If there is no
-// "/" in the path, the first part of the output is empty and the second
-// is the input. If the only "/" in the path is the first character, it is
-// the first part of the output.
-std::pair<StringPiece, StringPiece> SplitPath(StringPiece path) {
+// Return the parts of the URI, split on the final "/" in the path. If there is
+// no "/" in the path, the first part of the output is the scheme and host, and
+// the second is the path. If the only "/" in the path is the first character,
+// it is included in the first part of the output.
+std::pair<StringPiece, StringPiece> SplitPath(StringPiece uri) {
+  StringPiece scheme, host, path;
+  ParseURI(uri, &scheme, &host, &path);
+
   auto pos = path.rfind('/');
 #ifdef PLATFORM_WINDOWS
   if (pos == StringPiece::npos)
@@ -61,15 +65,17 @@ std::pair<StringPiece, StringPiece> SplitPath(StringPiece path) {
 #endif
   // Handle the case with no '/' in 'path'.
   if (pos == StringPiece::npos)
-    return std::make_pair(StringPiece(path.data(), 0), path);
+    return std::make_pair(StringPiece(uri.begin(), host.end() - uri.begin()),
+                          path);
 
   // Handle the case with a single leading '/' in 'path'.
   if (pos == 0)
-    return std::make_pair(StringPiece(path.data(), 1),
-                          StringPiece(path.data() + 1, path.size() - 1));
+    return std::make_pair(
+        StringPiece(uri.begin(), path.begin() + 1 - uri.begin()),
+        StringPiece(path.data() + 1, path.size() - 1));
 
   return std::make_pair(
-      StringPiece(path.data(), pos),
+      StringPiece(uri.begin(), path.begin() + pos - uri.begin()),
       StringPiece(path.data() + pos + 1, path.size() - (pos + 1)));
 }
 
@@ -185,5 +191,42 @@ string CleanPath(StringPiece unclean_path) {
   return path;
 }
 
+void ParseURI(StringPiece remaining, StringPiece* scheme, StringPiece* host,
+              StringPiece* path) {
+  // 0. Parse scheme
+  // Make sure scheme matches [a-zA-Z][0-9a-zA-Z.]*
+  // TODO(keveman): Allow "+" and "-" in the scheme.
+  if (!strings::Scanner(remaining)
+           .One(strings::Scanner::LETTER)
+           .Many(strings::Scanner::LETTER_DIGIT_DOT)
+           .StopCapture()
+           .OneLiteral("://")
+           .GetResult(&remaining, scheme)) {
+    // If there's no scheme, assume the entire string is a path.
+    *scheme = StringPiece(remaining.begin(), 0);
+    *host = StringPiece(remaining.begin(), 0);
+    *path = remaining;
+    return;
+  }
+
+  // 1. Parse host
+  if (!strings::Scanner(remaining).ScanUntil('/').GetResult(&remaining, host)) {
+    // No path, so the rest of the URI is the host.
+    *host = remaining;
+    *path = StringPiece(remaining.end(), 0);
+    return;
+  }
+
+  // 2. The rest is the path
+  *path = remaining;
+}
+
+string CreateURI(StringPiece scheme, StringPiece host, StringPiece path) {
+  if (scheme.empty()) {
+    return path.ToString();
+  }
+  return strings::StrCat(scheme, "://", host, path);
+}
+
 }  // namespace io
 }  // namespace tensorflow
diff --git a/tensorflow/core/lib/io/path.h b/tensorflow/core/lib/io/path.h
index 64165f857fe..955098f5b5e 100644
--- a/tensorflow/core/lib/io/path.h
+++ b/tensorflow/core/lib/io/path.h
@@ -74,6 +74,21 @@ StringPiece Extension(StringPiece path);
 // string manipulation, completely independent of process state.
 string CleanPath(StringPiece path);
 
+// Populates the scheme, host, and path from a URI. scheme, host, and path are
+// guaranteed by this function to point into the contents of uri, even if
+// empty.
+//
+// Corner cases:
+// - If the URI is invalid, scheme and host are set to empty strings and the
+//   passed string is assumed to be a path
+// - If the URI omits the path (e.g. file://host), then the path is left empty.
+void ParseURI(StringPiece uri, StringPiece* scheme, StringPiece* host,
+              StringPiece* path);
+
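Aside: the parsing contract above — the scheme must match `[a-zA-Z][0-9a-zA-Z.]*` followed by `://`, the host runs to the first `/`, and that `/` stays on the path — can be mimicked with plain `std::string` operations. A toy re-implementation of the behavior (not the Scanner-based code):

```
#include <cctype>
#include <cstdio>
#include <string>

// Toy version of the ParseURI contract, operating on copies instead of
// in-place StringPieces.
void ToyParseURI(const std::string& uri, std::string* scheme,
                 std::string* host, std::string* path) {
  const size_t sep = uri.find("://");
  bool has_scheme = sep != std::string::npos && sep > 0 &&
                    std::isalpha(static_cast<unsigned char>(uri[0]));
  for (size_t i = 1; has_scheme && i < sep; ++i) {
    const unsigned char c = uri[i];
    if (!std::isalnum(c) && c != '.') has_scheme = false;
  }
  if (!has_scheme) {
    *scheme = *host = "";
    *path = uri;  // invalid or missing scheme: treat the whole string as a path
    return;
  }
  *scheme = uri.substr(0, sep);
  const size_t slash = uri.find('/', sep + 3);
  if (slash == std::string::npos) {  // no path: the rest is the host
    *host = uri.substr(sep + 3);
    *path = "";
    return;
  }
  *host = uri.substr(sep + 3, slash - (sep + 3));
  *path = uri.substr(slash);  // leading '/' stays on the path
}

int main() {
  std::string s, h, p;
  ToyParseURI("hdfs://localhost:8020/path/to/file", &s, &h, &p);
  std::printf("%s | %s | %s\n", s.c_str(), h.c_str(), p.c_str());
  // prints: hdfs | localhost:8020 | /path/to/file
  return 0;
}
```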
+// Creates a URI from a scheme, host, and path. If the scheme is empty, we just
+// return the path.
+string CreateURI(StringPiece scheme, StringPiece host, StringPiece path);
+
 }  // namespace io
 }  // namespace tensorflow
diff --git a/tensorflow/core/lib/io/path_test.cc b/tensorflow/core/lib/io/path_test.cc
index f3f3d245d5d..e3275b93b68 100644
--- a/tensorflow/core/lib/io/path_test.cc
+++ b/tensorflow/core/lib/io/path_test.cc
@@ -45,6 +45,8 @@ TEST(PathTest, IsAbsolutePath) {
 }
 
 TEST(PathTest, Dirname) {
+  EXPECT_EQ("hdfs://127.0.0.1:9000/",
+            Dirname("hdfs://127.0.0.1:9000/train.csv.tfrecords"));
   EXPECT_EQ("/hello", Dirname("/hello/"));
   EXPECT_EQ("/", Dirname("/hello"));
   EXPECT_EQ("hello", Dirname("hello/world"));
@@ -97,5 +99,47 @@ TEST(PathTest, CleanPath) {
   EXPECT_EQ("../../bar", CleanPath("foo/../../../bar"));
 }
 
+#define EXPECT_PARSE_URI(uri, scheme, host, path)  \
+  do {                                             \
+    StringPiece u(uri);                            \
+    StringPiece s, h, p;                           \
+    ParseURI(u, &s, &h, &p);                       \
+    EXPECT_EQ(scheme, s.ToString());               \
+    EXPECT_EQ(host, h.ToString());                 \
+    EXPECT_EQ(path, p.ToString());                 \
+    EXPECT_EQ(uri, CreateURI(scheme, host, path)); \
+    EXPECT_LE(u.begin(), s.begin());               \
+    EXPECT_GE(u.end(), s.begin());                 \
+    EXPECT_LE(u.begin(), s.end());                 \
+    EXPECT_GE(u.end(), s.end());                   \
+    EXPECT_LE(u.begin(), h.begin());               \
+    EXPECT_GE(u.end(), h.begin());                 \
+    EXPECT_LE(u.begin(), h.end());                 \
+    EXPECT_GE(u.end(), h.end());                   \
+    EXPECT_LE(u.begin(), p.begin());               \
+    EXPECT_GE(u.end(), p.begin());                 \
+    EXPECT_LE(u.begin(), p.end());                 \
+    EXPECT_GE(u.end(), p.end());                   \
+  } while (0)
+
+TEST(PathTest, CreateParseURI) {
+  EXPECT_PARSE_URI("http://foo", "http", "foo", "");
+  EXPECT_PARSE_URI("/encrypted/://foo", "", "", "/encrypted/://foo");
+  EXPECT_PARSE_URI("/usr/local/foo", "", "", "/usr/local/foo");
+  EXPECT_PARSE_URI("file:///usr/local/foo", "file", "", "/usr/local/foo");
+  EXPECT_PARSE_URI("local.file:///usr/local/foo", "local.file", "",
+                   "/usr/local/foo");
+  EXPECT_PARSE_URI("a-b:///foo", "", "", "a-b:///foo");
+  EXPECT_PARSE_URI(":///foo", "", "", ":///foo");
+  EXPECT_PARSE_URI("9dfd:///foo", "", "", "9dfd:///foo");
+  EXPECT_PARSE_URI("file:", "", "", "file:");
+  EXPECT_PARSE_URI("file:/", "", "", "file:/");
+  EXPECT_PARSE_URI("hdfs://localhost:8020/path/to/file", "hdfs",
+                   "localhost:8020", "/path/to/file");
+  EXPECT_PARSE_URI("hdfs://localhost:8020", "hdfs", "localhost:8020", "");
+  EXPECT_PARSE_URI("hdfs://localhost:8020/", "hdfs", "localhost:8020", "/");
+}
+#undef EXPECT_PARSE_URI
+
 }  // namespace io
 }  // namespace tensorflow
diff --git a/tensorflow/core/ops/array_ops.cc b/tensorflow/core/ops/array_ops.cc
index a7fb3375c8f..ce1f76503c8 100644
--- a/tensorflow/core/ops/array_ops.cc
+++ b/tensorflow/core/ops/array_ops.cc
@@ -151,7 +151,7 @@ Status SetOutputShapeForReshape(InferenceContext* c) {
       TF_RETURN_IF_ERROR(c->Multiply(known_elems, dim, &known_elems));
     }
   }
-  if (!too_many_unknown) {
+  if (!too_many_unknown && c->Value(known_elems) != 0) {
     DimensionHandle inferred_dim;
     TF_RETURN_IF_ERROR(c->Divide(num_in_elems, c->Value(known_elems),
                                  true /* evenly_divisible */, &inferred_dim));
@@ -4387,6 +4387,83 @@ output_min: This value is copied from input_min.
 output_max: This value is copied from input_max.
 )Doc");
 
+REGISTER_OP("ScatterNd")
+    .Input("indices: Tindices")
+    .Input("updates: T")
+    .Input("shape: Tindices")
+    .Output("output: T")
+    .Attr("T: type")
+    .Attr("Tindices: {int32, int64}")
+    .Doc(
+        R"doc(Creates a new tensor by applying sparse `updates` to individual values or slices within a zero tensor of the given `shape` tensor according to indices.
+This operator is the inverse of the [tf.gather_nd](#gather_nd) operator, which extracts values or slices from a given tensor.
+
+TODO(simister): Add a link to Variable.__getitem__ documentation on slice syntax.
+
+`shape` is a `TensorShape` with rank `P` and `indices` is a `Tensor` of rank `Q`.
+
+`indices` must be an integer tensor, containing indices into `shape`.
+It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.
+
+The innermost dimension of `indices` (with length `K`) corresponds to
+indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th
+dimension of `shape`.
+
+`updates` is a `Tensor` of rank `Q-1+P-K` with shape:
+
+```
+[d_0, ..., d_{Q-2}, shape[K], ..., shape[P-1]].
+```
+
+The simplest form of scatter is to insert individual elements in a tensor by index. For example, say we want to insert 4 scattered elements in a rank-1 tensor with 8 elements.
+
+
+
+In Python, this scatter operation would look like this:
+
+    indices = tf.constant([[4], [3], [1], [7]])
+    updates = tf.constant([9, 10, 11, 12])
+    shape = tf.constant([8])
+    scatter = tf.scatter_nd(indices, updates, shape)
+    with tf.Session() as sess:
+      print sess.run(scatter)
+
+The resulting tensor would look like this:
+
+    [0, 11, 0, 10, 9, 0, 0, 12]
+
+We can also insert entire slices of a higher-rank tensor all at once. For example, say we want to insert two slices in the first dimension of a rank-3 tensor with two matrices of new values.
+
+
+ +In Python, this scatter operation would look like this: + + indices = tf.constant([[0], [2]]) + updates = tf.constant([[[5, 5, 5, 5], [6, 6, 6, 6], + [7, 7, 7, 7], [8, 8, 8, 8]], + [[5, 5, 5, 5], [6, 6, 6, 6], + [7, 7, 7, 7], [8, 8, 8, 8]]]) + shape = tf.constant([4, 4, 4]) + scatter = tf.scatter_nd(indices, updates, shape) + with tf.Session() as sess: + print sess.run(scatter) + +The resulting tensor would look like this: + + [[[5, 5, 5, 5], [6, 6, 6, 6], [7, 7, 7, 7], [8, 8, 8, 8]], + [[0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0]], + [[5, 5, 5, 5], [6, 6, 6, 6], [7, 7, 7, 7], [8, 8, 8, 8]], + [[0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0]]] + +indices: A Tensor. Must be one of the following types: int32, int64. A tensor of indices into ref. +updates: A Tensor. Must have the same type as tensor. A tensor of updated values to store in ref. +shape: A vector. The shape of the resulting tensor. +output: A new tensor with the given shape and updates applied according to the indices.)doc"); + REGISTER_OP("FakeQuantWithMinMaxArgs") .Attr("min: float = -6.0") .Attr("max: float = 6.0") @@ -4409,6 +4486,7 @@ REGISTER_OP("FakeQuantWithMinMaxArgsGradient") .Input("gradients: float") .Input("inputs: float") .Output("backprops: float") + .SetShapeFn(shape_inference::UnchangedShape) .Doc(R"doc( Compute gradients for a FakeQuantWithMinMaxArgs operation. @@ -4450,6 +4528,21 @@ REGISTER_OP("FakeQuantWithMinMaxVarsGradient") .Output("backprops_wrt_input: float") .Output("backprop_wrt_min: float") .Output("backprop_wrt_max: float") + .SetShapeFn([](InferenceContext* c) { + // gradients and inputs are same size. + ShapeHandle inputs; + TF_RETURN_IF_ERROR(c->Merge(c->input(0), c->input(1), &inputs)); + + // min and max are scalars + ShapeHandle min_max; + TF_RETURN_IF_ERROR(c->WithRank(c->input(2), 0, &min_max)); + TF_RETURN_IF_ERROR(c->Merge(min_max, c->input(3), &min_max)); + + c->set_output(0, inputs); + c->set_output(1, min_max); + c->set_output(2, min_max); + return Status::OK(); + }) .Doc(R"doc( Compute gradients for a FakeQuantWithMinMaxVars operation. @@ -4503,6 +4596,24 @@ REGISTER_OP("FakeQuantWithMinMaxVarsPerChannelGradient") .Output("backprops_wrt_input: float") .Output("backprop_wrt_min: float") .Output("backprop_wrt_max: float") + .SetShapeFn([](InferenceContext* c) { + ShapeHandle inputs; + TF_RETURN_IF_ERROR(c->WithRankAtLeast(c->input(0), 1, &inputs)); + TF_RETURN_IF_ERROR(c->WithRankAtMost(inputs, 4, &inputs)); + TF_RETURN_IF_ERROR(c->Merge(inputs, c->input(1), &inputs)); + + ShapeHandle last_dim = c->Vector(c->Dim(inputs, -1)); + + ShapeHandle min_max; + TF_RETURN_IF_ERROR(c->WithRank(c->input(2), 1, &min_max)); + TF_RETURN_IF_ERROR(c->Merge(min_max, last_dim, &min_max)); + TF_RETURN_IF_ERROR(c->Merge(c->input(3), min_max, &min_max)); + + c->set_output(0, inputs); + c->set_output(1, min_max); + c->set_output(2, min_max); + return Status::OK(); + }) .Doc(R"doc( Compute gradients for a FakeQuantWithMinMaxVarsPerChannel operation. diff --git a/tensorflow/core/ops/array_ops_test.cc b/tensorflow/core/ops/array_ops_test.cc index 7f7861384cb..691380fd265 100644 --- a/tensorflow/core/ops/array_ops_test.cc +++ b/tensorflow/core/ops/array_ops_test.cc @@ -718,6 +718,14 @@ TEST(ArrayOpsTest, Reshape_ShapeFn) { INFER_ERROR( "Cannot reshape a tensor with 2 elements to shape [] (1 elements)", op, "[1,2];[0]"); + + // Reshaping a tensor with no elements. 
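+  // (This exercises the new `c->Value(known_elems) != 0` guard in
+  // SetOutputShapeForReshape above: when the known output dims multiply
+  // to 0, the divide that would infer a -1 dim is skipped, so that dim
+  // stays unknown, as in the "[0,?]" expectation below.)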
+  new_shape = test::AsTensor<int32>({-1});
+  INFER_OK(op, "[0];[1]", "[0]");
+  new_shape = test::AsTensor<int32>({-1, 6});
+  INFER_OK(op, "[0,2];[1]", "[0,6]");
+  new_shape = test::AsTensor<int32>({0, -1});
+  INFER_OK(op, "[0,2];[1]", "[0,?]");
}
TEST(ArrayOpsTest, QuantizedReshape_ShapeFn) {
@@ -1525,4 +1533,23 @@ TEST(ArrayOpsTest, FakeQuantWithMinMaxVarsPerChannel) {
  INFER_ERROR("must be equal", op, "[5];[4];[?]");
}
+TEST(ArrayOpsTest, FakeQuantWithMinMaxVarsPerChannelGradient) {
+  ShapeInferenceTestOp op("FakeQuantWithMinMaxVarsPerChannelGradient");
+
+  INFER_OK(op, "?;?;?;?", "?;[?];[?]");
+  INFER_OK(op, "[3];[3];[3];[3]", "in0;in3;in3");
+  INFER_OK(op, "[1,3];[1,3];[3];[3]", "in0;in3;in3");
+  INFER_OK(op, "[1,2,3,4];[1,2,3,4];[4];[4]", "in0;in3;in3");
+
+  // Rank check vectors.
+  INFER_ERROR("be equal rank", op, "[1,?,3];[1,?,3];[3];[]");
+  INFER_ERROR("be rank 1", op, "[1,?,3];[1,?,3];[];[3]");
+  INFER_ERROR("be at least rank 1", op, "[];[];[1];[1]");
+  INFER_ERROR("be at most rank 4", op, "[1,2,3,4,5];[1,2,3,4,5];[1];[1]");
+
+  // Vectors must match each other, and match last dim of input.
+  INFER_ERROR("must be equal", op, "[1,3];[1,3];[2];[3]");
+  INFER_ERROR("must be equal", op, "[1,3];[1,3];[3];[2]");
+}
+
} // end namespace tensorflow
diff --git a/tensorflow/core/ops/compat/ops_history.v0.pbtxt b/tensorflow/core/ops/compat/ops_history.v0.pbtxt
index b7a7c3e73fd..9859a763d3e 100644
--- a/tensorflow/core/ops/compat/ops_history.v0.pbtxt
+++ b/tensorflow/core/ops/compat/ops_history.v0.pbtxt
@@ -24732,6 +24732,321 @@ op {
    }
  }
}
+op {
+  name: "ScatterNd"
+  input_arg {
+    name: "indices"
+    type_attr: "Tindices"
+  }
+  input_arg {
+    name: "updates"
+    type_attr: "T"
+  }
+  input_arg {
+    name: "shape"
+    type_attr: "Tindices"
+  }
+  output_arg {
+    name: "output"
+    type_attr: "T"
+  }
+  attr {
+    name: "T"
+    type: "type"
+  }
+  attr {
+    name: "Tindices"
+    type: "type"
+    allowed_values {
+      list {
+        type: DT_INT32
+        type: DT_INT64
+      }
+    }
+  }
+}
+op {
+  name: "ScatterNdAdd"
+  input_arg {
+    name: "ref"
+    type_attr: "T"
+    is_ref: true
+  }
+  input_arg {
+    name: "indices"
+    type_attr: "Tindices"
+  }
+  input_arg {
+    name: "updates"
+    type_attr: "T"
+  }
+  output_arg {
+    name: "output_ref"
+    type_attr: "T"
+    is_ref: true
+  }
+  attr {
+    name: "T"
+    type: "type"
+    allowed_values {
+      list {
+        type: DT_FLOAT
+        type: DT_DOUBLE
+        type: DT_INT64
+        type: DT_INT32
+        type: DT_UINT8
+        type: DT_UINT16
+        type: DT_INT16
+        type: DT_INT8
+        type: DT_COMPLEX64
+        type: DT_COMPLEX128
+        type: DT_QINT8
+        type: DT_QUINT8
+        type: DT_QINT32
+        type: DT_HALF
+      }
+    }
+  }
+  attr {
+    name: "Tindices"
+    type: "type"
+    allowed_values {
+      list {
+        type: DT_INT32
+        type: DT_INT64
+      }
+    }
+  }
+  attr {
+    name: "use_locking"
+    type: "bool"
+    default_value {
+      b: false
+    }
+  }
+}
+op {
+  name: "ScatterNdDiv"
+  input_arg {
+    name: "ref"
+    type_attr: "T"
+    is_ref: true
+  }
+  input_arg {
+    name: "indices"
+    type_attr: "Tindices"
+  }
+  input_arg {
+    name: "updates"
+    type_attr: "T"
+  }
+  output_arg {
+    name: "output_ref"
+    type_attr: "T"
+    is_ref: true
+  }
+  attr {
+    name: "T"
+    type: "type"
+    allowed_values {
+      list {
+        type: DT_FLOAT
+        type: DT_DOUBLE
+        type: DT_INT64
+        type: DT_INT32
+        type: DT_UINT8
+        type: DT_UINT16
+        type: DT_INT16
+        type: DT_INT8
+        type: DT_COMPLEX64
+        type: DT_COMPLEX128
+        type: DT_QINT8
+        type: DT_QUINT8
+        type: DT_QINT32
+        type: DT_HALF
+      }
+    }
+  }
+  attr {
+    name: "Tindices"
+    type: "type"
+    allowed_values {
+      list {
+        type: DT_INT32
+        type: DT_INT64
+      }
+    }
+  }
+  attr {
+    name: "use_locking"
+    type: "bool"
+    default_value {
+      b: false
+
} + } +} +op { + name: "ScatterNdMul" + input_arg { + name: "ref" + type_attr: "T" + is_ref: true + } + input_arg { + name: "indices" + type_attr: "Tindices" + } + input_arg { + name: "updates" + type_attr: "T" + } + output_arg { + name: "output_ref" + type_attr: "T" + is_ref: true + } + attr { + name: "T" + type: "type" + allowed_values { + list { + type: DT_FLOAT + type: DT_DOUBLE + type: DT_INT64 + type: DT_INT32 + type: DT_UINT8 + type: DT_UINT16 + type: DT_INT16 + type: DT_INT8 + type: DT_COMPLEX64 + type: DT_COMPLEX128 + type: DT_QINT8 + type: DT_QUINT8 + type: DT_QINT32 + type: DT_HALF + } + } + } + attr { + name: "Tindices" + type: "type" + allowed_values { + list { + type: DT_INT32 + type: DT_INT64 + } + } + } + attr { + name: "use_locking" + type: "bool" + default_value { + b: false + } + } +} +op { + name: "ScatterNdSub" + input_arg { + name: "ref" + type_attr: "T" + is_ref: true + } + input_arg { + name: "indices" + type_attr: "Tindices" + } + input_arg { + name: "updates" + type_attr: "T" + } + output_arg { + name: "output_ref" + type_attr: "T" + is_ref: true + } + attr { + name: "T" + type: "type" + allowed_values { + list { + type: DT_FLOAT + type: DT_DOUBLE + type: DT_INT64 + type: DT_INT32 + type: DT_UINT8 + type: DT_UINT16 + type: DT_INT16 + type: DT_INT8 + type: DT_COMPLEX64 + type: DT_COMPLEX128 + type: DT_QINT8 + type: DT_QUINT8 + type: DT_QINT32 + type: DT_HALF + } + } + } + attr { + name: "Tindices" + type: "type" + allowed_values { + list { + type: DT_INT32 + type: DT_INT64 + } + } + } + attr { + name: "use_locking" + type: "bool" + default_value { + b: false + } + } +} +op { + name: "ScatterNdUpdate" + input_arg { + name: "ref" + type_attr: "T" + is_ref: true + } + input_arg { + name: "indices" + type_attr: "Tindices" + } + input_arg { + name: "updates" + type_attr: "T" + } + output_arg { + name: "output_ref" + type_attr: "T" + is_ref: true + } + attr { + name: "T" + type: "type" + } + attr { + name: "Tindices" + type: "type" + allowed_values { + list { + type: DT_INT32 + type: DT_INT64 + } + } + } + attr { + name: "use_locking" + type: "bool" + default_value { + b: true + } + } +} op { name: "ScatterSub" input_arg { diff --git a/tensorflow/core/ops/io_ops.cc b/tensorflow/core/ops/io_ops.cc index 83f0542e02d..1167461e9e5 100644 --- a/tensorflow/core/ops/io_ops.cc +++ b/tensorflow/core/ops/io_ops.cc @@ -582,6 +582,22 @@ REGISTER_OP("ReadFile") Reads and outputs the entire contents of the input filename. )doc"); +REGISTER_OP("WriteFile") + .Input("filename: string") + .Input("contents: string") + .SetShapeFn([](InferenceContext* c) { + ShapeHandle unused; + TF_RETURN_IF_ERROR(c->WithRank(c->input(0), 0, &unused)); + TF_RETURN_IF_ERROR(c->WithRank(c->input(1), 0, &unused)); + return Status::OK(); + }) + .Doc(R"doc( +Writes contents to the file at input filename. Creates file if not existing. + +filename: scalar. The name of the file to which we write the contents. +contents: scalar. The content to be written to the output file. +)doc"); + REGISTER_OP("MatchingFiles") .Input("pattern: string") .Output("filenames: string") diff --git a/tensorflow/core/ops/math_ops.cc b/tensorflow/core/ops/math_ops.cc index ff00214da3c..7d3e212d279 100644 --- a/tensorflow/core/ops/math_ops.cc +++ b/tensorflow/core/ops/math_ops.cc @@ -296,6 +296,13 @@ Computes natural logarithm of x element-wise. I.e., \\(y = \log_e x\\). )doc"); +REGISTER_OP("Log1p") + .UNARY_COMPLEX() + .Doc(R"doc( +Computes natural logarithm of (1 + x) element-wise. +I.e., \\(y = \log_e (1 + x)\\). 
+)doc"); + REGISTER_OP("Tanh") .UNARY_COMPLEX() .Doc(R"doc( diff --git a/tensorflow/core/ops/ops.pbtxt b/tensorflow/core/ops/ops.pbtxt index 512b3dcd666..44f109a33cb 100644 --- a/tensorflow/core/ops/ops.pbtxt +++ b/tensorflow/core/ops/ops.pbtxt @@ -15427,6 +15427,362 @@ op { summary: "Multiplies sparse updates into a variable reference." description: "This operation computes\n\n # Scalar indices\n ref[indices, ...] *= updates[...]\n\n # Vector indices (for each i)\n ref[indices[i], ...] *= updates[i, ...]\n\n # High rank indices (for each i, ..., j)\n ref[indices[i, ..., j], ...] *= updates[i, ..., j, ...]\n\nThis operation outputs `ref` after the update is done.\nThis makes it easier to chain operations that need to use the reset value.\n\nDuplicate entries are handled correctly: if multiple `indices` reference\nthe same location, their contributions multiply.\n\nRequires `updates.shape = indices.shape + ref.shape[1:]`." } +op { + name: "ScatterNd" + input_arg { + name: "indices" + description: "A Tensor. Must be one of the following types: int32, int64. A tensor of indices into ref." + type_attr: "Tindices" + } + input_arg { + name: "updates" + description: "A Tensor. Must have the same type as tensor. A tensor of updated values to store in ref." + type_attr: "T" + } + input_arg { + name: "shape" + description: "A vector. The shape of the resulting tensor." + type_attr: "Tindices" + } + output_arg { + name: "output" + description: "A new tensor with the given shape and updates applied according to the indices." + type_attr: "T" + } + attr { + name: "T" + type: "type" + } + attr { + name: "Tindices" + type: "type" + allowed_values { + list { + type: DT_INT32 + type: DT_INT64 + } + } + } + summary: "Creates a new tensor by applying sparse `updates` to individual values or slices within a zero tensor of the given `shape` tensor according to indices." + description: "This operator is the inverse of the [tf.gather_nd](#gather_nd) operator which extracts values or slices from a given tensor.\n\nTODO(simister): Add a link to Variable.__getitem__ documentation on slice syntax.\n\n`shape` is a `TensorShape` with rank `P` and `indices` is a `Tensor` of rank `Q`.\n\n`indices` must be integer tensor, containing indices into `shape`.\nIt must be shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.\n\nThe innermost dimension of `indices` (with length `K`) corresponds to\nindices into elements (if `K = P`) or slices (if `K < P`) along the `K`th\ndimension of `shape`.\n\n`updates` is Tensor of rank `Q-1+P-K` with shape:\n\n```\n[d_0, ..., d_{Q-2}, shape[K], ..., shape[P-1]].\n```\n\nThe simplest form of scatter is to insert individual elements in a tensor by index. For example, say we want to insert 4 scattered elements in a rank-1 tensor with 8 elements.\n\n
\n\nIn Python, this scatter operation would look like this:\n\n indices = tf.constant([[4], [3], [1], [7]])\n updates = tf.constant([9, 10, 11, 12])\n shape = tf.constant([8])\n scatter = tf.scatter_nd(indices, updates, shape)\n with tf.Session() as sess:\n print sess.run(scatter)\n\nThe resulting tensor would look like this:\n\n [0, 11, 0, 10, 9, 0, 0, 12]\n\nWe can also, insert entire slices of a higher rank tensor all at once. For example, if we wanted to insert two slices in the first dimension of a rank-3 tensor with two matrices of new values.\n\n
\n\nIn Python, this scatter operation would look like this:\n\n indices = tf.constant([[0], [2]])\n updates = tf.constant([[[5, 5, 5, 5], [6, 6, 6, 6],\n [7, 7, 7, 7], [8, 8, 8, 8]],\n [[5, 5, 5, 5], [6, 6, 6, 6],\n [7, 7, 7, 7], [8, 8, 8, 8]]])\n shape = tf.constant([4, 4, 4])\n scatter = tf.scatter_nd(indices, updates, shape)\n with tf.Session() as sess:\n print sess.run(scatter)\n\nThe resulting tensor would look like this:\n\n [[[5, 5, 5, 5], [6, 6, 6, 6], [7, 7, 7, 7], [8, 8, 8, 8]],\n [[0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0]],\n [[5, 5, 5, 5], [6, 6, 6, 6], [7, 7, 7, 7], [8, 8, 8, 8]],\n [[0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0]]]" +} +op { + name: "ScatterNdAdd" + input_arg { + name: "ref" + description: "A mutable Tensor. Should be from a Variable node." + type_attr: "T" + is_ref: true + } + input_arg { + name: "indices" + description: "A Tensor. Must be one of the following types: int32, int64. A tensor of indices into ref." + type_attr: "Tindices" + } + input_arg { + name: "updates" + description: "A Tensor. Must have the same type as ref. A tensor of updated values to add to ref." + type_attr: "T" + } + output_arg { + name: "output_ref" + description: "Same as ref. Returned as a convenience for operations that want to use the updated values after the update is done." + type_attr: "T" + is_ref: true + } + attr { + name: "T" + type: "type" + allowed_values { + list { + type: DT_FLOAT + type: DT_DOUBLE + type: DT_INT64 + type: DT_INT32 + type: DT_UINT8 + type: DT_UINT16 + type: DT_INT16 + type: DT_INT8 + type: DT_COMPLEX64 + type: DT_COMPLEX128 + type: DT_QINT8 + type: DT_QUINT8 + type: DT_QINT32 + type: DT_HALF + } + } + } + attr { + name: "Tindices" + type: "type" + allowed_values { + list { + type: DT_INT32 + type: DT_INT64 + } + } + } + attr { + name: "use_locking" + type: "bool" + default_value { + b: false + } + description: "An optional bool. Defaults to True. If True, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention." + } + summary: "Applies sparse addition between `updates` and individual values or slices within a given variable according to `indices`." + description: "`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`.\n\n`indices` must be integer tensor, containing indices into `ref`.\nIt must be shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.\n\nThe innermost dimension of `indices` (with length `K`) corresponds to\nindices into elements (if `K = P`) or slices (if `K < P`) along the `K`th\ndimension of `ref`.\n\n`updates` is `Tensor` of rank `Q-1+P-K` with shape:\n\n```\n[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]].\n```\n\nFor example, say we want to add 4 scattered elements to a rank-1 tensor to 8 elements. In Python, that addition would look like this:\n\n ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8])\n indices = tf.constant([[4], [3], [1], [7]])\n updates = tf.constant([9, 10, 11, 12])\n add = tf.scatter_nd_add(ref, indices, updates)\n with tf.Session() as sess:\n print sess.run(add)\n\nThe resulting update to ref would look like this:\n\n [1, 13, 3, 14, 14, 6, 7, 20]\n\nSee [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices." +} +op { + name: "ScatterNdDiv" + input_arg { + name: "ref" + description: "A mutable Tensor. Should be from a Variable node." + type_attr: "T" + is_ref: true + } + input_arg { + name: "indices" + description: "A Tensor. Must be one of the following types: int32, int64. 
A tensor of indices into ref."
+    type_attr: "Tindices"
+  }
+  input_arg {
+    name: "updates"
+    description: "A Tensor. Must have the same type as ref. A tensor of updated values to divide ref by."
+    type_attr: "T"
+  }
+  output_arg {
+    name: "output_ref"
+    description: "Same as ref. Returned as a convenience for operations that want to use the updated values after the update is done."
+    type_attr: "T"
+    is_ref: true
+  }
+  attr {
+    name: "T"
+    type: "type"
+    allowed_values {
+      list {
+        type: DT_FLOAT
+        type: DT_DOUBLE
+        type: DT_INT64
+        type: DT_INT32
+        type: DT_UINT8
+        type: DT_UINT16
+        type: DT_INT16
+        type: DT_INT8
+        type: DT_COMPLEX64
+        type: DT_COMPLEX128
+        type: DT_QINT8
+        type: DT_QUINT8
+        type: DT_QINT32
+        type: DT_HALF
+      }
+    }
+  }
+  attr {
+    name: "Tindices"
+    type: "type"
+    allowed_values {
+      list {
+        type: DT_INT32
+        type: DT_INT64
+      }
+    }
+  }
+  attr {
+    name: "use_locking"
+    type: "bool"
+    default_value {
+      b: false
+    }
+    description: "An optional bool. Defaults to False. If True, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention."
+  }
+  summary: "Applies sparse division between `updates` and individual values or slices within a given variable according to `indices`."
+  description: "`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`.\n\n`indices` must be an integer tensor, containing indices into `ref`.\nIt must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.\n\nThe innermost dimension of `indices` (with length `K`) corresponds to\nindices into elements (if `K = P`) or slices (if `K < P`) along the `K`th\ndimension of `ref`.\n\n`updates` is a `Tensor` of rank `Q-1+P-K` with shape:\n\n```\n[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]].\n```\n\nFor example, say we want to divide a rank-1 tensor with 8 elements by 4 scattered elements. In Python, that division would look like this:\n\n    ref = tf.Variable([10, 20, 30, 40, 50, 60, 70, 80])\n    indices = tf.constant([[4], [3], [1], [7]])\n    updates = tf.constant([2, 3, 4, 5])\n    div = tf.scatter_nd_div(ref, indices, updates)\n    with tf.Session() as sess:\n      print sess.run(div)\n\nThe resulting update to ref would look like this:\n\n    [10, 5, 30, 13, 25, 60, 70, 16]\n\nSee [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices."
+}
+op {
+  name: "ScatterNdMul"
+  input_arg {
+    name: "ref"
+    description: "A mutable Tensor. Should be from a Variable node."
+    type_attr: "T"
+    is_ref: true
+  }
+  input_arg {
+    name: "indices"
+    description: "A Tensor. Must be one of the following types: int32, int64. A tensor of indices into ref."
+    type_attr: "Tindices"
+  }
+  input_arg {
+    name: "updates"
+    description: "A Tensor. Must have the same type as ref. A tensor of updated values to multiply ref by."
+    type_attr: "T"
+  }
+  output_arg {
+    name: "output_ref"
+    description: "Same as ref. Returned as a convenience for operations that want to use the updated values after the update is done."
+    type_attr: "T"
+    is_ref: true
+  }
+  attr {
+    name: "T"
+    type: "type"
+    allowed_values {
+      list {
+        type: DT_FLOAT
+        type: DT_DOUBLE
+        type: DT_INT64
+        type: DT_INT32
+        type: DT_UINT8
+        type: DT_UINT16
+        type: DT_INT16
+        type: DT_INT8
+        type: DT_COMPLEX64
+        type: DT_COMPLEX128
+        type: DT_QINT8
+        type: DT_QUINT8
+        type: DT_QINT32
+        type: DT_HALF
+      }
+    }
+  }
+  attr {
+    name: "Tindices"
+    type: "type"
+    allowed_values {
+      list {
+        type: DT_INT32
+        type: DT_INT64
+      }
+    }
+  }
+  attr {
+    name: "use_locking"
+    type: "bool"
+    default_value {
+      b: false
+    }
+    description: "An optional bool. Defaults to False. If True, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention."
+  }
+  summary: "Applies sparse multiplication between `updates` and individual values or slices within a given variable according to `indices`."
+  description: "`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`.\n\n`indices` must be an integer tensor, containing indices into `ref`.\nIt must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.\n\nThe innermost dimension of `indices` (with length `K`) corresponds to\nindices into elements (if `K = P`) or slices (if `K < P`) along the `K`th\ndimension of `ref`.\n\n`updates` is a `Tensor` of rank `Q-1+P-K` with shape:\n\n```\n[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]].\n```\n\nFor example, say we want to multiply 4 scattered elements with a rank-1 tensor with 8 elements. In Python, that multiplication would look like this:\n\n    ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8])\n    indices = tf.constant([[4], [3], [1], [7]])\n    updates = tf.constant([9, 10, 11, 12])\n    mul = tf.scatter_nd_mul(ref, indices, updates)\n    with tf.Session() as sess:\n      print sess.run(mul)\n\nThe resulting update to ref would look like this:\n\n    [1, 22, 3, 40, 45, 6, 7, 96]\n\nSee [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices."
+}
+op {
+  name: "ScatterNdSub"
+  input_arg {
+    name: "ref"
+    description: "A mutable Tensor. Should be from a Variable node."
+    type_attr: "T"
+    is_ref: true
+  }
+  input_arg {
+    name: "indices"
+    description: "A Tensor. Must be one of the following types: int32, int64. A tensor of indices into ref."
+    type_attr: "Tindices"
+  }
+  input_arg {
+    name: "updates"
+    description: "A Tensor. Must have the same type as ref. A tensor of updated values to subtract from ref."
+    type_attr: "T"
+  }
+  output_arg {
+    name: "output_ref"
+    description: "Same as ref. Returned as a convenience for operations that want to use the updated values after the update is done."
+    type_attr: "T"
+    is_ref: true
+  }
+  attr {
+    name: "T"
+    type: "type"
+    allowed_values {
+      list {
+        type: DT_FLOAT
+        type: DT_DOUBLE
+        type: DT_INT64
+        type: DT_INT32
+        type: DT_UINT8
+        type: DT_UINT16
+        type: DT_INT16
+        type: DT_INT8
+        type: DT_COMPLEX64
+        type: DT_COMPLEX128
+        type: DT_QINT8
+        type: DT_QUINT8
+        type: DT_QINT32
+        type: DT_HALF
+      }
+    }
+  }
+  attr {
+    name: "Tindices"
+    type: "type"
+    allowed_values {
+      list {
+        type: DT_INT32
+        type: DT_INT64
+      }
+    }
+  }
+  attr {
+    name: "use_locking"
+    type: "bool"
+    default_value {
+      b: false
+    }
+    description: "An optional bool. Defaults to False. If True, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention."
+  }
+  summary: "Applies sparse subtraction between `updates` and individual values or slices within a given variable according to `indices`."
+ description: "`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`.\n\n`indices` must be integer tensor, containing indices into `ref`.\nIt must be shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.\n\nThe innermost dimension of `indices` (with length `K`) corresponds to\nindices into elements (if `K = P`) or slices (if `K < P`) along the `K`th\ndimension of `ref`.\n\n`updates` is `Tensor` of rank `Q-1+P-K` with shape:\n\n```\n[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]].\n```\n\nFor example, say we want to subtract 4 scattered elements from a rank-1 tensor with 8 elements. In Python, that subtraction would look like this:\n\n ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8])\n indices = tf.constant([[4], [3], [1], [7]])\n updates = tf.constant([9, 10, 11, 12])\n sub = tf.scatter_nd_sub(ref, indices, updates)\n with tf.Session() as sess:\n print sess.run(sub)\n\nThe resulting update to ref would look like this:\n\n [1, -9, 3, -6, -4, 6, 7, -4]\n\nSee [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices." +} +op { + name: "ScatterNdUpdate" + input_arg { + name: "ref" + description: "A mutable Tensor. Should be from a Variable node." + type_attr: "T" + is_ref: true + } + input_arg { + name: "indices" + description: "A Tensor. Must be one of the following types: int32, int64. A tensor of indices into ref." + type_attr: "Tindices" + } + input_arg { + name: "updates" + description: "A Tensor. Must have the same type as ref. A tensor of updated values to add to ref." + type_attr: "T" + } + output_arg { + name: "output_ref" + description: "Same as ref. Returned as a convenience for operations that want to use the updated values after the update is done." + type_attr: "T" + is_ref: true + } + attr { + name: "T" + type: "type" + } + attr { + name: "Tindices" + type: "type" + allowed_values { + list { + type: DT_INT32 + type: DT_INT64 + } + } + } + attr { + name: "use_locking" + type: "bool" + default_value { + b: true + } + description: "An optional bool. Defaults to True. If True, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention." + } + summary: "Applies sparse `updates` to individual values or slices within a given variable according to `indices`." + description: "`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`.\n\n`indices` must be integer tensor, containing indices into `ref`.\nIt must be shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.\n\nThe innermost dimension of `indices` (with length `K`) corresponds to\nindices into elements (if `K = P`) or slices (if `K < P`) along the `K`th\ndimension of `ref`.\n\n`updates` is `Tensor` of rank `Q-1+P-K` with shape:\n\n```\n[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]].\n```\n\nFor example, say we want to update 4 scattered elements to a rank-1 tensor to 8 elements. In Python, that update would look like this:\n\n ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8])\n indices = tf.constant([[4], [3], [1] ,[7]])\n updates = tf.constant([9, 10, 11, 12])\n update = tf.scatter_nd_update(ref, indices, updates)\n with tf.Session() as sess:\n print sess.run(update)\n\nThe resulting update to ref would look like this:\n\n [1, 11, 3, 10, 9, 6, 7, 12]\n\nSee [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices." 
+} op { name: "ScatterSub" input_arg { diff --git a/tensorflow/core/ops/resource_variable_ops.cc b/tensorflow/core/ops/resource_variable_ops.cc index 6211b07ac58..9e28291070c 100644 --- a/tensorflow/core/ops/resource_variable_ops.cc +++ b/tensorflow/core/ops/resource_variable_ops.cc @@ -49,10 +49,88 @@ dtype: the type of this variable. Must agree with the dtypes shape: The (possibly partially specified) shape of this variable. )"); +Status CreateAssignShapeFn(shape_inference::InferenceContext* c) { + DataType handle_dtype = c->input_handle_dtype(0); + DataType value_dtype; + c->GetAttr("dtype", &value_dtype); + if (handle_dtype != value_dtype) { + return errors::InvalidArgument( + "Trying to initialize handle for variable with wrong dtype. " + "Expected ", + handle_dtype, " got ", value_dtype); + } + shape_inference::ShapeHandle s = c->input_handle_shape(0); + shape_inference::ShapeHandle value_shape = c->input(1); + shape_inference::ShapeHandle unused; + TF_RETURN_IF_ERROR(c->Merge(s, value_shape, &unused)); + return Status::OK(); +} + REGISTER_OP("CreateVariableOp") .Input("resource: resource") .Input("value: dtype") .Attr("dtype: type") + .SetShapeFn(CreateAssignShapeFn) + .Doc(R"( +Creates a variable resource. + +resource: handle to the resource in which to store the variable. +value: the value to set the new tensor to use. +dtype: the dtype of the value. +)"); + +REGISTER_OP("ReadVariableOp") + .Input("resource: resource") + .Output("value: dtype") + .Attr("dtype: type") + .SetShapeFn([](shape_inference::InferenceContext* c) { + DataType handle_dtype = c->input_handle_dtype(0); + DataType value_dtype; + c->GetAttr("dtype", &value_dtype); + if (handle_dtype != value_dtype) { + return errors::InvalidArgument( + "Trying to read variable with wrong dtype. " + "Expected ", + handle_dtype, " got ", value_dtype); + } + c->set_output(0, c->input_handle_shape(0)); + return Status::OK(); + }) + .Doc(R"( +Reads the value of a variable. + +The tensor returned by this operation is immutable. + +The value returned by this operation is guaranteed to be influenced by all the +writes on which this operation depends directly or indirectly, and to not be +influenced by any of the writes which depend directly or indirectly on this +operation. + +resource: handle to the resource in which to store the variable. +dtype: the dtype of the value. +)"); + +REGISTER_OP("AssignVariableOp") + .Input("resource: resource") + .Input("value: dtype") + .Attr("dtype: type") + .SetShapeFn(CreateAssignShapeFn) + .Doc(R"( +Assigns a new value to a variable. + +Any ReadVariableOp with a control dependency on this op is guaranteed to return +this value or a subsequent newer value of the variable. + +resource: handle to the resource in which to store the variable. +value: the value to set the new tensor to use. +dtype: the dtype of the value. +)"); + +REGISTER_OP("AssignAddVariableOp") + .Input("resource: resource") + .Input("value: dtype") + .Output("new_value: dtype") + .Attr("dtype: type") .SetShapeFn([](shape_inference::InferenceContext* c) { DataType handle_dtype = c->input_handle_dtype(0); DataType value_dtype; @@ -67,13 +145,21 @@ REGISTER_OP("CreateVariableOp") shape_inference::ShapeHandle value_shape = c->input(1); shape_inference::ShapeHandle unused; TF_RETURN_IF_ERROR(c->Merge(s, value_shape, &unused)); + c->set_output(0, value_shape); return Status::OK(); }) .Doc(R"( -Creates a variable resource. +Adds a value to the current value of a variable. 
+
+Any ReadVariableOp which depends directly or indirectly on this assign is
+guaranteed to see the incremented value or a subsequent newer one.
+
+Outputs the incremented value, which can be used to totally order the
+increments to this variable.

resource: handle to the resource in which to store the variable.
-value: the value to set the new tensor to use.
+value: the value by which the variable will be incremented.
+new_value: the new value of the variable.
dtype: the dtype of the value.
)");
diff --git a/tensorflow/core/ops/state_ops.cc b/tensorflow/core/ops/state_ops.cc
index b9ac8b16ffb..9339b9b8214 100644
--- a/tensorflow/core/ops/state_ops.cc
+++ b/tensorflow/core/ops/state_ops.cc
@@ -445,6 +445,241 @@ use_locking: If True, the operation will be protected by a lock;
  otherwise the behavior is undefined, but may exhibit less contention.
)doc");
+REGISTER_OP("ScatterNdUpdate")
+    .Input("ref: Ref(T)")
+    .Input("indices: Tindices")
+    .Input("updates: T")
+    .Output("output_ref: Ref(T)")
+    .Attr("T: type")
+    .Attr("Tindices: {int32, int64}")
+    .Attr("use_locking: bool = true")
+    .Doc(
+        R"doc(Applies sparse `updates` to individual values or slices within a given variable according to `indices`.
+
+`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`.
+
+`indices` must be an integer tensor, containing indices into `ref`.
+It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.
+
+The innermost dimension of `indices` (with length `K`) corresponds to
+indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th
+dimension of `ref`.
+
+`updates` is a `Tensor` of rank `Q-1+P-K` with shape:
+
+```
+[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]].
+```
+
+For example, say we want to update 4 scattered elements in a rank-1 tensor with 8 elements. In Python, that update would look like this:
+
+    ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8])
+    indices = tf.constant([[4], [3], [1], [7]])
+    updates = tf.constant([9, 10, 11, 12])
+    update = tf.scatter_nd_update(ref, indices, updates)
+    with tf.Session() as sess:
+      print sess.run(update)
+
+The resulting update to ref would look like this:
+
+    [1, 11, 3, 10, 9, 6, 7, 12]
+
+See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices.
+
+ref: A mutable Tensor. Should be from a Variable node.
+indices: A Tensor. Must be one of the following types: int32, int64. A tensor of indices into ref.
+updates: A Tensor. Must have the same type as ref. A tensor of updated values to store in ref.
+use_locking: An optional bool. Defaults to True. If True, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention.
+output_ref: Same as ref. Returned as a convenience for operations that want to use the updated values after the update is done.)doc");
+
+REGISTER_OP("ScatterNdAdd")
+    .Input("ref: Ref(T)")
+    .Input("indices: Tindices")
+    .Input("updates: T")
+    .Output("output_ref: Ref(T)")
+    .Attr("T: numbertype")
+    .Attr("Tindices: {int32, int64}")
+    .Attr("use_locking: bool = false")
+    .Doc(
+        R"doc(Applies sparse addition between `updates` and individual values or slices within a given variable according to `indices`.
+
+`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`.
+
+`indices` must be an integer tensor, containing indices into `ref`.
+It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.
+
+The innermost dimension of `indices` (with length `K`) corresponds to
+indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th
+dimension of `ref`.
+
+`updates` is a `Tensor` of rank `Q-1+P-K` with shape:
+
+```
+[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]].
+```
+
+For example, say we want to add 4 scattered elements to a rank-1 tensor with 8 elements. In Python, that addition would look like this:
+
+    ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8])
+    indices = tf.constant([[4], [3], [1], [7]])
+    updates = tf.constant([9, 10, 11, 12])
+    add = tf.scatter_nd_add(ref, indices, updates)
+    with tf.Session() as sess:
+      print sess.run(add)
+
+The resulting update to ref would look like this:
+
+    [1, 13, 3, 14, 14, 6, 7, 20]
+
+See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices.
+
+ref: A mutable Tensor. Should be from a Variable node.
+indices: A Tensor. Must be one of the following types: int32, int64. A tensor of indices into ref.
+updates: A Tensor. Must have the same type as ref. A tensor of updated values to add to ref.
+use_locking: An optional bool. Defaults to False. If True, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention.
+output_ref: Same as ref. Returned as a convenience for operations that want to use the updated values after the update is done.)doc");
+
+REGISTER_OP("ScatterNdSub")
+    .Input("ref: Ref(T)")
+    .Input("indices: Tindices")
+    .Input("updates: T")
+    .Output("output_ref: Ref(T)")
+    .Attr("T: numbertype")
+    .Attr("Tindices: {int32, int64}")
+    .Attr("use_locking: bool = false")
+    .Doc(
+        R"doc(Applies sparse subtraction between `updates` and individual values or slices within a given variable according to `indices`.
+
+`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`.
+
+`indices` must be an integer tensor, containing indices into `ref`.
+It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.
+
+The innermost dimension of `indices` (with length `K`) corresponds to
+indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th
+dimension of `ref`.
+
+`updates` is a `Tensor` of rank `Q-1+P-K` with shape:
+
+```
+[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]].
+```
+
+For example, say we want to subtract 4 scattered elements from a rank-1 tensor with 8 elements. In Python, that subtraction would look like this:
+
+    ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8])
+    indices = tf.constant([[4], [3], [1], [7]])
+    updates = tf.constant([9, 10, 11, 12])
+    sub = tf.scatter_nd_sub(ref, indices, updates)
+    with tf.Session() as sess:
+      print sess.run(sub)
+
+The resulting update to ref would look like this:
+
+    [1, -9, 3, -6, -4, 6, 7, -4]
+
+See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices.
+
+ref: A mutable Tensor. Should be from a Variable node.
+indices: A Tensor. Must be one of the following types: int32, int64. A tensor of indices into ref.
+updates: A Tensor. Must have the same type as ref. A tensor of updated values to subtract from ref.
+use_locking: An optional bool. Defaults to False. If True, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention.
+output_ref: Same as ref. Returned as a convenience for operations that want to use the updated values after the update is done.)doc");
+
+REGISTER_OP("ScatterNdMul")
+    .Input("ref: Ref(T)")
+    .Input("indices: Tindices")
+    .Input("updates: T")
+    .Output("output_ref: Ref(T)")
+    .Attr("T: numbertype")
+    .Attr("Tindices: {int32, int64}")
+    .Attr("use_locking: bool = false")
+    .Doc(
+        R"doc(Applies sparse multiplication between `updates` and individual values or slices within a given variable according to `indices`.
+
+`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`.
+
+`indices` must be an integer tensor, containing indices into `ref`.
+It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.
+
+The innermost dimension of `indices` (with length `K`) corresponds to
+indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th
+dimension of `ref`.
+
+`updates` is a `Tensor` of rank `Q-1+P-K` with shape:
+
+```
+[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]].
+```
+
+For example, say we want to multiply 4 scattered elements with a rank-1 tensor with 8 elements. In Python, that multiplication would look like this:
+
+    ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8])
+    indices = tf.constant([[4], [3], [1], [7]])
+    updates = tf.constant([9, 10, 11, 12])
+    mul = tf.scatter_nd_mul(ref, indices, updates)
+    with tf.Session() as sess:
+      print sess.run(mul)
+
+The resulting update to ref would look like this:
+
+    [1, 22, 3, 40, 45, 6, 7, 96]
+
+See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices.
+
+ref: A mutable Tensor. Should be from a Variable node.
+indices: A Tensor. Must be one of the following types: int32, int64. A tensor of indices into ref.
+updates: A Tensor. Must have the same type as ref. A tensor of updated values to multiply ref by.
+use_locking: An optional bool. Defaults to False. If True, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention.
+output_ref: Same as ref. Returned as a convenience for operations that want to use the updated values after the update is done.)doc");
+
+REGISTER_OP("ScatterNdDiv")
+    .Input("ref: Ref(T)")
+    .Input("indices: Tindices")
+    .Input("updates: T")
+    .Output("output_ref: Ref(T)")
+    .Attr("T: numbertype")
+    .Attr("Tindices: {int32, int64}")
+    .Attr("use_locking: bool = false")
+    .Doc(
+        R"doc(Applies sparse division between `updates` and individual values or slices within a given variable according to `indices`.
+
+`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`.
+
+`indices` must be an integer tensor, containing indices into `ref`.
+It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.
+
+The innermost dimension of `indices` (with length `K`) corresponds to
+indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th
+dimension of `ref`.
+
+`updates` is a `Tensor` of rank `Q-1+P-K` with shape:
+
+```
+[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]].
+```
+
+For example, say we want to divide a rank-1 tensor with 8 elements by 4 scattered elements. In Python, that division would look like this:
+
+    ref = tf.Variable([10, 20, 30, 40, 50, 60, 70, 80])
+    indices = tf.constant([[4], [3], [1], [7]])
+    updates = tf.constant([2, 3, 4, 5])
+    div = tf.scatter_nd_div(ref, indices, updates)
+    with tf.Session() as sess:
+      print sess.run(div)
+
+The resulting update to ref would look like this:
+
+    [10, 5, 30, 13, 25, 60, 70, 16]
+
+See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices.
+
+ref: A mutable Tensor. Should be from a Variable node.
+indices: A Tensor. Must be one of the following types: int32, int64. A tensor of indices into ref.
+updates: A Tensor. Must have the same type as ref. A tensor of updated values to divide ref by.
+use_locking: An optional bool. Defaults to False. If True, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention.
+output_ref: Same as ref. Returned as a convenience for operations that want to use the updated values after the update is done.)doc");
+
REGISTER_OP("CountUpTo")
    .Input("ref: Ref(T)")
    .Output("output: T")
diff --git a/tensorflow/core/platform/cloud/gcs_file_system.cc b/tensorflow/core/platform/cloud/gcs_file_system.cc
index 6641971ba07..39228ed8698 100644
--- a/tensorflow/core/platform/cloud/gcs_file_system.cc
+++ b/tensorflow/core/platform/cloud/gcs_file_system.cc
@@ -81,7 +81,7 @@ Status ParseGcsPath(StringPiece fname, bool empty_object_ok, string* bucket,
    return errors::Internal("bucket and object cannot be null.");
  }
  StringPiece scheme, bucketp, objectp;
-  ParseURI(fname, &scheme, &bucketp, &objectp);
+  io::ParseURI(fname, &scheme, &bucketp, &objectp);
  if (scheme != "gs") {
    return errors::InvalidArgument("GCS path doesn't start with 'gs://': ",
                                   fname);
@@ -118,6 +118,26 @@ string JoinGcsPath(const string& path, const string& subpath) {
  return strings::StrCat(MaybeAppendSlash(path), subpath);
}
+/// \brief Returns the given paths together with all of their parent folders.
+///
+/// For every path X in the list, every parent folder of X is added to the
+/// resulting list.
+/// For example:
+/// - for 'a/b/c/d' it will append 'a', 'a/b' and 'a/b/c'
+/// - for 'a/b/c/' it will append 'a', 'a/b' and 'a/b/c'
+std::set<string> AddAllSubpaths(const std::vector<string>& paths) {
+  std::set<string> result;
+  result.insert(paths.begin(), paths.end());
+  for (const string& path : paths) {
+    StringPiece subpath = io::Dirname(path);
+    while (!subpath.empty()) {
+      result.emplace(subpath.ToString());
+      subpath = io::Dirname(subpath);
+    }
+  }
+  return result;
+}
+
Status ParseJson(StringPiece json, Json::Value* result) {
  Json::Reader reader;
  if (!reader.parse(json.ToString(), *result)) {
@@ -754,14 +774,18 @@ Status GcsFileSystem::FolderExists(const string& dirname, bool* result) {
    return errors::Internal("'result' cannot be nullptr.");
  }
  std::vector<string> children;
-  TF_RETURN_IF_ERROR(GetChildrenBounded(dirname, 1, &children, true));
+  TF_RETURN_IF_ERROR(
+      GetChildrenBounded(dirname, 1, &children, true /* recursively */,
+                         true /* include_self_directory_marker */));
  *result = !children.empty();
  return Status::OK();
}
Status GcsFileSystem::GetChildren(const string& dirname,
                                  std::vector<string>* result) {
-  return GetChildrenBounded(dirname, UINT64_MAX, result, false);
+  return GetChildrenBounded(dirname, UINT64_MAX, result,
+                            false /* recursively */,
+                            false /* include_self_directory_marker */);
}
Status GcsFileSystem::GetMatchingPaths(const string& pattern,
@@ -776,11 +800,15 @@ Status GcsFileSystem::GetMatchingPaths(const string& pattern,
                                   pattern);
  }
  std::vector<string> all_files;
-  TF_RETURN_IF_ERROR(GetChildrenBounded(dir, UINT64_MAX, &all_files, true));
+  TF_RETURN_IF_ERROR(
+      GetChildrenBounded(dir, UINT64_MAX, &all_files, true /* recursively */,
+                         false /* include_self_directory_marker */));
-  // Match all obtained files to the input pattern.
-  for (const auto& f : all_files) {
-    const string& full_path = io::JoinPath(dir, f);
+  const auto& files_and_folders = AddAllSubpaths(all_files);
+
+  // Match all obtained paths to the input pattern.
+  for (const auto& path : files_and_folders) {
+    const string& full_path = io::JoinPath(dir, path);
    if (Env::Default()->MatchPath(full_path, pattern)) {
      results->push_back(full_path);
    }
@@ -791,7 +819,8 @@ Status GcsFileSystem::GetMatchingPaths(const string& pattern,
Status GcsFileSystem::GetChildrenBounded(const string& dirname,
                                         uint64 max_results,
                                         std::vector<string>* result,
-                                         bool recursive) {
+                                         bool recursive,
+                                         bool include_self_directory_marker) {
  if (!result) {
    return errors::InvalidArgument("'result' cannot be null");
  }
@@ -840,33 +869,34 @@ Status GcsFileSystem::GetChildrenBounded(const string& dirname,
    Json::Value root;
    TF_RETURN_IF_ERROR(ParseJson(response_piece, &root));
    const auto items = root.get("items", Json::Value::null);
-    if (items == Json::Value::null) {
-      // Empty results.
-      return Status::OK();
-    }
-    if (!items.isArray()) {
-      return errors::Internal("Expected an array 'items' in the GCS response.");
-    }
-    for (size_t i = 0; i < items.size(); i++) {
-      const auto item = items.get(i, Json::Value::null);
-      if (!item.isObject()) {
+    if (items != Json::Value::null) {
+      if (!items.isArray()) {
        return errors::Internal(
-            "Unexpected JSON format: 'items' should be a list of objects.");
+            "Expected an array 'items' in the GCS response.");
      }
-      string name;
-      TF_RETURN_IF_ERROR(GetStringValue(item, "name", &name));
-      // The names should be relative to the 'dirname'. That means the
-      // 'object_prefix', which is part of 'dirname', should be removed from the
-      // beginning of 'name'.
-      StringPiece relative_path(name);
-      if (!relative_path.Consume(object_prefix)) {
-        return errors::Internal(
-            strings::StrCat("Unexpected response: the returned file name ",
-                            name, " doesn't match the prefix ", object_prefix));
-      }
-      result->emplace_back(relative_path.ToString());
-      if (++retrieved_results >= max_results) {
-        return Status::OK();
+      for (size_t i = 0; i < items.size(); i++) {
+        const auto item = items.get(i, Json::Value::null);
+        if (!item.isObject()) {
+          return errors::Internal(
+              "Unexpected JSON format: 'items' should be a list of objects.");
+        }
+        string name;
+        TF_RETURN_IF_ERROR(GetStringValue(item, "name", &name));
+        // The names should be relative to the 'dirname'. That means the
+        // 'object_prefix', which is part of 'dirname', should be removed from
+        // the beginning of 'name'.
+        StringPiece relative_path(name);
+        if (!relative_path.Consume(object_prefix)) {
+          return errors::Internal(strings::StrCat(
+              "Unexpected response: the returned file name ", name,
+              " doesn't match the prefix ", object_prefix));
+        }
+        if (!relative_path.empty() || include_self_directory_marker) {
+          result->emplace_back(relative_path.ToString());
+        }
+        if (++retrieved_results >= max_results) {
+          return Status::OK();
+        }
      }
    }
    const auto prefixes = root.get("prefixes", Json::Value::null);
@@ -982,7 +1012,9 @@ Status GcsFileSystem::DeleteDir(const string& dirname) {
  // with the corresponding name prefix or if there is exactly one matching
  // object and it is the directory marker. Therefore we need to retrieve
  // at most two children for the prefix to detect if a directory is empty.
-  TF_RETURN_IF_ERROR(GetChildrenBounded(dirname, 2, &children, true));
+  TF_RETURN_IF_ERROR(
+      GetChildrenBounded(dirname, 2, &children, true /* recursively */,
+                         true /* include_self_directory_marker */));
  if (children.size() > 1 || (children.size() == 1 && !children[0].empty())) {
    return errors::FailedPrecondition("Cannot delete a non-empty directory.");
@@ -1015,7 +1047,9 @@ Status GcsFileSystem::RenameFile(const string& src, const string& target) {
  }
  // Rename all individual objects in the directory one by one.
  std::vector<string> children;
-  TF_RETURN_IF_ERROR(GetChildrenBounded(src, UINT64_MAX, &children, true));
+  TF_RETURN_IF_ERROR(
+      GetChildrenBounded(src, UINT64_MAX, &children, true /* recursively */,
+                         true /* include_self_directory_marker */));
  for (const string& subpath : children) {
    TF_RETURN_IF_ERROR(
        RenameObject(JoinGcsPath(src, subpath), JoinGcsPath(target, subpath)));
@@ -1110,8 +1144,9 @@ Status GcsFileSystem::DeleteRecursively(const string& dirname,
  }
  std::vector<string> all_objects;
  // Get all children in the directory recursively.
-  TF_RETURN_IF_ERROR(GetChildrenBounded(dirname, UINT64_MAX, &all_objects,
-                                        true /* recursive */));
+  TF_RETURN_IF_ERROR(GetChildrenBounded(
+      dirname, UINT64_MAX, &all_objects, true /* recursively */,
+      true /* include_self_directory_marker */));
  for (const string& object : all_objects) {
    const string& full_path = JoinGcsPath(dirname, object);
    // Delete all objects including directory markers for subfolders.
diff --git a/tensorflow/core/platform/cloud/gcs_file_system.h b/tensorflow/core/platform/cloud/gcs_file_system.h
index c98a50cc879..4a00e9daa41 100644
--- a/tensorflow/core/platform/cloud/gcs_file_system.h
+++ b/tensorflow/core/platform/cloud/gcs_file_system.h
@@ -91,8 +91,17 @@ class GcsFileSystem : public FileSystem {
  /// 'result' is set if the function returns OK. 'result' cannot be nullptr.
  Status FolderExists(const string& dirname, bool* result);
+  /// \brief Internal version of GetChildren with more knobs.
+  ///
+  /// If 'recursively' is true, returns all objects in all subfolders.
+  /// Otherwise only returns the immediate children in the directory.
+  ///
+  /// If 'include_self_directory_marker' is true and there is a GCS directory
+  /// marker at the path 'dir', GetChildrenBounded will return an empty string
+  /// as one of the children that represents this marker.
  Status GetChildrenBounded(const string& dir, uint64 max_results,
-                            std::vector<string>* result, bool recursively);
+                            std::vector<string>* result, bool recursively,
+                            bool include_self_directory_marker);
  /// Retrieves file statistics assuming fname points to a GCS object.
  Status StatForObject(const string& bucket, const string& object,
                       FileStatistics* stat);
diff --git a/tensorflow/core/platform/cloud/gcs_file_system_test.cc b/tensorflow/core/platform/cloud/gcs_file_system_test.cc
index 8d1e31917d6..00bf3314705 100644
--- a/tensorflow/core/platform/cloud/gcs_file_system_test.cc
+++ b/tensorflow/core/platform/cloud/gcs_file_system_test.cc
@@ -579,6 +579,24 @@ TEST(GcsFileSystemTest, FileExists_NotAsBucket) {
  EXPECT_FALSE(fs.FileExists("gs://bucket2"));
}
+TEST(GcsFileSystemTest, GetChildren_NoItems) {
+  std::vector<HttpRequest*> requests({new FakeHttpRequest(
+      "Uri: https://www.googleapis.com/storage/v1/b/bucket/o?"
+      "fields=items%2Fname%2Cprefixes%2CnextPageToken&delimiter=%2F&prefix="
+      "path%2F\n"
+      "Auth Token: fake_token\n",
+      "{\"prefixes\": [\"path/subpath/\"]}")});
+  GcsFileSystem fs(std::unique_ptr<AuthProvider>(new FakeAuthProvider),
+                   std::unique_ptr<HttpRequest::Factory>(
+                       new FakeHttpRequestFactory(&requests)),
+                   0 /* read ahead bytes */, 5 /* max upload attempts */);
+
+  std::vector<string> children;
+  TF_EXPECT_OK(fs.GetChildren("gs://bucket/path/", &children));
+
+  EXPECT_EQ(std::vector<string>({"subpath/"}), children);
+}
+
TEST(GcsFileSystemTest, GetChildren_ThreeFiles) {
  std::vector<HttpRequest*> requests({new FakeHttpRequest(
      "Uri: https://www.googleapis.com/storage/v1/b/bucket/o?"
@@ -601,6 +619,27 @@ TEST(GcsFileSystemTest, GetChildren_ThreeFiles) {
            children);
}
+TEST(GcsFileSystemTest, GetChildren_SelfDirectoryMarker) {
+  std::vector<HttpRequest*> requests({new FakeHttpRequest(
+      "Uri: https://www.googleapis.com/storage/v1/b/bucket/o?"
+      "fields=items%2Fname%2Cprefixes%2CnextPageToken&delimiter=%2F&prefix="
+      "path%2F\n"
+      "Auth Token: fake_token\n",
+      "{\"items\": [ "
+      "  { \"name\": \"path/\" },"
+      "  { \"name\": \"path/file3.txt\" }],"
+      "\"prefixes\": [\"path/subpath/\"]}")});
+  GcsFileSystem fs(std::unique_ptr<AuthProvider>(new FakeAuthProvider),
+                   std::unique_ptr<HttpRequest::Factory>(
+                       new FakeHttpRequestFactory(&requests)),
+                   0 /* read ahead bytes */, 5 /* max upload attempts */);
+
+  std::vector<string> children;
+  TF_EXPECT_OK(fs.GetChildren("gs://bucket/path/", &children));
+
+  EXPECT_EQ(std::vector<string>({"file3.txt", "subpath/"}), children);
+}
+
TEST(GcsFileSystemTest, GetChildren_ThreeFiles_NoSlash) {
  std::vector<HttpRequest*> requests({new FakeHttpRequest(
      "Uri: https://www.googleapis.com/storage/v1/b/bucket/o?"
@@ -728,8 +767,9 @@ TEST(GcsFileSystemTest, GetMatchingPaths_BucketAndWildcard) {
  std::vector<string> result;
  TF_EXPECT_OK(fs.GetMatchingPaths("gs://bucket/*/*", &result));
-  EXPECT_EQ(std::vector<string>(
-                {"gs://bucket/path/file1.txt", "gs://bucket/path/file3.txt"}),
+  EXPECT_EQ(std::vector<string>({"gs://bucket/path/file1.txt",
+                                 "gs://bucket/path/file3.txt",
+                                 "gs://bucket/path/subpath"}),
            result);
}
@@ -753,6 +793,24 @@ TEST(GcsFileSystemTest, GetMatchingPaths_FolderAndWildcard_Matches) {
            result);
}
+TEST(GcsFileSystemTest, GetMatchingPaths_SelfDirectoryMarker) {
+  std::vector<HttpRequest*> requests({new FakeHttpRequest(
+      "Uri: https://www.googleapis.com/storage/v1/b/bucket/o?"
+      "fields=items%2Fname%2CnextPageToken&prefix=path%2F\n"
+      "Auth Token: fake_token\n",
+      "{\"items\": [ "
+      "  { \"name\": \"path/\" },"
+      "  { \"name\": \"path/file3.txt\" }]}")});
+  GcsFileSystem fs(std::unique_ptr<AuthProvider>(new FakeAuthProvider),
+                   std::unique_ptr<HttpRequest::Factory>(
+                       new FakeHttpRequestFactory(&requests)),
+                   0 /* read ahead bytes */, 5 /* max upload attempts */);
+
+  std::vector<string> result;
+  TF_EXPECT_OK(fs.GetMatchingPaths("gs://bucket/path/*", &result));
+  EXPECT_EQ(std::vector<string>({"gs://bucket/path/file3.txt"}), result);
+}
+
TEST(GcsFileSystemTest, GetMatchingPaths_FolderAndWildcard_NoMatches) {
  std::vector<HttpRequest*> requests({new FakeHttpRequest(
      "Uri: https://www.googleapis.com/storage/v1/b/bucket/o?"
diff --git a/tensorflow/core/platform/cloud/retrying_file_system.cc b/tensorflow/core/platform/cloud/retrying_file_system.cc
index f8a897a484d..ccfbc05b6db 100644
--- a/tensorflow/core/platform/cloud/retrying_file_system.cc
+++ b/tensorflow/core/platform/cloud/retrying_file_system.cc
@@ -43,7 +43,6 @@ bool IsRetriable(Status status) {
void WaitBeforeRetry(const int64 delay_micros) {
  const int64 random_micros = random::New64() % 1000000;
-
  Env::Default()->SleepForMicroseconds(std::min(delay_micros + random_micros,
                                                kMaximumBackoffMicroseconds));
}
@@ -57,7 +56,9 @@ Status CallWithRetries(const std::function<Status()>& f,
      return status;
    }
    const int64 delay_micros = initial_delay_microseconds << retries;
-    WaitBeforeRetry(delay_micros);
+    if (delay_micros > 0) {
+      WaitBeforeRetry(delay_micros);
+    }
    retries++;
  }
}
@@ -65,7 +66,7 @@ Status CallWithRetries(const std::function<Status()>& f,
class RetryingRandomAccessFile : public RandomAccessFile {
 public:
  RetryingRandomAccessFile(std::unique_ptr<RandomAccessFile> base_file,
-                           int64 delay_microseconds = 1000000)
+                           int64 delay_microseconds)
      : base_file_(std::move(base_file)),
        initial_delay_microseconds_(delay_microseconds) {}
@@ -84,10 +85,15 @@ class RetryingRandomAccessFile : public RandomAccessFile {
class RetryingWritableFile : public WritableFile {
 public:
  RetryingWritableFile(std::unique_ptr<WritableFile> base_file,
-                       int64 delay_microseconds = 1000000)
+                       int64 delay_microseconds)
      : base_file_(std::move(base_file)),
        initial_delay_microseconds_(delay_microseconds) {}
+  ~RetryingWritableFile() {
+    // Makes sure the retrying version of Close() is called in the destructor.
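+    // Note: the Status returned by Close() is discarded here, so a failure
+    // during destruction is silent; call Close() explicitly to observe it.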
+ Close(); + } + Status Append(const StringPiece& data) override { return CallWithRetries( std::bind(&WritableFile::Append, base_file_.get(), data), @@ -120,7 +126,8 @@ Status RetryingFileSystem::NewRandomAccessFile( base_file_system_.get(), filename, &base_file), initial_delay_microseconds_)); - result->reset(new RetryingRandomAccessFile(std::move(base_file))); + result->reset(new RetryingRandomAccessFile(std::move(base_file), + initial_delay_microseconds_)); return Status::OK(); } @@ -131,7 +138,8 @@ Status RetryingFileSystem::NewWritableFile( base_file_system_.get(), filename, &base_file), initial_delay_microseconds_)); - result->reset(new RetryingWritableFile(std::move(base_file))); + result->reset(new RetryingWritableFile(std::move(base_file), + initial_delay_microseconds_)); return Status::OK(); } @@ -142,7 +150,8 @@ Status RetryingFileSystem::NewAppendableFile( base_file_system_.get(), filename, &base_file), initial_delay_microseconds_)); - result->reset(new RetryingWritableFile(std::move(base_file))); + result->reset(new RetryingWritableFile(std::move(base_file), + initial_delay_microseconds_)); return Status::OK(); } diff --git a/tensorflow/core/platform/cloud/retrying_file_system_test.cc b/tensorflow/core/platform/cloud/retrying_file_system_test.cc index f939776b757..06c16b90925 100644 --- a/tensorflow/core/platform/cloud/retrying_file_system_test.cc +++ b/tensorflow/core/platform/cloud/retrying_file_system_test.cc @@ -261,7 +261,8 @@ TEST(RetryingFileSystemTest, NewRandomAccessFile_NoRetriesForSomeErrors) { TEST(RetryingFileSystemTest, NewWritableFile_ImmediateSuccess) { // Configure the mock base random access file. - ExpectedCalls expected_file_calls({std::make_tuple("Sync", Status::OK())}); + ExpectedCalls expected_file_calls({std::make_tuple("Sync", Status::OK()), + std::make_tuple("Close", Status::OK())}); std::unique_ptr<WritableFile> base_file( new MockWritableFile(expected_file_calls)); @@ -286,7 +287,8 @@ TEST(RetryingFileSystemTest, NewWritableFile_SuccessWith3rdTry) { ExpectedCalls expected_file_calls( {std::make_tuple("Sync", errors::Unavailable("Something is wrong")), std::make_tuple("Sync", errors::Unavailable("Something is wrong again")), - std::make_tuple("Sync", Status::OK())}); + std::make_tuple("Sync", Status::OK()), + std::make_tuple("Close", Status::OK())}); std::unique_ptr<WritableFile> base_file( new MockWritableFile(expected_file_calls)); @@ -306,12 +308,38 @@ TEST(RetryingFileSystemTest, NewWritableFile_SuccessWith3rdTry) { TF_EXPECT_OK(writable_file->Sync()); } +TEST(RetryingFileSystemTest, NewWritableFile_SuccessWith3rdTry_ViaDestructor) { + // Configure the mock base random access file. + ExpectedCalls expected_file_calls( + {std::make_tuple("Close", errors::Unavailable("Something is wrong")), + std::make_tuple("Close", + errors::Unavailable("Something is wrong again")), + std::make_tuple("Close", Status::OK())}); + std::unique_ptr<WritableFile> base_file( + new MockWritableFile(expected_file_calls)); + + // Configure the mock base file system. + ExpectedCalls expected_fs_calls( + {std::make_tuple("NewWritableFile", Status::OK())}); + std::unique_ptr<MockFileSystem> base_fs( + new MockFileSystem(expected_fs_calls)); + base_fs->writable_file_to_return = std::move(base_file); + RetryingFileSystem fs(std::move(base_fs), 0); + + // Retrieve the wrapped writable file. + std::unique_ptr<WritableFile> writable_file; + TF_EXPECT_OK(fs.NewWritableFile("filename.txt", &writable_file)); + + writable_file.reset(); // Trigger Close() via destructor.
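+ // The mock's expected-call list above is the real assertion: two
+ // Unavailable Close() attempts followed by an OK one, all driven purely
+ // by ~RetryingWritableFile.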
+} + TEST(RetryingFileSystemTest, NewAppendableFile_SuccessWith3rdTry) { // Configure the mock base random access file. ExpectedCalls expected_file_calls( {std::make_tuple("Sync", errors::Unavailable("Something is wrong")), std::make_tuple("Sync", errors::Unavailable("Something is wrong again")), - std::make_tuple("Sync", Status::OK())}); + std::make_tuple("Sync", Status::OK()), + std::make_tuple("Close", Status::OK())}); std::unique_ptr<WritableFile> base_file( new MockWritableFile(expected_file_calls)); @@ -337,7 +365,8 @@ TEST(RetryingFileSystemTest, NewWritableFile_AllRetriesFailed) { {std::make_tuple("Sync", errors::Unavailable("Something is wrong")), std::make_tuple("Sync", errors::Unavailable("Something is wrong again")), std::make_tuple("Sync", errors::Unavailable("...and again")), - std::make_tuple("Sync", errors::Unavailable("And again"))}); + std::make_tuple("Sync", errors::Unavailable("And again")), + std::make_tuple("Close", Status::OK())}); std::unique_ptr<WritableFile> base_file( new MockWritableFile(expected_file_calls)); diff --git a/tensorflow/core/platform/default/build_config/BUILD b/tensorflow/core/platform/default/build_config/BUILD index fc0c6a5091c..2cb64c3922c 100644 --- a/tensorflow/core/platform/default/build_config/BUILD +++ b/tensorflow/core/platform/default/build_config/BUILD @@ -77,16 +77,24 @@ cc_library( name = "platformlib", copts = tf_copts(), deps = [ + ":gif", + ":jpeg", "//tensorflow/core:protos_cc", "@com_googlesource_code_re2//:re2", "@farmhash_archive//:farmhash", - "@gif_archive//:gif", "@highwayhash//:sip_hash", - "@jpeg_archive//:jpeg", "@png_archive//:png", ], ) +cc_library( + name = "gif", + copts = tf_copts(), + deps = [ + "@gif_archive//:gif", + ], +) + cc_library( name = "jpeg", copts = tf_copts(), diff --git a/tensorflow/core/platform/env.cc b/tensorflow/core/platform/env.cc index a5dd7b45c4a..5a09fded9bf 100644 --- a/tensorflow/core/platform/env.cc +++ b/tensorflow/core/platform/env.cc @@ -70,7 +70,7 @@ Env::Env() : file_system_registry_(new FileSystemRegistryImpl) {} Status Env::GetFileSystemForFile(const string& fname, FileSystem** result) { StringPiece scheme, host, path; - ParseURI(fname, &scheme, &host, &path); + io::ParseURI(fname, &scheme, &host, &path); FileSystem* file_system = file_system_registry_->Lookup(scheme.ToString()); if (!file_system) { return errors::Unimplemented("File system scheme ", scheme, diff --git a/tensorflow/core/platform/env_test.cc b/tensorflow/core/platform/env_test.cc index dbff7e25310..f6fa27327a6 100644 --- a/tensorflow/core/platform/env_test.cc +++ b/tensorflow/core/platform/env_test.cc @@ -229,35 +229,6 @@ TEST_F(DefaultEnvTest, LocalFileSystem) { } } -#define EXPECT_PARSE_URI(uri, scheme, host, path) \ - do { \ - StringPiece s, h, p; \ - ParseURI(uri, &s, &h, &p); \ - EXPECT_EQ(scheme, s.ToString()); \ - EXPECT_EQ(host, h.ToString()); \ - EXPECT_EQ(path, p.ToString()); \ - EXPECT_EQ(uri, CreateURI(scheme, host, path)); \ - } while (0) - -TEST_F(DefaultEnvTest, CreateParseURI) { - EXPECT_PARSE_URI("http://foo", "http", "foo", ""); - EXPECT_PARSE_URI("/encrypted/://foo", "", "", "/encrypted/://foo"); - EXPECT_PARSE_URI("/usr/local/foo", "", "", "/usr/local/foo"); - EXPECT_PARSE_URI("file:///usr/local/foo", "file", "", "/usr/local/foo"); - EXPECT_PARSE_URI("local.file:///usr/local/foo", "local.file", "", - "/usr/local/foo"); - EXPECT_PARSE_URI("a-b:///foo", "", "", "a-b:///foo"); - EXPECT_PARSE_URI(":///foo", "", "", ":///foo"); - EXPECT_PARSE_URI("9dfd:///foo", "", "", "9dfd:///foo"); - EXPECT_PARSE_URI("file:", "", "", "file:");
- EXPECT_PARSE_URI("file:/", "", "", "file:/"); - EXPECT_PARSE_URI("hdfs://localhost:8020/path/to/file", "hdfs", - "localhost:8020", "/path/to/file"); - EXPECT_PARSE_URI("hdfs://localhost:8020", "hdfs", "localhost:8020", ""); - EXPECT_PARSE_URI("hdfs://localhost:8020/", "hdfs", "localhost:8020", "/"); -} -#undef EXPECT_PARSE_URI - TEST_F(DefaultEnvTest, SleepForMicroseconds) { const int64 start = env_->NowMicros(); const int64 sleep_time = 1e6 + 5e5; @@ -274,14 +245,14 @@ class TmpDirFileSystem : public NullFileSystem { public: bool FileExists(const string& dir) override { StringPiece scheme, host, path; - ParseURI(dir, &scheme, &host, &path); + io::ParseURI(dir, &scheme, &host, &path); if (path.empty()) return false; return Env::Default()->FileExists(io::JoinPath(BaseDir(), path)); } Status CreateDir(const string& dir) override { StringPiece scheme, host, path; - ParseURI(dir, &scheme, &host, &path); + io::ParseURI(dir, &scheme, &host, &path); if (scheme != "tmpdirfs") { return errors::FailedPrecondition("scheme must be tmpdirfs"); } diff --git a/tensorflow/core/platform/file_system.cc b/tensorflow/core/platform/file_system.cc index d71ff80143d..400835aa07e 100644 --- a/tensorflow/core/platform/file_system.cc +++ b/tensorflow/core/platform/file_system.cc @@ -22,7 +22,6 @@ limitations under the License. #include "tensorflow/core/lib/gtl/map_util.h" #include "tensorflow/core/lib/gtl/stl_util.h" #include "tensorflow/core/lib/io/path.h" -#include "tensorflow/core/lib/strings/scanner.h" #include "tensorflow/core/lib/strings/str_util.h" #include "tensorflow/core/lib/strings/strcat.h" #include "tensorflow/core/platform/env.h" @@ -79,43 +78,6 @@ WritableFile::~WritableFile() {} FileSystemRegistry::~FileSystemRegistry() {} -void ParseURI(StringPiece remaining, StringPiece* scheme, StringPiece* host, - StringPiece* path) { - // 0. Parse scheme - // Make sure scheme matches [a-zA-Z][0-9a-zA-Z.]* - // TODO(keveman): Allow "+" and "-" in the scheme. - if (!strings::Scanner(remaining) - .One(strings::Scanner::LETTER) - .Many(strings::Scanner::LETTER_DIGIT_DOT) - .StopCapture() - .OneLiteral("://") - .GetResult(&remaining, scheme)) { - // If there's no scheme, assume the entire string is a path. - scheme->clear(); - host->clear(); - *path = remaining; - return; - } - - // 1. Parse host - if (!strings::Scanner(remaining).ScanUntil('/').GetResult(&remaining, host)) { - // No path, so the rest of the URI is the host. - *host = remaining; - path->clear(); - return; - } - - // 2. The rest is the path - *path = remaining; -} - -string CreateURI(StringPiece scheme, StringPiece host, StringPiece path) { - if (scheme.empty()) { - return path.ToString(); - } - return strings::StrCat(scheme, "://", host, path); -} - Status FileSystem::GetMatchingPaths(const string& pattern, std::vector* results) { results->clear(); @@ -237,9 +199,9 @@ Status FileSystem::DeleteRecursively(const string& dirname, Status FileSystem::RecursivelyCreateDir(const string& dirname) { StringPiece scheme, host, remaining_dir; - ParseURI(dirname, &scheme, &host, &remaining_dir); + io::ParseURI(dirname, &scheme, &host, &remaining_dir); std::vector sub_dirs; - while (!FileExists(CreateURI(scheme, host, remaining_dir)) && + while (!FileExists(io::CreateURI(scheme, host, remaining_dir)) && !remaining_dir.empty()) { // Basename returns "" for / ending dirs. 
if (!remaining_dir.ends_with("/")) { @@ -255,7 +217,7 @@ Status FileSystem::RecursivelyCreateDir(const string& dirname) { string built_path = remaining_dir.ToString(); for (const StringPiece sub_dir : sub_dirs) { built_path = io::JoinPath(built_path, sub_dir); - TF_RETURN_IF_ERROR(CreateDir(CreateURI(scheme, host, built_path))); + TF_RETURN_IF_ERROR(CreateDir(io::CreateURI(scheme, host, built_path))); } return Status::OK(); } diff --git a/tensorflow/core/platform/file_system.h b/tensorflow/core/platform/file_system.h index 4456e3f3e98..dfaf75be667 100644 --- a/tensorflow/core/platform/file_system.h +++ b/tensorflow/core/platform/file_system.h @@ -287,19 +287,6 @@ class FileSystemRegistry { std::vector<string>* schemes) = 0; }; -// Populates the scheme, host, and path from a URI. -// -// Corner cases: -// - If the URI is invalid, scheme and host are set to empty strings and the -// passed string is assumed to be a path -// - If the URI omits the path (e.g. file://host), then the path is left empty. -void ParseURI(StringPiece uri, StringPiece* scheme, StringPiece* host, - StringPiece* path); - -// Creates a URI from a scheme, host, and path. If the scheme is empty, we just -// return the path. -string CreateURI(StringPiece scheme, StringPiece host, StringPiece path); - } // namespace tensorflow #endif // TENSORFLOW_CORE_PLATFORM_FILE_SYSTEM_H_ diff --git a/tensorflow/core/platform/file_system_test.cc b/tensorflow/core/platform/file_system_test.cc index 600af91206b..8cdabdc8bcd 100644 --- a/tensorflow/core/platform/file_system_test.cc +++ b/tensorflow/core/platform/file_system_test.cc @@ -112,7 +112,7 @@ class InterPlanetaryFileSystem : public NullFileSystem { void ParsePath(const string& name, string* parsed_path) { StringPiece scheme, host, path; - ParseURI(name, &scheme, &host, &path); + io::ParseURI(name, &scheme, &host, &path); ASSERT_EQ(scheme, "ipfs"); ASSERT_EQ(host, "solarsystem"); path.Consume("/"); diff --git a/tensorflow/core/platform/hadoop/hadoop_file_system.cc b/tensorflow/core/platform/hadoop/hadoop_file_system.cc index d5792e82cdd..749d9e1fcda 100644 --- a/tensorflow/core/platform/hadoop/hadoop_file_system.cc +++ b/tensorflow/core/platform/hadoop/hadoop_file_system.cc @@ -126,7 +126,7 @@ Status HadoopFileSystem::Connect(StringPiece fname, hdfsFS* fs) { TF_RETURN_IF_ERROR(hdfs_->status()); StringPiece scheme, namenode, path; - ParseURI(fname, &scheme, &namenode, &path); + io::ParseURI(fname, &scheme, &namenode, &path); const string nn = namenode.ToString(); hdfsBuilder* builder = hdfs_->hdfsNewBuilder(); @@ -144,7 +144,7 @@ Status HadoopFileSystem::Connect(StringPiece fname, hdfsFS* fs) { string HadoopFileSystem::TranslateName(const string& name) const { StringPiece scheme, namenode, path; - ParseURI(name, &scheme, &namenode, &path); + io::ParseURI(name, &scheme, &namenode, &path); return path.ToString(); } diff --git a/tensorflow/core/platform/posix/env.cc b/tensorflow/core/platform/posix/env.cc index 2f9c8e4b2f0..f353fb1c924 100644 --- a/tensorflow/core/platform/posix/env.cc +++ b/tensorflow/core/platform/posix/env.cc @@ -120,7 +120,8 @@ class PosixEnv : public Env { symbol); } - string FormatLibraryFileName(const string& name, const string& version) { + string FormatLibraryFileName(const string& name, + const string& version) override { return tensorflow::internal::FormatLibraryFileName(name, version); } }; diff --git a/tensorflow/core/platform/posix/posix_file_system.h b/tensorflow/core/platform/posix/posix_file_system.h index 07bb8c9a6ff..ccff70cb56f 100644 ---
a/tensorflow/core/platform/posix/posix_file_system.h +++ b/tensorflow/core/platform/posix/posix_file_system.h @@ -16,6 +16,7 @@ limitations under the License. #ifndef TENSORFLOW_CORE_PLATFORM_POSIX_POSIX_FILE_SYSTEM_H_ #define TENSORFLOW_CORE_PLATFORM_POSIX_POSIX_FILE_SYSTEM_H_ +#include "tensorflow/core/lib/io/path.h" #include "tensorflow/core/platform/env.h" namespace tensorflow { @@ -63,7 +64,7 @@ class LocalPosixFileSystem : public PosixFileSystem { public: string TranslateName(const string& name) const override { StringPiece scheme, host, path; - ParseURI(name, &scheme, &host, &path); + io::ParseURI(name, &scheme, &host, &path); return path.ToString(); } }; diff --git a/tensorflow/core/platform/windows/windows_file_system.h b/tensorflow/core/platform/windows/windows_file_system.h index 12b579bc86a..64da239d96d 100644 --- a/tensorflow/core/platform/windows/windows_file_system.h +++ b/tensorflow/core/platform/windows/windows_file_system.h @@ -16,6 +16,7 @@ limitations under the License. #ifndef TENSORFLOW_CORE_PLATFORM_WINDOWS_WINDOWS_FILE_SYSTEM_H_ #define TENSORFLOW_CORE_PLATFORM_WINDOWS_WINDOWS_FILE_SYSTEM_H_ +#include "tensorflow/core/lib/io/path.h" #include "tensorflow/core/platform/file_system.h" #ifdef PLATFORM_WINDOWS @@ -68,7 +69,7 @@ class LocalWinFileSystem : public WindowsFileSystem { public: string TranslateName(const string& name) const override { StringPiece scheme, host, path; - ParseURI(name, &scheme, &host, &path); + io::ParseURI(name, &scheme, &host, &path); return path.ToString(); } }; diff --git a/tensorflow/core/protobuf/master.proto b/tensorflow/core/protobuf/master.proto index 1dc5e0271e3..d22a68d89c5 100644 --- a/tensorflow/core/protobuf/master.proto +++ b/tensorflow/core/protobuf/master.proto @@ -122,6 +122,10 @@ message RunStepRequest { // Options for the run call. RunOptions options = 5; + + // Partial run handle (optional). If specified, this will be a partial run + // execution, run up to the specified fetches. + string partial_run_handle = 6; } message RunStepResponse { @@ -133,6 +137,42 @@ message RunStepResponse { RunMetadata metadata = 2; } +//////////////////////////////////////////////////////////////////////////////// +// +// PartialRunSetup method request/response protos. +// +// The caller should provide the future partial run feeds, fetches, and targets. +// Then the caller can use RunStepRequest with partial_run_handle set to make +// partial run calls. +// +//////////////////////////////////////////////////////////////////////////////// + +message PartialRunSetupRequest { + // REQUIRED: session_handle must be returned by a CreateSession call + // to the same master service. + string session_handle = 1; + + // Tensors to be fed in future steps. + repeated string feed = 2; + + // Fetches. A list of tensor names. The caller expects a tensor to be returned + // for each fetch[i] (see RunStepResponse.tensor), for corresponding partial + // RunStepRequests. The order of specified fetches does not change the + // execution order. + repeated string fetch = 3; + + // Target Nodes. A list of node names. The named nodes will be run in future + // steps, but their outputs will not be fetched. + repeated string target = 4; +} + +message PartialRunSetupResponse { + // The unique handle corresponding to the ongoing partial run call set up by + // the invocation to PartialRunSetup. This handle may be passed to + // RunStepRequest to send and receive tensors for this partial run.
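+ //
+ // Sketch of the intended call sequence (illustrative, not normative):
+ //   1. CreateSession -> session_handle
+ //   2. PartialRunSetup(session_handle, feeds, fetches, targets)
+ //      -> partial_run_handle
+ //   3. Repeated RunStep calls carrying partial_run_handle, each feeding and
+ //      fetching a subset of the declared tensors, until all fetches are
+ //      consumed.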
+ string partial_run_handle = 1; +} + //////////////////////////////////////////////////////////////////////////////// // // CloseSession method request/response protos. diff --git a/tensorflow/core/protobuf/master_service.proto b/tensorflow/core/protobuf/master_service.proto index 4deb63e400b..7475491845c 100644 --- a/tensorflow/core/protobuf/master_service.proto +++ b/tensorflow/core/protobuf/master_service.proto @@ -91,6 +91,9 @@ service MasterService { // Extends a session. rpc ExtendSession(ExtendSessionRequest) returns (ExtendSessionResponse); + // Prepares future partial run calls. + rpc PartialRunSetup(PartialRunSetupRequest) returns (PartialRunSetupResponse); + // Drives the graph computation. rpc RunStep(RunStepRequest) returns (RunStepResponse); diff --git a/tensorflow/core/public/version.h b/tensorflow/core/public/version.h index 1e8ae0b1bf9..060682700cc 100644 --- a/tensorflow/core/public/version.h +++ b/tensorflow/core/public/version.h @@ -20,7 +20,7 @@ limitations under the License. #define TF_MAJOR_VERSION 0 #define TF_MINOR_VERSION 11 -#define TF_PATCH_VERSION 0rc1 +#define TF_PATCH_VERSION 0rc2 // TF_VERSION_SUFFIX is non-empty for pre-releases (e.g. "-alpha", "-alpha.1", // "-beta", "-rc", "-rc.1") diff --git a/tensorflow/core/util/cuda_kernel_helper.h b/tensorflow/core/util/cuda_kernel_helper.h index 488c28e5305..a0b7341c798 100644 --- a/tensorflow/core/util/cuda_kernel_helper.h +++ b/tensorflow/core/util/cuda_kernel_helper.h @@ -77,16 +77,8 @@ __device__ __host__ inline T ldg(const T* address) { #define CUDA_ATOMIC_WRAPPER(op, T) \ __device__ __forceinline__ T CudaAtomic##op(T* address, T val) -// Reason of guarding: NVCC cannot compile the "::" in "cuda_builtin::atomicOp". -#ifdef __GCUDACC__ -using cuda_builtin::__float_as_int; -using cuda_builtin::__int_as_float; -#define USE_CUDA_ATOMIC(op, T) \ - CUDA_ATOMIC_WRAPPER(op, T) { return cuda_builtin::atomic##op(address, val); } -#else #define USE_CUDA_ATOMIC(op, T) \ CUDA_ATOMIC_WRAPPER(op, T) { return atomic##op(address, val); } -#endif // For atomicAdd. USE_CUDA_ATOMIC(Add, int32); diff --git a/tensorflow/core/util/tensor_bundle/tensor_bundle.cc b/tensorflow/core/util/tensor_bundle/tensor_bundle.cc index 61a69a3840f..4b1a01277c8 100644 --- a/tensorflow/core/util/tensor_bundle/tensor_bundle.cc +++ b/tensorflow/core/util/tensor_bundle/tensor_bundle.cc @@ -343,7 +343,11 @@ Status BundleWriter::Finish() { status_ = env_->NewWritableFile(MetaFilename(prefix_), &file); if (!status_.ok()) return status_; { - table::TableBuilder builder(table::Options(), file.get()); + // N.B.: the default use of Snappy compression may not be supported on all + // platforms (e.g. Android). The metadata file is small, so this is fine. + table::Options options; + options.compression = table::kNoCompression; + table::TableBuilder builder(options, file.get()); // Header entry. BundleHeaderProto header; header.set_num_shards(1); diff --git a/tensorflow/core/util/work_sharder.cc b/tensorflow/core/util/work_sharder.cc index 6cede8d461e..7922fc9224e 100644 --- a/tensorflow/core/util/work_sharder.cc +++ b/tensorflow/core/util/work_sharder.cc @@ -31,12 +31,10 @@ void Shard(int max_parallelism, thread::ThreadPool* workers, int64 total, work(0, total); return; } -#ifdef EIGEN_USE_NONBLOCKING_THREAD_POOL if (max_parallelism >= workers->NumThreads()) { workers->ParallelFor(total, cost_per_unit, work); return; } -#endif cost_per_unit = std::max(1LL, cost_per_unit); // We shard [0, total) into "num_shards" shards. 
// 1 <= num_shards <= num worker threads diff --git a/tensorflow/examples/android/res/layout-land/camera_connection_fragment.xml b/tensorflow/examples/android/res/layout-land/camera_connection_fragment.xml deleted file mode 100644 index 543e5358e68..00000000000 --- a/tensorflow/examples/android/res/layout-land/camera_connection_fragment.xml +++ /dev/null @@ -1,34 +0,0 @@ - - - - - - - - diff --git a/tensorflow/examples/android/res/layout/camera_connection_fragment.xml b/tensorflow/examples/android/res/layout/camera_connection_fragment.xml index fcf08bf8835..420b69b5e3d 100644 --- a/tensorflow/examples/android/res/layout/camera_connection_fragment.xml +++ b/tensorflow/examples/android/res/layout/camera_connection_fragment.xml @@ -22,11 +22,17 @@ android:layout_width="wrap_content" android:layout_height="wrap_content" android:layout_alignParentBottom="true" /> - + - + + + diff --git a/tensorflow/examples/android/src/org/tensorflow/demo/CameraActivity.java b/tensorflow/examples/android/src/org/tensorflow/demo/CameraActivity.java index ede3af1467f..e8bbb999a7f 100644 --- a/tensorflow/examples/android/src/org/tensorflow/demo/CameraActivity.java +++ b/tensorflow/examples/android/src/org/tensorflow/demo/CameraActivity.java @@ -20,32 +20,72 @@ import android.Manifest; import android.app.Activity; import android.app.Fragment; import android.content.pm.PackageManager; +import android.media.Image.Plane; +import android.media.ImageReader.OnImageAvailableListener; import android.os.Build; import android.os.Bundle; +import android.os.Handler; +import android.os.HandlerThread; +import android.util.Size; +import android.view.MotionEvent; import android.view.WindowManager; import android.widget.Toast; +import java.nio.ByteBuffer; +import org.tensorflow.demo.env.Logger; + +public abstract class CameraActivity extends Activity implements OnImageAvailableListener { + private static final Logger LOGGER = new Logger(); -public abstract class CameraActivity extends Activity { private static final int PERMISSIONS_REQUEST = 1; private static final String PERMISSION_CAMERA = Manifest.permission.CAMERA; private static final String PERMISSION_STORAGE = Manifest.permission.WRITE_EXTERNAL_STORAGE; + private boolean debug = false; + + private Handler handler; + private HandlerThread handlerThread; + @Override protected void onCreate(final Bundle savedInstanceState) { - super.onCreate(savedInstanceState); + super.onCreate(null); getWindow().addFlags(WindowManager.LayoutParams.FLAG_KEEP_SCREEN_ON); setContentView(R.layout.activity_camera); if (hasPermission()) { - if (null == savedInstanceState) { - setFragment(); - } + setFragment(); } else { requestPermission(); } + } + @Override + public synchronized void onResume() { + super.onResume(); + + handlerThread = new HandlerThread("inference"); + handlerThread.start(); + handler = new Handler(handlerThread.getLooper()); + } + + @Override + public synchronized void onPause() { + super.onPause(); + handlerThread.quitSafely(); + try { + handlerThread.join(); + handlerThread = null; + handler = null; + } catch (final InterruptedException e) { + LOGGER.e(e, "Exception!"); + } + } + + protected synchronized void runInBackground(final Runnable r) { + if (handler != null) { + handler.post(r); + } } @Override @@ -82,11 +122,47 @@ public abstract class CameraActivity extends Activity { } protected void setFragment() { + final Fragment fragment = CameraConnectionFragment.newInstance( + new CameraConnectionFragment.ConnectionCallback(){ + @Override + public void 
onPreviewSizeChosen(final Size size, final int rotation) { + CameraActivity.this.onPreviewSizeChosen(size, rotation); + } + }, + this, getLayoutId(), getDesiredPreviewFrameSize()); + getFragmentManager() .beginTransaction() - .replace(R.id.container, createFragment()) + .replace(R.id.container, fragment) .commit(); } - protected abstract Fragment createFragment(); + protected void fillBytes(final Plane[] planes, final byte[][] yuvBytes) { + // Because of the variable row stride it's not possible to know in + // advance the actual necessary dimensions of the yuv planes. + for (int i = 0; i < planes.length; ++i) { + final ByteBuffer buffer = planes[i].getBuffer(); + if (yuvBytes[i] == null) { + LOGGER.i("Initializing buffer %d at size %d", i, buffer.capacity()); + yuvBytes[i] = new byte[buffer.capacity()]; + } + buffer.get(yuvBytes[i]); + } + } + + @Override + public boolean onTouchEvent(final MotionEvent event) { + if (event.getAction() == MotionEvent.ACTION_DOWN) { + debug = !debug; + } + return false; + } + + public boolean isDebug() { + return debug; + } + + protected abstract void onPreviewSizeChosen(final Size size, final int rotation); + protected abstract int getLayoutId(); + protected abstract int getDesiredPreviewFrameSize(); } diff --git a/tensorflow/examples/android/src/org/tensorflow/demo/CameraConnectionFragment.java b/tensorflow/examples/android/src/org/tensorflow/demo/CameraConnectionFragment.java index 0bd963b39ef..2e09e78b8a4 100644 --- a/tensorflow/examples/android/src/org/tensorflow/demo/CameraConnectionFragment.java +++ b/tensorflow/examples/android/src/org/tensorflow/demo/CameraConnectionFragment.java @@ -38,6 +38,7 @@ import android.hardware.camera2.CaptureResult; import android.hardware.camera2.TotalCaptureResult; import android.hardware.camera2.params.StreamConfigurationMap; import android.media.ImageReader; +import android.media.ImageReader.OnImageAvailableListener; import android.os.Bundle; import android.os.Handler; import android.os.HandlerThread; @@ -49,9 +50,6 @@ import android.view.TextureView; import android.view.View; import android.view.ViewGroup; import android.widget.Toast; - -import org.tensorflow.demo.env.Logger; - import java.util.ArrayList; import java.util.Arrays; import java.util.Collections; @@ -59,6 +57,7 @@ import java.util.Comparator; import java.util.List; import java.util.concurrent.Semaphore; import java.util.concurrent.TimeUnit; +import org.tensorflow.demo.env.Logger; public class CameraConnectionFragment extends Fragment { private static final Logger LOGGER = new Logger(); @@ -69,8 +68,6 @@ public class CameraConnectionFragment extends Fragment { */ private static final int MINIMUM_PREVIEW_SIZE = 320; - private ResultsView resultsView; - /** * Conversion from screen rotation to JPEG orientation. */ @@ -111,6 +108,14 @@ public class CameraConnectionFragment extends Fragment { public void onSurfaceTextureUpdated(final SurfaceTexture texture) {} }; + /** + * Callback for Activities to use to initialize their data once the + * selected preview size is known. + */ + public interface ConnectionCallback { + void onPreviewSizeChosen(Size size, int cameraRotation); + } + /** * ID of the current {@link CameraDevice}. */ @@ -184,16 +189,6 @@ public class CameraConnectionFragment extends Fragment { */ private Handler backgroundHandler; - /** - * An additional thread for running inference so as not to block the camera. - */ - private HandlerThread inferenceThread; - - /** - * A {@link Handler} for running tasks in the background. 
- */ - private Handler inferenceHandler; - /** * An {@link ImageReader} that handles preview frame capture. */ @@ -215,9 +210,10 @@ private final Semaphore cameraOpenCloseLock = new Semaphore(1); /** - * A {@link Classifier} object wrapping TensorFlow to pass frames to. + * An {@link OnImageAvailableListener} to receive frames as they are available. */ - private final Classifier classifier; + private final OnImageAvailableListener imageListener; + /** * The input size in pixels desired by TensorFlow (width and height of a square bitmap). */ @@ -228,9 +224,15 @@ */ private final int layout; + + private final ConnectionCallback cameraConnectionCallback; + private CameraConnectionFragment( - final Classifier classifier, final int layout, final int inputSize) { - this.classifier = classifier; + final ConnectionCallback connectionCallback, + final OnImageAvailableListener imageListener, + final int layout, final int inputSize) { + this.cameraConnectionCallback = connectionCallback; + this.imageListener = imageListener; this.layout = layout; this.inputSize = inputSize; } @@ -268,8 +270,12 @@ final Size[] choices, final int width, final int height, final Size aspectRatio) { // Collect the supported resolutions that are at least as big as the preview Surface final List<Size> bigEnough = new ArrayList<Size>(); + + final int minWidth = Math.max(width, MINIMUM_PREVIEW_SIZE); + final int minHeight = Math.max(height, MINIMUM_PREVIEW_SIZE); + for (final Size option : choices) { - if (option.getHeight() >= MINIMUM_PREVIEW_SIZE && option.getWidth() >= MINIMUM_PREVIEW_SIZE) { + if (option.getHeight() >= minHeight && option.getWidth() >= minWidth) { LOGGER.i("Adding size: " + option.getWidth() + "x" + option.getHeight()); bigEnough.add(option); } else { @@ -289,8 +295,9 @@ } public static CameraConnectionFragment newInstance( - final Classifier classifier, final int layout, final int inputSize) { - return new CameraConnectionFragment(classifier, layout, inputSize); + final ConnectionCallback callback, + final OnImageAvailableListener imageListener, final int layout, final int inputSize) { + return new CameraConnectionFragment(callback, imageListener, layout, inputSize); } @Override @@ -302,7 +309,6 @@ @Override public void onViewCreated(final View view, final Bundle savedInstanceState) { textureView = (AutoFitTextureView) view.findViewById(R.id.texture); - resultsView = (ResultsView) view.findViewById(R.id.results); } @Override @@ -371,7 +377,8 @@ // bus' bandwidth limitation, resulting in gorgeous previews but the storage of // garbage capture data. previewSize = - chooseOptimalSize(map.getOutputSizes(SurfaceTexture.class), width, height, largest); + chooseOptimalSize(map.getOutputSizes(SurfaceTexture.class), + inputSize, inputSize, largest); // We fit the aspect ratio of TextureView to the size of preview we picked.
final int orientation = getResources().getConfiguration().orientation; @@ -382,6 +389,8 @@ public class CameraConnectionFragment extends Fragment { } CameraConnectionFragment.this.cameraId = cameraId; + + cameraConnectionCallback.onPreviewSizeChosen(previewSize, sensorOrientation); return; } } catch (final CameraAccessException e) { @@ -446,10 +455,6 @@ public class CameraConnectionFragment extends Fragment { backgroundThread = new HandlerThread("ImageListener"); backgroundThread.start(); backgroundHandler = new Handler(backgroundThread.getLooper()); - - inferenceThread = new HandlerThread("InferenceThread"); - inferenceThread.start(); - inferenceHandler = new Handler(inferenceThread.getLooper()); } /** @@ -457,22 +462,15 @@ public class CameraConnectionFragment extends Fragment { */ private void stopBackgroundThread() { backgroundThread.quitSafely(); - inferenceThread.quitSafely(); try { backgroundThread.join(); backgroundThread = null; backgroundHandler = null; - - inferenceThread.join(); - inferenceThread = null; - inferenceThread = null; } catch (final InterruptedException e) { LOGGER.e(e, "Exception!"); } } - private final TensorFlowImageListener tfPreviewListener = new TensorFlowImageListener(); - private final CameraCaptureSession.CaptureCallback captureCallback = new CameraCaptureSession.CaptureCallback() { @Override @@ -513,7 +511,7 @@ public class CameraConnectionFragment extends Fragment { ImageReader.newInstance( previewSize.getWidth(), previewSize.getHeight(), ImageFormat.YUV_420_888, 2); - previewReader.setOnImageAvailableListener(tfPreviewListener, backgroundHandler); + previewReader.setOnImageAvailableListener(imageListener, backgroundHandler); previewRequestBuilder.addTarget(previewReader.getSurface()); // Here, we create a CameraCaptureSession for camera preview. 
@@ -557,11 +555,6 @@ public class CameraConnectionFragment extends Fragment { } catch (final CameraAccessException e) { LOGGER.e(e, "Exception!"); } - - LOGGER.i("Getting assets."); - tfPreviewListener.initialize( - classifier, resultsView, inputSize, inferenceHandler, sensorOrientation); - LOGGER.i("TensorFlow initialized."); } /** diff --git a/tensorflow/examples/android/src/org/tensorflow/demo/ClassifierActivity.java b/tensorflow/examples/android/src/org/tensorflow/demo/ClassifierActivity.java index 104ffbbd088..6f695dd7667 100644 --- a/tensorflow/examples/android/src/org/tensorflow/demo/ClassifierActivity.java +++ b/tensorflow/examples/android/src/org/tensorflow/demo/ClassifierActivity.java @@ -16,12 +16,29 @@ package org.tensorflow.demo; +import android.graphics.Bitmap; +import android.graphics.Bitmap.Config; +import android.graphics.Canvas; +import android.graphics.Matrix; +import android.graphics.Paint; +import android.media.Image; +import android.media.Image.Plane; +import android.media.ImageReader; +import android.media.ImageReader.OnImageAvailableListener; +import android.os.SystemClock; +import android.os.Trace; +import android.util.Size; +import android.util.TypedValue; +import android.view.Display; import java.io.IOException; - -import android.app.Fragment; +import java.util.List; +import java.util.Vector; +import org.tensorflow.demo.OverlayView.DrawCallback; +import org.tensorflow.demo.env.BorderedText; +import org.tensorflow.demo.env.ImageUtils; import org.tensorflow.demo.env.Logger; -public class ClassifierActivity extends CameraActivity { +public class ClassifierActivity extends CameraActivity implements OnImageAvailableListener { private static final Logger LOGGER = new Logger(); // These are the settings for the original v1 Inception model. 
If you want to @@ -41,9 +58,58 @@ public class ClassifierActivity extends CameraActivity { private static final String LABEL_FILE = "file:///android_asset/imagenet_comp_graph_label_strings.txt"; + private static final boolean SAVE_PREVIEW_BITMAP = false; + + private static final boolean MAINTAIN_ASPECT = true; + + private TensorFlowImageClassifier classifier; + + private Integer sensorOrientation; + + private int previewWidth = 0; + private int previewHeight = 0; + private byte[][] yuvBytes; + private int[] rgbBytes = null; + private Bitmap rgbFrameBitmap = null; + private Bitmap croppedBitmap = null; + + private Bitmap cropCopyBitmap; + + private boolean computing = false; + + private long timestamp = 0; + + private Matrix frameToCropTransform; + private Matrix cropToFrameTransform; + + private ResultsView resultsView; + + private OverlayView overlayView; + + private BorderedText borderedText; + + private long lastProcessingTimeMs; + @Override - protected Fragment createFragment() { - final TensorFlowImageClassifier classifier = new TensorFlowImageClassifier(); + protected int getLayoutId() { + return R.layout.camera_connection_fragment; + } + + @Override + protected int getDesiredPreviewFrameSize() { + return INPUT_SIZE; + } + + private static final float TEXT_SIZE_DIP = 18; + + @Override + public void onPreviewSizeChosen(final Size size, final int rotation) { + final float textSizePx = TypedValue.applyDimension( + TypedValue.COMPLEX_UNIT_DIP, TEXT_SIZE_DIP, + getResources().getDisplayMetrics()); + borderedText = new BorderedText(textSizePx); + + classifier = new TensorFlowImageClassifier(); try { classifier.initializeTensorFlow( getAssets(), MODEL_FILE, LABEL_FILE, NUM_CLASSES, INPUT_SIZE, IMAGE_MEAN, IMAGE_STD, @@ -52,7 +118,151 @@ public class ClassifierActivity extends CameraActivity { LOGGER.e(e, "Exception!"); } - return CameraConnectionFragment.newInstance( - classifier, R.layout.camera_connection_fragment, INPUT_SIZE); + overlayView = (OverlayView) findViewById(R.id.overlay); + resultsView = (ResultsView) findViewById(R.id.results); + previewWidth = size.getWidth(); + previewHeight = size.getHeight(); + + final Display display = getWindowManager().getDefaultDisplay(); + final int screenOrientation = display.getRotation(); + + LOGGER.i("Sensor orientation: %d, Screen orientation: %d", + rotation, screenOrientation); + + sensorOrientation = rotation + screenOrientation; + + if (sensorOrientation % 180 == 90) { + overlayView.setAspectRatio(size.getHeight(), size.getWidth()); + } else { + overlayView.setAspectRatio(size.getWidth(), size.getHeight()); + } + + LOGGER.i("Initializing at size %dx%d", previewWidth, previewHeight); + rgbBytes = new int[previewWidth * previewHeight]; + rgbFrameBitmap = Bitmap.createBitmap(previewWidth, previewHeight, Config.ARGB_8888); + croppedBitmap = Bitmap.createBitmap(INPUT_SIZE, INPUT_SIZE, Config.ARGB_8888); + + frameToCropTransform = ImageUtils.getTransformationMatrix( + previewWidth, previewHeight, + INPUT_SIZE, INPUT_SIZE, + sensorOrientation, MAINTAIN_ASPECT); + + cropToFrameTransform = new Matrix(); + frameToCropTransform.invert(cropToFrameTransform); + + yuvBytes = new byte[3][]; + + overlayView.addCallback(new DrawCallback() { + @Override + public void drawCallback(final Canvas canvas) { + renderDebug(canvas); + } + }); + } + + @Override + public void onImageAvailable(final ImageReader reader) { + Image image = null; + + ++timestamp; + + try { + image = reader.acquireLatestImage(); + + if (image == null) { + return; + } + + if (computing) { + 
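// A previous frame is still being classified ("computing" is reset only when
+ // the background inference runnable finishes), so drop this frame rather than
+ // queue it and let the camera pipeline back up.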
image.close(); + return; + } + computing = true; + + Trace.beginSection("imageAvailable"); + + final Plane[] planes = image.getPlanes(); + fillBytes(planes, yuvBytes); + + final int yRowStride = planes[0].getRowStride(); + final int uvRowStride = planes[1].getRowStride(); + final int uvPixelStride = planes[1].getPixelStride(); + ImageUtils.convertYUV420ToARGB8888( + yuvBytes[0], + yuvBytes[1], + yuvBytes[2], + rgbBytes, + previewWidth, + previewHeight, + yRowStride, + uvRowStride, + uvPixelStride, + false); + + image.close(); + } catch (final Exception e) { + if (image != null) { + image.close(); + } + LOGGER.e(e, "Exception!"); + Trace.endSection(); + return; + } + + rgbFrameBitmap.setPixels(rgbBytes, 0, previewWidth, 0, 0, previewWidth, previewHeight); + final Canvas canvas = new Canvas(croppedBitmap); + canvas.drawBitmap(rgbFrameBitmap, frameToCropTransform, null); + + // For examining the actual TF input. + if (SAVE_PREVIEW_BITMAP) { + ImageUtils.saveBitmap(croppedBitmap); + } + + runInBackground( + new Runnable() { + @Override + public void run() { + final long startTime = SystemClock.uptimeMillis(); + final List<Classifier.Recognition> results = classifier.recognizeImage(croppedBitmap); + lastProcessingTimeMs = SystemClock.uptimeMillis() - startTime; + + cropCopyBitmap = Bitmap.createBitmap(croppedBitmap); + resultsView.setResults(results); + overlayView.postInvalidate(); + computing = false; + } + }); + + Trace.endSection(); + } + + private void renderDebug(Canvas canvas) { + if (!isDebug()) { + return; + } + final Bitmap copy = cropCopyBitmap; + if (copy != null) { + final Matrix matrix = new Matrix(); + final float scaleFactor = 2; + matrix.postScale(scaleFactor, scaleFactor); + matrix.postTranslate( + canvas.getWidth() - copy.getWidth() * scaleFactor, + canvas.getHeight() - copy.getHeight() * scaleFactor); + canvas.drawBitmap(copy, matrix, new Paint()); + + final Vector<String> lines = new Vector<String>(); + lines.add("Frame: " + previewWidth + "x" + previewHeight); + lines.add("Crop: " + copy.getWidth() + "x" + copy.getHeight()); + lines.add("View: " + canvas.getWidth() + "x" + canvas.getHeight()); + lines.add("Rotation: " + sensorOrientation); + lines.add("Inference time: " + lastProcessingTimeMs + "ms"); + + int lineNum = 0; + for (final String line : lines) { + borderedText.drawText(canvas, 10, + canvas.getHeight() - 10 - borderedText.getTextSize() * lineNum, line); + ++lineNum; + } + } } } diff --git a/tensorflow/examples/android/src/org/tensorflow/demo/OverlayView.java b/tensorflow/examples/android/src/org/tensorflow/demo/OverlayView.java new file mode 100644 index 00000000000..b874bb07380 --- /dev/null +++ b/tensorflow/examples/android/src/org/tensorflow/demo/OverlayView.java @@ -0,0 +1,94 @@ +/* Copyright 2016 The TensorFlow Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License.
+==============================================================================*/ + +package org.tensorflow.demo; + +import android.content.Context; +import android.graphics.Canvas; +import android.util.AttributeSet; +import android.view.MotionEvent; +import android.view.View; +import android.view.View.MeasureSpec; +import java.util.LinkedList; +import java.util.List; + +/** + * A simple View providing a render callback to other classes. + */ +public class OverlayView extends View { + public OverlayView(final Context context, final AttributeSet attrs) { + super(context, attrs); + } + + /** + * Interface defining the callback for client classes. + */ + public interface DrawCallback { + public void drawCallback(final Canvas canvas); + } + + private int ratioWidth; + private int ratioHeight; + + private boolean debug; + + private final List<DrawCallback> callbacks = new LinkedList<DrawCallback>(); + + @Override + public boolean onTouchEvent(final MotionEvent e) { + super.onTouchEvent(e); + if (e.getAction() == MotionEvent.ACTION_DOWN) { + debug = !debug; + } + return false; + } + + public void addCallback(final DrawCallback callback) { + callbacks.add(callback); + } + + @Override + public synchronized void draw(final Canvas canvas) { + for (final DrawCallback callback : callbacks) { + callback.drawCallback(canvas); + } + } + + public void setAspectRatio(final int width, final int height) { + if (width < 0 || height < 0) { + throw new IllegalArgumentException("Size cannot be negative."); + } + ratioWidth = width; + ratioHeight = height; + requestLayout(); + } + + @Override + protected void onMeasure(final int widthMeasureSpec, final int heightMeasureSpec) { + super.onMeasure(widthMeasureSpec, heightMeasureSpec); + final int width = MeasureSpec.getSize(widthMeasureSpec); + final int height = MeasureSpec.getSize(heightMeasureSpec); + if (0 == ratioWidth || 0 == ratioHeight) { + setMeasuredDimension(width, height); + } else { + if (width < height * ratioWidth / ratioHeight) { + setMeasuredDimension(width, width * ratioHeight / ratioWidth); + } else { + setMeasuredDimension(height * ratioWidth / ratioHeight, height); + } + } + } + +} diff --git a/tensorflow/examples/android/src/org/tensorflow/demo/TensorFlowImageClassifier.java b/tensorflow/examples/android/src/org/tensorflow/demo/TensorFlowImageClassifier.java index c2ac42657e2..d49982e17a6 100644 --- a/tensorflow/examples/android/src/org/tensorflow/demo/TensorFlowImageClassifier.java +++ b/tensorflow/examples/android/src/org/tensorflow/demo/TensorFlowImageClassifier.java @@ -160,7 +160,8 @@ public class TensorFlowImageClassifier implements Classifier { } } final ArrayList<Recognition> recognitions = new ArrayList<Recognition>(); - for (int i = 0; i < Math.min(pq.size(), MAX_RESULTS); ++i) { + int recognitionsSize = Math.min(pq.size(), MAX_RESULTS); + for (int i = 0; i < recognitionsSize; ++i) { recognitions.add(pq.poll()); } Trace.endSection(); // "recognizeImage" diff --git a/tensorflow/examples/android/src/org/tensorflow/demo/env/BorderedText.java b/tensorflow/examples/android/src/org/tensorflow/demo/env/BorderedText.java new file mode 100644 index 00000000000..e4b13bb7abf --- /dev/null +++ b/tensorflow/examples/android/src/org/tensorflow/demo/env/BorderedText.java @@ -0,0 +1,119 @@ +/* Copyright 2016 The TensorFlow Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License.
+You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +==============================================================================*/ + +package org.tensorflow.demo.env; + +import android.graphics.Canvas; +import android.graphics.Color; +import android.graphics.Paint; +import android.graphics.Paint.Align; +import android.graphics.Paint.Style; +import android.graphics.Rect; + +/** + * A class that encapsulates the tedious bits of rendering legible, bordered text onto a canvas. + */ +public class BorderedText { + private final Paint interiorPaint; + private final Paint exteriorPaint; + + private final float textSize; + + /** + * Creates a left-aligned bordered text object with a white interior, and a black exterior with + * the specified text size. + * + * @param textSize text size in pixels + */ + public BorderedText(final float textSize) { + this(Color.WHITE, Color.BLACK, textSize); + } + + /** + * Create a bordered text object with the specified interior and exterior colors, text size and + * alignment. + * + * @param interiorColor the interior text color + * @param exteriorColor the exterior text color + * @param textSize text size in pixels + */ + public BorderedText(final int interiorColor, final int exteriorColor, final float textSize) { + interiorPaint = new Paint(); + interiorPaint.setTextSize(textSize); + interiorPaint.setColor(interiorColor); + interiorPaint.setStyle(Style.FILL); + interiorPaint.setAntiAlias(false); + interiorPaint.setAlpha(255); + + exteriorPaint = new Paint(); + exteriorPaint.setTextSize(textSize); + exteriorPaint.setColor(exteriorColor); + exteriorPaint.setStyle(Style.FILL_AND_STROKE); + exteriorPaint.setStrokeWidth(textSize / 8); + exteriorPaint.setAntiAlias(false); + exteriorPaint.setAlpha(255); + + this.textSize = textSize; + } + + public void drawText(final Canvas canvas, final float posX, final float posY, final String text) { + /* + if (widths == null || widths.length < text.length()) { + widths = new float[text.length()]; + positions = new float[text.length() * 2]; + } + + exteriorPaint.getTextWidths(text, widths); + float lastPosX = posX; + for (int i = 0; i < widths.length; ++i) { + positions[i * 2] = lastPosX; + positions[i * 2 + 1] = posY; + lastPosX += widths[i]; + } + */ + + //canvas.drawPosText(text, positions, exteriorPaint); + //canvas.drawPosText(text, positions, exteriorPaint); + canvas.drawText(text, posX, posY, exteriorPaint); + canvas.drawText(text, posX, posY, interiorPaint); + } + + public void setInteriorColor(final int color) { + interiorPaint.setColor(color); + } + + public void setExteriorColor(final int color) { + exteriorPaint.setColor(color); + } + + public float getTextSize() { + return textSize; + } + + public void setAlpha(final int alpha) { + interiorPaint.setAlpha(alpha); + exteriorPaint.setAlpha(alpha); + } + + public void getTextBounds( + final String line, final int index, final int count, final Rect lineBounds) { + interiorPaint.getTextBounds(line, index, count, lineBounds); + } + + public void setTextAlign(final Align align) { + interiorPaint.setTextAlign(align); + exteriorPaint.setTextAlign(align); + } +} diff --git 
a/tensorflow/examples/android/src/org/tensorflow/demo/env/ImageUtils.java b/tensorflow/examples/android/src/org/tensorflow/demo/env/ImageUtils.java index a6a8c583190..6f957d1abd5 100644 --- a/tensorflow/examples/android/src/org/tensorflow/demo/env/ImageUtils.java +++ b/tensorflow/examples/android/src/org/tensorflow/demo/env/ImageUtils.java @@ -16,8 +16,8 @@ limitations under the License. package org.tensorflow.demo.env; import android.graphics.Bitmap; +import android.graphics.Matrix; import android.os.Environment; - import java.io.File; import java.io.FileOutputStream; @@ -49,6 +49,16 @@ public class ImageUtils { * @param bitmap The bitmap to save. */ public static void saveBitmap(final Bitmap bitmap) { + saveBitmap(bitmap, "preview.png"); + } + + /** + * Saves a Bitmap object to disk for analysis. + * + * @param bitmap The bitmap to save. + * @param filename The location to save the bitmap to. + */ + public static void saveBitmap(final Bitmap bitmap, final String filename) { final String root = Environment.getExternalStorageDirectory().getAbsolutePath() + File.separator + "tensorflow"; LOGGER.i("Saving %dx%d bitmap to %s.", bitmap.getWidth(), bitmap.getHeight(), root); @@ -58,7 +68,7 @@ public class ImageUtils { LOGGER.i("Make dir failed"); } - final String fname = "preview.png"; + final String fname = filename; final File file = new File(myDir, fname); if (file.exists()) { file.delete(); @@ -151,4 +161,66 @@ public class ImageUtils { */ public static native void convertRGB565ToYUV420SP( byte[] input, byte[] output, int width, int height); + + /** + * Returns a transformation matrix from one reference frame into another. + * Handles cropping (if maintaining aspect ratio is desired) and rotation. + * + * @param srcWidth Width of source frame. + * @param srcHeight Height of source frame. + * @param dstWidth Width of destination frame. + * @param dstHeight Height of destination frame. + * @param applyRotation Amount of rotation to apply from one frame to another. + * Must be a multiple of 90. + * @param maintainAspectRatio If true, will ensure that scaling in x and y remains constant, + * cropping the image if necessary. + * @return The transformation fulfilling the desired requirements. + */ + public static Matrix getTransformationMatrix( + final int srcWidth, + final int srcHeight, + final int dstWidth, + final int dstHeight, + final int applyRotation, + final boolean maintainAspectRatio) { + final Matrix matrix = new Matrix(); + + if (applyRotation != 0) { + // Translate so center of image is at origin. + matrix.postTranslate(-srcWidth / 2.0f, -srcHeight / 2.0f); + + // Rotate around origin. + matrix.postRotate(applyRotation); + } + + // Account for the already applied rotation, if any, and then determine how + // much scaling is needed for each axis. + final boolean transpose = (Math.abs(applyRotation) + 90) % 180 == 0; + + final int inWidth = transpose ? srcHeight : srcWidth; + final int inHeight = transpose ? srcWidth : srcHeight; + + // Apply scaling if necessary. + if (inWidth != dstWidth || inHeight != dstHeight) { + final float scaleFactorX = dstWidth / (float) inWidth; + final float scaleFactorY = dstHeight / (float) inHeight; + + if (maintainAspectRatio) { + // Scale by minimum factor so that dst is filled completely while + // maintaining the aspect ratio. Some image may fall off the edge. + final float scaleFactor = Math.max(scaleFactorX, scaleFactorY); + matrix.postScale(scaleFactor, scaleFactor); + } else { + // Scale exactly to fill dst from src.
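+ // (Here the x and y factors may differ, so the image can be stretched.)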
+ matrix.postScale(scaleFactorX, scaleFactorY); + } + } + + if (applyRotation != 0) { + // Translate back from origin centered reference to destination frame. + matrix.postTranslate(dstWidth / 2.0f, dstHeight / 2.0f); + } + + return matrix; + } } diff --git a/tensorflow/examples/android/src/org/tensorflow/demo/env/Size.java b/tensorflow/examples/android/src/org/tensorflow/demo/env/Size.java new file mode 100644 index 00000000000..ef15d14daa8 --- /dev/null +++ b/tensorflow/examples/android/src/org/tensorflow/demo/env/Size.java @@ -0,0 +1,143 @@ +/* Copyright 2016 The TensorFlow Authors. All Rights Reserved. + +Licensed under the Apache License, Version 2.0 (the "License"); +you may not use this file except in compliance with the License. +You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + +Unless required by applicable law or agreed to in writing, software +distributed under the License is distributed on an "AS IS" BASIS, +WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +See the License for the specific language governing permissions and +limitations under the License. +==============================================================================*/ + +package org.tensorflow.demo.env; + +import android.graphics.Bitmap; +import android.text.TextUtils; +import java.io.Serializable; +import java.util.ArrayList; +import java.util.List; + +/** + * Size class independent of a Camera object. + */ +public class Size implements Comparable<Size>, Serializable { + + // 1.4 went out with this UID so we'll need to maintain it to preserve pending queries when + // upgrading. + public static final long serialVersionUID = 7689808733290872361L; + + public final int width; + public final int height; + + public Size(final int width, final int height) { + this.width = width; + this.height = height; + } + + public Size(final Bitmap bmp) { + this.width = bmp.getWidth(); + this.height = bmp.getHeight(); + } + + /** + * Rotate a size by the given number of degrees. + * @param size Size to rotate. + * @param rotation Degrees {0, 90, 180, 270} to rotate the size. + * @return Rotated size. + */ + public static Size getRotatedSize(final Size size, final int rotation) { + if (rotation % 180 != 0) { + // The phone is portrait, therefore the camera is sideways and frame should be rotated. + return new Size(size.height, size.width); + } + return size; + } + + public static Size parseFromString(String sizeString) { + if (TextUtils.isEmpty(sizeString)) { + return null; + } + + sizeString = sizeString.trim(); + + // The expected format is "<width>x<height>".
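+ // e.g. "640x480"; any other shape, or non-numeric components, yields null.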
+ final String[] components = sizeString.split("x"); + if (components.length == 2) { + try { + final int width = Integer.parseInt(components[0]); + final int height = Integer.parseInt(components[1]); + return new Size(width, height); + } catch (final NumberFormatException e) { + return null; + } + } else { + return null; + } + } + + public static List<Size> sizeStringToList(final String sizes) { + final List<Size> sizeList = new ArrayList<Size>(); + if (sizes != null) { + final String[] pairs = sizes.split(","); + for (final String pair : pairs) { + final Size size = Size.parseFromString(pair); + if (size != null) { + sizeList.add(size); + } + } + } + return sizeList; + } + + public static String sizeListToString(final List<Size> sizes) { + String sizesString = ""; + if (sizes != null && sizes.size() > 0) { + sizesString = sizes.get(0).toString(); + for (int i = 1; i < sizes.size(); i++) { + sizesString += "," + sizes.get(i).toString(); + } + } + return sizesString; + } + + public final float aspectRatio() { + return (float) width / (float) height; + } + + @Override + public int compareTo(final Size other) { + return width * height - other.width * other.height; + } + + @Override + public boolean equals(final Object other) { + if (other == null) { + return false; + } + + if (!(other instanceof Size)) { + return false; + } + + final Size otherSize = (Size) other; + return (width == otherSize.width && height == otherSize.height); + } + + @Override + public int hashCode() { + return width * 32713 + height; + } + + @Override + public String toString() { + return dimensionsAsString(width, height); + } + + public static final String dimensionsAsString(final int width, final int height) { + return width + "x" + height; + } +} diff --git a/tensorflow/examples/image_retraining/retrain.py b/tensorflow/examples/image_retraining/retrain.py index 392f0176d37..74c1de8fd7d 100644 --- a/tensorflow/examples/image_retraining/retrain.py +++ b/tensorflow/examples/image_retraining/retrain.py @@ -66,7 +66,6 @@ from __future__ import print_function import argparse from datetime import datetime -import glob import hashlib import os.path import random @@ -131,7 +130,7 @@ def create_image_lists(image_dir, testing_percentage, validation_percentage): print("Image directory '" + image_dir + "' not found.") return None result = {} - sub_dirs = [x[0] for x in os.walk(image_dir)] + sub_dirs = [x[0] for x in gfile.Walk(image_dir)] # The root directory comes first, so skip it. is_root_dir = True for sub_dir in sub_dirs: @@ -146,7 +145,7 @@ def create_image_lists(image_dir, testing_percentage, validation_percentage): print("Looking for images in '" + dir_name + "'") for extension in extensions: file_glob = os.path.join(image_dir, dir_name, '*.'
+ extension) - file_list.extend(glob.glob(file_glob)) + file_list.extend(gfile.Glob(file_glob)) if not file_list: print('No files found') continue diff --git a/tensorflow/examples/learn/BUILD b/tensorflow/examples/learn/BUILD index b7eb2ce1cba..169cd8d8670 100644 --- a/tensorflow/examples/learn/BUILD +++ b/tensorflow/examples/learn/BUILD @@ -156,6 +156,25 @@ py_binary( ], ) +py_binary( + name = "mnist", + srcs = ["mnist.py"], + srcs_version = "PY2AND3", + deps = [ + "//tensorflow:tensorflow_py", + "//tensorflow/examples/tutorials/mnist:input_data", + ], +) + +py_binary( + name = "multiple_gpu", + srcs = ["multiple_gpu.py"], + srcs_version = "PY2AND3", + deps = [ + "//tensorflow:tensorflow_py", + ], +) + sh_test( name = "examples_test", size = "large", diff --git a/tensorflow/examples/learn/examples_test.sh b/tensorflow/examples/learn/examples_test.sh index 317e70d5745..8942720271c 100755 --- a/tensorflow/examples/learn/examples_test.sh +++ b/tensorflow/examples/learn/examples_test.sh @@ -46,16 +46,16 @@ function test() { test boston test iris -test iris_custom_model test iris_custom_decay_dnn +test iris_custom_model test iris_run_config test iris_val_based_early_stopping test iris_with_pipeline +test random_forest_mnist test resnet test text_classification --test_with_fake_data test text_classification_builtin_rnn_model --test_with_fake_data -test text_classification_cnn --test_with_fake_data test text_classification_character_cnn --test_with_fake_data test text_classification_character_rnn --test_with_fake_data -test random_forest_mnist +test text_classification_cnn --test_with_fake_data test wide_n_deep_tutorial diff --git a/tensorflow/examples/learn/iris_custom_model.py b/tensorflow/examples/learn/iris_custom_model.py index 149ee47fa75..bfe5238eba5 100644 --- a/tensorflow/examples/learn/iris_custom_model.py +++ b/tensorflow/examples/learn/iris_custom_model.py @@ -38,17 +38,18 @@ def my_model(features, target): normalizer_fn=normalizer_fn, normalizer_params=normalizer_params) - # Create two tensors respectively for prediction and loss. - prediction, loss = ( - tf.contrib.learn.models.logistic_regression(features, target) - ) + # Compute logits (1 per class) and compute loss. + logits = layers.fully_connected(features, 3, activation_fn=None) + loss = tf.contrib.losses.softmax_cross_entropy(logits, target) # Create a tensor for training op. train_op = tf.contrib.layers.optimize_loss( loss, tf.contrib.framework.get_global_step(), optimizer='Adagrad', learning_rate=0.1) - return {'class': tf.argmax(prediction, 1), 'prob': prediction}, loss, train_op + return ({ + 'class': tf.argmax(logits, 1), + 'prob': tf.nn.softmax(logits)}, loss, train_op) def main(unused_argv): diff --git a/tensorflow/examples/learn/iris_with_pipeline.py b/tensorflow/examples/learn/iris_with_pipeline.py index c548387f388..94cfbceee0f 100644 --- a/tensorflow/examples/learn/iris_with_pipeline.py +++ b/tensorflow/examples/learn/iris_with_pipeline.py @@ -47,7 +47,7 @@ def main(unused_argv): pipeline.fit(x_train, y_train, DNNclassifier__steps=200) - score = accuracy_score(y_test, pipeline.predict(x_test)) + score = accuracy_score(y_test, list(pipeline.predict(x_test))) print('Accuracy: {0:f}'.format(score)) diff --git a/tensorflow/examples/learn/mnist.py b/tensorflow/examples/learn/mnist.py new file mode 100644 index 00000000000..8b416373ba0 --- /dev/null +++ b/tensorflow/examples/learn/mnist.py @@ -0,0 +1,104 @@ +# Copyright 2016 The TensorFlow Authors. All Rights Reserved. 
+# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +"""This showcases how simple it is to build image classification networks. + +It follows the description in this TensorFlow tutorial: + https://www.tensorflow.org/versions/master/tutorials/mnist/pros/index.html#deep-mnist-for-experts +""" + +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import numpy as np +from sklearn import metrics +import tensorflow as tf +from tensorflow.contrib import layers +from tensorflow.contrib import learn + + +def max_pool_2x2(tensor_in): + return tf.nn.max_pool( + tensor_in, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME') + + +def conv_model(feature, target, mode): + """2-layer convolution model.""" + # Convert the target to a one-hot tensor of shape (batch_size, 10) with + # an on-value of 1 for each one-hot vector of length 10. + target = tf.one_hot(tf.cast(target, tf.int32), 10, 1, 0) + + # Reshape feature to 4d tensor with 2nd and 3rd dimensions being + # image width and height, and the final dimension being the number of + # color channels. + feature = tf.reshape(feature, [-1, 28, 28, 1]) + + # First conv layer will compute 32 features for each 5x5 patch. + with tf.variable_scope('conv_layer1'): + h_conv1 = layers.convolution(feature, 32, kernel_size=[5, 5], + activation_fn=tf.nn.relu) + h_pool1 = max_pool_2x2(h_conv1) + + # Second conv layer will compute 64 features for each 5x5 patch. + with tf.variable_scope('conv_layer2'): + h_conv2 = layers.convolution(h_pool1, 64, kernel_size=[5, 5], + activation_fn=tf.nn.relu) + h_pool2 = max_pool_2x2(h_conv2) + # Reshape tensor into a batch of vectors. + h_pool2_flat = tf.reshape(h_pool2, [-1, 7 * 7 * 64]) + + # Densely connected layer with 1024 neurons. + h_fc1 = layers.dropout( + layers.fully_connected( + h_pool2_flat, 1024, activation_fn=tf.nn.relu), keep_prob=0.5, + is_training=mode == tf.contrib.learn.ModeKeys.TRAIN) + + # Compute logits (1 per class) and compute loss. + logits = layers.fully_connected(h_fc1, 10, activation_fn=None) + loss = tf.contrib.losses.softmax_cross_entropy(logits, target) + + # Create a tensor for training op. + train_op = layers.optimize_loss( + loss, tf.contrib.framework.get_global_step(), optimizer='SGD', + learning_rate=0.001) + + return tf.argmax(logits, 1), loss, train_op + + +def main(unused_args): + ### Download and load MNIST dataset. + mnist = learn.datasets.load_dataset('mnist') + + ### Linear classifier.
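+ # Baseline: a linear (softmax) classifier on raw pixel values, for + # comparison with the convolutional model fitted below.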
+ feature_columns = learn.infer_real_valued_columns_from_input( + mnist.train.images) + classifier = learn.LinearClassifier( + feature_columns=feature_columns, n_classes=10) + classifier.fit(mnist.train.images, mnist.train.labels.astype(np.int32), + batch_size=100, steps=1000) + score = metrics.accuracy_score( + mnist.test.labels, list(classifier.predict(mnist.test.images))) + print('Accuracy: {0:f}'.format(score)) + + ### Convolutional network + classifier = learn.Estimator(model_fn=conv_model) + classifier.fit(mnist.train.images, mnist.train.labels, + batch_size=100, steps=20000) + score = metrics.accuracy_score( + mnist.test.labels, list(classifier.predict(mnist.test.images))) + print('Accuracy: {0:f}'.format(score)) + + +if __name__ == '__main__': + tf.app.run() diff --git a/tensorflow/examples/learn/multiple_gpu.py b/tensorflow/examples/learn/multiple_gpu.py new file mode 100644 index 00000000000..6647ec3d42e --- /dev/null +++ b/tensorflow/examples/learn/multiple_gpu.py @@ -0,0 +1,87 @@ +# Copyright 2016 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +"""Example of using Estimator with multiple GPUs to distribute one model. + +This example only runs if you have multiple GPUs available to assign ops to. +""" + +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +from sklearn import cross_validation +from sklearn import datasets +from sklearn import metrics +import tensorflow as tf +from tensorflow.contrib import layers +from tensorflow.contrib import learn + + +def my_model(features, target): + """DNN with three hidden layers, and a dropout probability of 0.5. + + Note: If you want to run this example with multiple GPUs, Cuda Toolkit 7.0 and + CUDNN 6.5 V2 from NVIDIA need to be installed beforehand. + + Args: + features: `Tensor` of input features. + target: `Tensor` of targets. + + Returns: + Tuple of predictions, loss and training op. + """ + # Convert the target to a one-hot tensor of shape (length of features, 3) + # with an on-value of 1 for each one-hot vector of length 3. + target = tf.one_hot(target, 3, 1, 0) + + # Create three fully connected layers respectively of size 10, 20, and 10, + # each with a dropout probability of 0.5. + normalizer_fn = layers.dropout + normalizer_params = {'keep_prob': 0.5} + with tf.device('/gpu:1'): + features = layers.stack(features, layers.fully_connected, [10, 20, 10], + normalizer_fn=normalizer_fn, + normalizer_params=normalizer_params) + + with tf.device('/gpu:2'): + # Compute logits (1 per class) and compute loss. + logits = layers.fully_connected(features, 3, activation_fn=None) + loss = tf.contrib.losses.softmax_cross_entropy(logits, target) + + # Create a tensor for training op.
+ train_op = tf.contrib.layers.optimize_loss( + loss, tf.contrib.framework.get_global_step(), optimizer='Adagrad', + learning_rate=0.1) + + return ({ + 'class': tf.argmax(logits, 1), + 'prob': tf.nn.softmax(logits)}, loss, train_op) + + +def main(unused_argv): + iris = datasets.load_iris() + x_train, x_test, y_train, y_test = cross_validation.train_test_split( + iris.data, iris.target, test_size=0.2, random_state=42) + + classifier = learn.Estimator(model_fn=my_model) + classifier.fit(x_train, y_train, steps=1000) + + y_predicted = [ + p['class'] for p in classifier.predict(x_test, as_iterable=True)] + score = metrics.accuracy_score(y_test, y_predicted) + print('Accuracy: {0:f}'.format(score)) + + +if __name__ == '__main__': + tf.app.run() diff --git a/tensorflow/examples/learn/resnet.py b/tensorflow/examples/learn/resnet.py index 3e9b579b357..fe1a07ccfa1 100755 --- a/tensorflow/examples/learn/resnet.py +++ b/tensorflow/examples/learn/resnet.py @@ -132,7 +132,10 @@ def res_net(x, y, activation=tf.nn.relu): net = tf.reshape(net, [-1, net_shape[1] * net_shape[2] * net_shape[3]]) target = tf.one_hot(y, depth=10, dtype=tf.float32) - return learn.models.logistic_regression(net, target) + logits = tf.contrib.layers.fully_connected(net, 10, activation_fn=None) + loss = tf.contrib.losses.softmax_cross_entropy(logits, target) + return tf.nn.softmax(logits), loss + def res_net_model(x, y): prediction, loss = res_net(x, y) diff --git a/tensorflow/examples/learn/text_classification.py b/tensorflow/examples/learn/text_classification.py index 87a23831f35..7ad77787abb 100644 --- a/tensorflow/examples/learn/text_classification.py +++ b/tensorflow/examples/learn/text_classification.py @@ -34,28 +34,29 @@ EMBEDDING_SIZE = 50 n_words = 0 -def bag_of_words_model(x, y): +def bag_of_words_model(features, target): """A bag-of-words model. Note it disregards the word order in the text.""" - target = tf.one_hot(y, 15, 1, 0) - word_vectors = learn.ops.categorical_variable(x, n_classes=n_words, - embedding_size=EMBEDDING_SIZE, name='words') - features = tf.reduce_max(word_vectors, reduction_indices=1) - prediction, loss = learn.models.logistic_regression(features, target) + target = tf.one_hot(target, 15, 1, 0) + features = tf.contrib.layers.bow_encoder( + features, vocab_size=n_words, embed_dim=EMBEDDING_SIZE) + logits = tf.contrib.layers.fully_connected(features, 15, activation_fn=None) + loss = tf.contrib.losses.softmax_cross_entropy(logits, target) train_op = tf.contrib.layers.optimize_loss( loss, tf.contrib.framework.get_global_step(), optimizer='Adam', learning_rate=0.01) - return {'class': tf.argmax(prediction, 1), 'prob': prediction}, loss, train_op + return ( + {'class': tf.argmax(logits, 1), 'prob': tf.nn.softmax(logits)}, + loss, train_op) -def rnn_model(x, y): - """Recurrent neural network model to predict from sequence of words - to a class.""" +def rnn_model(features, target): + """RNN model to predict from sequence of words to a class.""" # Convert indexes of words into embeddings. # This creates embeddings matrix of [n_words, EMBEDDING_SIZE] and then # maps word indexes of the sequence into [batch_size, sequence_length, # EMBEDDING_SIZE]. - word_vectors = learn.ops.categorical_variable(x, n_classes=n_words, - embedding_size=EMBEDDING_SIZE, name='words') + word_vectors = tf.contrib.layers.embed_sequence( + features, vocab_size=n_words, embed_dim=EMBEDDING_SIZE, scope='words') # Split into list of embedding per word, while removing doc length dim.
# word_list results to be a list of tensors [batch_size, EMBEDDING_SIZE]. @@ -71,15 +72,18 @@ def rnn_model(x, y): # Given encoding of RNN, take encoding of last step (e.g hidden size of the # neural network of last step) and pass it as features for logistic # regression over output classes. - target = tf.one_hot(y, 15, 1, 0) - prediction, loss = learn.models.logistic_regression(encoding, target) + target = tf.one_hot(target, 15, 1, 0) + logits = tf.contrib.layers.fully_connected(encoding, 15, activation_fn=None) + loss = tf.contrib.losses.softmax_cross_entropy(logits, target) # Create a training op. train_op = tf.contrib.layers.optimize_loss( loss, tf.contrib.framework.get_global_step(), optimizer='Adam', learning_rate=0.01) - return {'class': tf.argmax(prediction, 1), 'prob': prediction}, loss, train_op + return ( + {'class': tf.argmax(logits, 1), 'prob': tf.nn.softmax(logits)}, + loss, train_op) def main(unused_argv): @@ -100,7 +104,11 @@ def main(unused_argv): print('Total words: %d' % n_words) # Build model - classifier = learn.Estimator(model_fn=bag_of_words_model) + # Switch between rnn_model and bag_of_words_model to test different models. + model_fn = rnn_model + if FLAGS.bow_model: + model_fn = bag_of_words_model + classifier = learn.Estimator(model_fn=model_fn) # Train and predict classifier.fit(x_train, y_train, steps=100) @@ -118,5 +126,11 @@ if __name__ == '__main__': help='Test the example code with fake data.', action='store_true' ) + parser.add_argument( + '--bow_model', + default=False, + help='Run with BOW model instead of RNN.', + action='store_true' + ) FLAGS, unparsed = parser.parse_known_args() tf.app.run(main=main, argv=[sys.argv[0]] + unparsed) diff --git a/tensorflow/examples/learn/text_classification_builtin_rnn_model.py b/tensorflow/examples/learn/text_classification_builtin_rnn_model.py index 6a1c05b86b1..79654eb9021 100644 --- a/tensorflow/examples/learn/text_classification_builtin_rnn_model.py +++ b/tensorflow/examples/learn/text_classification_builtin_rnn_model.py @@ -32,14 +32,14 @@ EMBEDDING_SIZE = 50 n_words = 0 -def input_op_fn(x): +def input_op_fn(features): """Customized function to transform batched x into embeddings.""" # Convert indexes of words into embeddings. # This creates embeddings matrix of [n_words, EMBEDDING_SIZE] and then # maps word indexes of the sequence into [batch_size, sequence_length, # EMBEDDING_SIZE]. - word_vectors = learn.ops.categorical_variable(x, n_classes=n_words, - embedding_size=EMBEDDING_SIZE, name='words') + word_vectors = tf.contrib.layers.embed_sequence( + features, vocab_size=n_words, embed_dim=EMBEDDING_SIZE, scope='words') # Split into list of embedding per word, while removing doc length dim. # word_list results to be a list of tensors [batch_size, EMBEDDING_SIZE]. 
word_list = tf.unpack(word_vectors, axis=1) diff --git a/tensorflow/examples/learn/text_classification_character_cnn.py b/tensorflow/examples/learn/text_classification_character_cnn.py index e84790471b5..ffb5a51ad4d 100644 --- a/tensorflow/examples/learn/text_classification_character_cnn.py +++ b/tensorflow/examples/learn/text_classification_character_cnn.py @@ -48,15 +48,15 @@ POOLING_WINDOW = 4 POOLING_STRIDE = 2 -def char_cnn_model(x, y): +def char_cnn_model(features, target): """Character level convolutional neural network model to predict classes.""" - y = tf.one_hot(y, 15, 1, 0) - byte_list = tf.reshape(learn.ops.one_hot_matrix(x, 256), + target = tf.one_hot(target, 15, 1, 0) + byte_list = tf.reshape(tf.one_hot(features, 256, 1, 0), [-1, MAX_DOCUMENT_LENGTH, 256, 1]) with tf.variable_scope('CNN_Layer1'): # Apply Convolution filtering on input sequence. - conv1 = tf.contrib.layers.convolution2d(byte_list, N_FILTERS, - FILTER_SHAPE1, padding='VALID') + conv1 = tf.contrib.layers.convolution2d( + byte_list, N_FILTERS, FILTER_SHAPE1, padding='VALID') # Add a RELU for non linearity. conv1 = tf.nn.relu(conv1) # Max pooling across output of Convolution+Relu. @@ -66,20 +66,22 @@ def char_cnn_model(x, y): pool1 = tf.transpose(pool1, [0, 1, 3, 2]) with tf.variable_scope('CNN_Layer2'): # Second level of convolution filtering. - conv2 = tf.contrib.layers.convolution2d(pool1, N_FILTERS, - FILTER_SHAPE2, - padding='VALID') + conv2 = tf.contrib.layers.convolution2d( + pool1, N_FILTERS, FILTER_SHAPE2, padding='VALID') # Max across each filter to get useful features for classification. pool2 = tf.squeeze(tf.reduce_max(conv2, 1), squeeze_dims=[1]) # Apply regular WX + B and classification. - prediction, loss = learn.models.logistic_regression(pool2, y) + logits = tf.contrib.layers.fully_connected(pool2, 15, activation_fn=None) + loss = tf.contrib.losses.softmax_cross_entropy(logits, target) train_op = tf.contrib.layers.optimize_loss( loss, tf.contrib.framework.get_global_step(), optimizer='Adam', learning_rate=0.01) - return {'class': tf.argmax(prediction, 1), 'prob': prediction}, loss, train_op + return ( + {'class': tf.argmax(logits, 1), 'prob': tf.nn.softmax(logits)}, + loss, train_op) def main(unused_argv): diff --git a/tensorflow/examples/learn/text_classification_character_rnn.py b/tensorflow/examples/learn/text_classification_character_rnn.py index e62663aa8af..bca3df4c04f 100644 --- a/tensorflow/examples/learn/text_classification_character_rnn.py +++ b/tensorflow/examples/learn/text_classification_character_rnn.py @@ -44,22 +44,25 @@ MAX_DOCUMENT_LENGTH = 100 HIDDEN_SIZE = 20 -def char_rnn_model(x, y): +def char_rnn_model(features, target): """Character level recurrent neural network model to predict classes.""" - y = tf.one_hot(y, 15, 1, 0) - byte_list = learn.ops.one_hot_matrix(x, 256) + target = tf.one_hot(target, 15, 1, 0) + byte_list = tf.one_hot(features, 256, 1, 0) + byte_list = tf.unpack(byte_list, axis=1) cell = tf.nn.rnn_cell.GRUCell(HIDDEN_SIZE) _, encoding = tf.nn.rnn(cell, byte_list, dtype=tf.float32) - prediction, loss = learn.models.logistic_regression(encoding, y) + logits = tf.contrib.layers.fully_connected(encoding, 15, activation_fn=None) + loss = tf.contrib.losses.softmax_cross_entropy(logits, target) train_op = tf.contrib.layers.optimize_loss( loss, tf.contrib.framework.get_global_step(), optimizer='Adam', learning_rate=0.01) - return {'class': tf.argmax(prediction, 1), 'prob': prediction}, loss, train_op + return ( + {'class': tf.argmax(logits, 1), 'prob':
tf.nn.softmax(logits)}, + loss, train_op) def main(unused_argv): diff --git a/tensorflow/examples/learn/text_classification_cnn.py b/tensorflow/examples/learn/text_classification_cnn.py index f71df272ead..cb17ae46ae5 100644 --- a/tensorflow/examples/learn/text_classification_cnn.py +++ b/tensorflow/examples/learn/text_classification_cnn.py @@ -40,16 +40,15 @@ POOLING_STRIDE = 2 n_words = 0 -def cnn_model(x, y): - """2 layer Convolutional network to predict from sequence of words - to a class.""" +def cnn_model(features, target): + """2 layer ConvNet to predict from sequence of words to a class.""" # Convert indexes of words into embeddings. # This creates embeddings matrix of [n_words, EMBEDDING_SIZE] and then # maps word indexes of the sequence into [batch_size, sequence_length, # EMBEDDING_SIZE]. - y = tf.one_hot(y, 15, 1, 0) - word_vectors = learn.ops.categorical_variable(x, n_classes=n_words, - embedding_size=EMBEDDING_SIZE, name='words') + target = tf.one_hot(target, 15, 1, 0) + word_vectors = tf.contrib.layers.embed_sequence( + features, vocab_size=n_words, embed_dim=EMBEDDING_SIZE, scope='words') word_vectors = tf.expand_dims(word_vectors, 3) with tf.variable_scope('CNN_Layer1'): # Apply Convolution filtering on input sequence. @@ -58,7 +57,8 @@ def cnn_model(x, y): # Add a RELU for non linearity. conv1 = tf.nn.relu(conv1) # Max pooling across output of Convolution+Relu. - pool1 = tf.nn.max_pool(conv1, ksize=[1, POOLING_WINDOW, 1, 1], + pool1 = tf.nn.max_pool( + conv1, ksize=[1, POOLING_WINDOW, 1, 1], strides=[1, POOLING_STRIDE, 1, 1], padding='SAME') # Transpose matrix so that n_filters from convolution becomes width. pool1 = tf.transpose(pool1, [0, 1, 3, 2]) @@ -70,13 +70,16 @@ def cnn_model(x, y): pool2 = tf.squeeze(tf.reduce_max(conv2, 1), squeeze_dims=[1]) # Apply regular WX + B and classification. - prediction, loss = learn.models.logistic_regression(pool2, y) + logits = tf.contrib.layers.fully_connected(pool2, 15, activation_fn=None) + loss = tf.contrib.losses.softmax_cross_entropy(logits, target) train_op = tf.contrib.layers.optimize_loss( loss, tf.contrib.framework.get_global_step(), optimizer='Adam', learning_rate=0.01) - return {'class': tf.argmax(prediction, 1), 'prob': prediction}, loss, train_op + return ( + {'class': tf.argmax(logits, 1), 'prob': tf.nn.softmax(logits)}, + loss, train_op) def main(unused_argv): diff --git a/tensorflow/examples/skflow/BUILD b/tensorflow/examples/skflow/BUILD deleted file mode 100644 index e18e9b1c1c7..00000000000 --- a/tensorflow/examples/skflow/BUILD +++ /dev/null @@ -1,38 +0,0 @@ -# Example models (using skflow). - -package(default_visibility = ["//tensorflow:internal"]) - -licenses(["notice"]) # Apache 2.0 - -exports_files(["LICENSE"]) - -py_binary( - name = "mnist", - srcs = ["mnist.py"], - srcs_version = "PY2AND3", - deps = [ - "//tensorflow:tensorflow_py", - "//tensorflow/examples/tutorials/mnist:input_data", - ], -) - -py_binary( - name = "multiple_gpu", - srcs = ["multiple_gpu.py"], - srcs_version = "PY2AND3", - deps = [ - "//tensorflow:tensorflow_py", - ], -) - -filegroup( - name = "all_files", - srcs = glob( - ["**/*"], - exclude = [ - "**/METADATA", - "**/OWNERS", - ], - ), - visibility = ["//tensorflow:__subpackages__"], -) diff --git a/tensorflow/examples/skflow/mnist.py b/tensorflow/examples/skflow/mnist.py deleted file mode 100644 index e2b78883e4e..00000000000 --- a/tensorflow/examples/skflow/mnist.py +++ /dev/null @@ -1,82 +0,0 @@ -# Copyright 2016 The TensorFlow Authors. All Rights Reserved. 
-# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. - -"""This showcases how simple it is to build image classification networks. - -It follows description from this TensorFlow tutorial: - https://www.tensorflow.org/versions/master/tutorials/mnist/pros/index.html#deep-mnist-for-experts -""" - -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -from sklearn import metrics -import tensorflow as tf -from tensorflow.contrib import learn - -### Download and load MNIST data. - -mnist = learn.datasets.load_dataset('mnist') - -### Linear classifier. - -feature_columns = learn.infer_real_valued_columns_from_input(mnist.train.images) -classifier = learn.LinearClassifier( - feature_columns=feature_columns, n_classes=10) -classifier.fit(mnist.train.images, mnist.train.labels, batch_size=100, - steps=1000) -score = metrics.accuracy_score( - mnist.test.labels, classifier.predict(mnist.test.images)) -print('Accuracy: {0:f}'.format(score)) - -### Convolutional network - - -def max_pool_2x2(tensor_in): - return tf.nn.max_pool( - tensor_in, ksize=[1, 2, 2, 1], strides=[1, 2, 2, 1], padding='SAME') - - -def conv_model(X, y): - # pylint: disable=invalid-name,missing-docstring - # reshape X to 4d tensor with 2nd and 3rd dimensions being image width and - # height final dimension being the number of color channels. - X = tf.reshape(X, [-1, 28, 28, 1]) - # first conv layer will compute 32 features for each 5x5 patch - with tf.variable_scope('conv_layer1'): - h_conv1 = learn.ops.conv2d(X, n_filters=32, filter_shape=[5, 5], - bias=True, activation=tf.nn.relu) - h_pool1 = max_pool_2x2(h_conv1) - # second conv layer will compute 64 features for each 5x5 patch. - with tf.variable_scope('conv_layer2'): - h_conv2 = learn.ops.conv2d(h_pool1, n_filters=64, filter_shape=[5, 5], - bias=True, activation=tf.nn.relu) - h_pool2 = max_pool_2x2(h_conv2) - # reshape tensor into a batch of vectors - h_pool2_flat = tf.reshape(h_pool2, [-1, 7 * 7 * 64]) - # densely connected layer with 1024 neurons. - h_fc1 = tf.contrib.layers.dropout( - tf.contrib.layers.legacy_fully_connected( - h_pool2_flat, 1024, weight_init=None, activation_fn=tf.nn.relu)) - return learn.models.logistic_regression(h_fc1, y) - -# Training and predicting. -classifier = learn.TensorFlowEstimator( - model_fn=conv_model, n_classes=10, batch_size=100, steps=20000, - learning_rate=0.001) -classifier.fit(mnist.train.images, mnist.train.labels) -score = metrics.accuracy_score( - mnist.test.labels, classifier.predict(mnist.test.images)) -print('Accuracy: {0:f}'.format(score)) diff --git a/tensorflow/examples/skflow/multiple_gpu.py b/tensorflow/examples/skflow/multiple_gpu.py deleted file mode 100644 index 5bb647e54ee..00000000000 --- a/tensorflow/examples/skflow/multiple_gpu.py +++ /dev/null @@ -1,44 +0,0 @@ -# Copyright 2016 The TensorFlow Authors. All Rights Reserved. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. 
-# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -from sklearn import datasets, metrics, cross_validation -import tensorflow as tf -from tensorflow.contrib import learn - -iris = datasets.load_iris() -X_train, X_test, y_train, y_test = cross_validation.train_test_split(iris.data, iris.target, - test_size=0.2, random_state=42) - -def my_model(X, y): - """ - This is DNN with 10, 20, 10 hidden layers, and dropout of 0.5 probability. - - Note: If you want to run this example with multiple GPUs, Cuda Toolkit 7.0 and - CUDNN 6.5 V2 from NVIDIA need to be installed beforehand. - """ - with tf.device('/gpu:1'): - dnn = lambda inputs, num_outputs, scope: tf.contrib.layers.dropout( - tf.contrib.layers.legacy_fully_connected( - inputs, num_outputs, weight_init=None, activation_fn=tf.nn.relu)) - layers = tf.contrib.layers.stack(X, dnn, [10, 20, 10]) - with tf.device('/gpu:2'): - return learn.models.logistic_regression(layers, y) - -classifier = learn.TensorFlowEstimator(model_fn=my_model, n_classes=3) -classifier.fit(X_train, y_train) -score = metrics.accuracy_score(y_test, classifier.predict(X_test)) -print('Accuracy: {0:f}'.format(score)) diff --git a/tensorflow/g3doc/api_docs/cc/ClassEnv.md b/tensorflow/g3doc/api_docs/cc/ClassEnv.md index 0010c0fbb23..88a39a5ee86 100644 --- a/tensorflow/g3doc/api_docs/cc/ClassEnv.md +++ b/tensorflow/g3doc/api_docs/cc/ClassEnv.md @@ -90,6 +90,24 @@ Stores in *result the names of the children of the specified directory. The name Original contents of *results are dropped. +#### `virtual bool tensorflow::Env::MatchPath(const string &path, const string &pattern)=0` {#virtual_bool_tensorflow_Env_MatchPath} + +Returns true if the path matches the given pattern. The wildcards allowed in pattern are described below (GetMatchingPaths). + + + +#### `Status tensorflow::Env::GetMatchingPaths(const string &pattern, std::vector< string > *results)` {#Status_tensorflow_Env_GetMatchingPaths} + +Given a pattern, stores in *results the set of paths that match that pattern. *results is cleared. + +pattern must match all of a name, not just a substring. The pattern grammar is: +
+    pattern: { term }
+    term:
+      '*': matches any sequence of non-'/' characters
+      '?': matches a single non-'/' character
+      '[' [ '^' ] { match-list } ']': matches any single character (not) on the list
+      c: matches character c (c != '*', '?', '\', '[')
+      '\' c: matches character c
+    character-range:
+      c: matches character c (c != '\', '-', ']')
+      '\' c: matches character c
+      lo '-' hi: matches character c for lo <= c <= hi
+ +Typical return codes + +OK - no errors + +UNIMPLEMENTED - Some underlying functions (like GetChildren) are not implemented. The default implementation uses a combination of GetChildren, MatchPath and IsDirectory. + #### `Status tensorflow::Env::DeleteFile(const string &fname)` {#Status_tensorflow_Env_DeleteFile} Deletes the named file.
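As a minimal sketch of the pattern semantics documented above (not part of this change): the same matching is reachable from Python through `gfile.Glob`, the wrapper that `retrain.py` switches to earlier in this diff. The temporary file names below are invented for the example.

```python
# Exercise the '*' and '?' wildcards described for GetMatchingPaths
# through the Python-side gfile.Glob wrapper.
import os
import tempfile

from tensorflow.python.platform import gfile

tmp = tempfile.mkdtemp()
for name in ('a.jpg', 'b.jpg', 'c.png'):
  open(os.path.join(tmp, name), 'w').close()

print(gfile.Glob(os.path.join(tmp, '*.jpg')))  # matches a.jpg and b.jpg
print(gfile.Glob(os.path.join(tmp, '?.png')))  # matches the single c.png
```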
@@ -110,12 +128,28 @@ PERMISSION_DENIED - dirname or some descendant is not writable UNIMPLEMENTED - Some underlying functions (like Delete) are not implemented +#### `Status tensorflow::Env::RecursivelyCreateDir(const string &dirname)` {#Status_tensorflow_Env_RecursivelyCreateDir} + +Creates the specified directory and all the necessary subdirectories. Typical return codes. + + + +OK - successfully created the directory and sub directories, even if they were already created. + +PERMISSION_DENIED - dirname or some subdirectory is not writable. + #### `Status tensorflow::Env::CreateDir(const string &dirname)` {#Status_tensorflow_Env_CreateDir} -Creates the specified directory. +Creates the specified directory. Typical return codes. +OK - successfully created the directory. + +ALREADY_EXISTS - directory already exists. + +PERMISSION_DENIED - dirname is not writable. + #### `Status tensorflow::Env::DeleteDir(const string &dirname)` {#Status_tensorflow_Env_DeleteDir} Deletes the specified directory. diff --git a/tensorflow/g3doc/api_docs/cc/ClassEnvWrapper.md b/tensorflow/g3doc/api_docs/cc/ClassEnvWrapper.md index f0041f5be92..153dc8ca361 100644 --- a/tensorflow/g3doc/api_docs/cc/ClassEnvWrapper.md +++ b/tensorflow/g3doc/api_docs/cc/ClassEnvWrapper.md @@ -42,6 +42,12 @@ Returns the file system schemes registered for this Env . +#### `bool tensorflow::EnvWrapper::MatchPath(const string &path, const string &pattern) override` {#bool_tensorflow_EnvWrapper_MatchPath} + +Returns true if the path matches the given pattern. The wildcards allowed in pattern are described below (GetMatchingPaths). + + + #### `uint64 tensorflow::EnvWrapper::NowMicros() override` {#uint64_tensorflow_EnvWrapper_NowMicros} Returns the number of micro-seconds since some fixed point in time. Only useful for computing deltas of time. diff --git a/tensorflow/g3doc/api_docs/cc/ClassTensor.md b/tensorflow/g3doc/api_docs/cc/ClassTensor.md index e221a026935..b909bffe3a5 100644 --- a/tensorflow/g3doc/api_docs/cc/ClassTensor.md +++ b/tensorflow/g3doc/api_docs/cc/ClassTensor.md @@ -100,12 +100,6 @@ Convenience accessor for the tensor shape. -#### `size_t tensorflow::Tensor::BufferHash() const` {#size_t_tensorflow_Tensor_BufferHash} - - - - - #### `bool tensorflow::Tensor::IsInitialized() const` {#bool_tensorflow_Tensor_IsInitialized} If necessary, has this Tensor been initialized? @@ -379,7 +373,7 @@ NOTE: The underlying tensor buffer is refcounted, so the lifetime of the content REQUIRES: `DataTypeCanUseMemcpy(dtype())`. -#### `void tensorflow::Tensor::UnsafeCopyFromInternal(const Tensor &, const TensorShape &)` {#void_tensorflow_Tensor_UnsafeCopyFromInternal} +#### `void tensorflow::Tensor::UnsafeCopyFromInternal(const Tensor &, DataType dtype, const TensorShape &)` {#void_tensorflow_Tensor_UnsafeCopyFromInternal} diff --git a/tensorflow/g3doc/api_docs/python/array_ops.md b/tensorflow/g3doc/api_docs/python/array_ops.md index adc18589110..83176a7d193 100644 --- a/tensorflow/g3doc/api_docs/python/array_ops.md +++ b/tensorflow/g3doc/api_docs/python/array_ops.md @@ -2240,6 +2240,92 @@ count ==> [2, 1, 3, 1, 2] * `count`: A `Tensor` of type `out_idx`. 1-D. +- - - + +### `tf.scatter_nd(indices, updates, shape, name=None)` {#scatter_nd} + +Creates a new tensor by applying sparse `updates` to individual values or slices within a zero tensor of the given `shape` tensor according to indices. + +This operator is the inverse of the [tf.gather_nd](#gather_nd) operator which extracts values or slices from a given tensor. 
+ +TODO(simister): Add a link to Variable.__getitem__ documentation on slice syntax. + +`shape` is a `TensorShape` with rank `P` and `indices` is a `Tensor` of rank `Q`. + +`indices` must be an integer tensor, containing indices into `shape`. +It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`. + +The innermost dimension of `indices` (with length `K`) corresponds to +indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th +dimension of `shape`. + +`updates` is a `Tensor` of rank `Q-1+P-K` with shape: + +``` +[d_0, ..., d_{Q-2}, shape[K], ..., shape[P-1]]. +``` + +The simplest form of scatter is to insert individual elements in a tensor by index. For example, say we want to insert 4 scattered elements in a rank-1 tensor with 8 elements.
+ +
+ +In Python, this scatter operation would look like this: + + indices = tf.constant([[4], [3], [1], [7]]) + updates = tf.constant([9, 10, 11, 12]) + shape = tf.constant([8]) + scatter = tf.scatter_nd(indices, updates, shape) + with tf.Session() as sess: + print sess.run(scatter) + +The resulting tensor would look like this: + + [0, 11, 0, 10, 9, 0, 0, 12] + +We can also insert entire slices of a higher rank tensor all at once. For example, suppose we want to insert two slices in the first dimension of a rank-3 tensor with two matrices of new values.
+ +
+ +In Python, this scatter operation would look like this: + + indices = tf.constant([[0], [2]]) + updates = tf.constant([[[5, 5, 5, 5], [6, 6, 6, 6], + [7, 7, 7, 7], [8, 8, 8, 8]], + [[5, 5, 5, 5], [6, 6, 6, 6], + [7, 7, 7, 7], [8, 8, 8, 8]]]) + shape = tf.constant([4, 4, 4]) + scatter = tf.scatter_nd(indices, updates, shape) + with tf.Session() as sess: + print sess.run(scatter) + +The resulting tensor would look like this: + + [[[5, 5, 5, 5], [6, 6, 6, 6], [7, 7, 7, 7], [8, 8, 8, 8]], + [[0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0]], + [[5, 5, 5, 5], [6, 6, 6, 6], [7, 7, 7, 7], [8, 8, 8, 8]], + [[0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0]]] + +##### Args: + + +* `indices`: A `Tensor`. Must be one of the following types: `int32`, `int64`. + A tensor of indices into the output tensor. +* `updates`: A `Tensor`. + A tensor of updated values to store at the given indices. +* `shape`: A `Tensor`. Must have the same type as `indices`. + A vector. The shape of the resulting tensor. +* `name`: A name for the operation (optional). + +##### Returns: + + A `Tensor`. Has the same type as `updates`. + A new tensor with the given shape and updates applied according to the indices. + + - - - ### `tf.dynamic_partition(data, partitions, num_partitions, name=None)` {#dynamic_partition} @@ -2758,3 +2844,175 @@ Returns the difference between the `x` and `y` treated as sets. A `Tensor` that is of type `index_dtype` representing indices from . + +## Fake quantization +Operations used to help train for better quantization accuracy. + +- - - + +### `tf.fake_quant_with_min_max_args(inputs, min=None, max=None, name=None)` {#fake_quant_with_min_max_args} + +Fake-quantize the 'inputs' tensor (of type float) to an 'outputs' tensor of the same type. + +Attributes [min; max] define the clamping range for the 'inputs' data. Op +divides this range into 255 steps (total of 256 values), then replaces each +'inputs' value with the closest of the quantized step values. + +Quantization is called fake since the output is still in floating point. + +##### Args: + + +* `inputs`: A `Tensor` of type `float32`. +* `min`: An optional `float`. Defaults to `-6`. +* `max`: An optional `float`. Defaults to `6`. +* `name`: A name for the operation (optional). + +##### Returns: + + A `Tensor` of type `float32`. + + +- - - + +### `tf.fake_quant_with_min_max_args_gradient(gradients, inputs, min=None, max=None, name=None)` {#fake_quant_with_min_max_args_gradient} + +Compute gradients for a FakeQuantWithMinMaxArgs operation. + +##### Args: + + +* `gradients`: A `Tensor` of type `float32`. + Backpropagated gradients above the FakeQuantWithMinMaxArgs operation. +* `inputs`: A `Tensor` of type `float32`. + Values passed as inputs to the FakeQuantWithMinMaxArgs operation. +* `min`: An optional `float`. Defaults to `-6`. +* `max`: An optional `float`. Defaults to `6`. +* `name`: A name for the operation (optional). + +##### Returns: + + A `Tensor` of type `float32`. + Backpropagated gradients below the FakeQuantWithMinMaxArgs operation: + `gradients * (inputs >= min && inputs <= max)`. + + +- - - + +### `tf.fake_quant_with_min_max_vars(inputs, min, max, name=None)` {#fake_quant_with_min_max_vars} + +Fake-quantize the 'inputs' tensor of type float and shape `[b, h, w, d]` via + +global float scalars `min` and `max` to 'outputs' tensor of same shape as +`inputs`. + +[min; max] is the clamping range for the 'inputs' data.
Op divides this range +into 255 steps (total of 256 values), then replaces each 'inputs' value with the +closest of the quantized step values. + +This operation has a gradient and thus allows for training `min` and `max` values. + +##### Args: + + +* `inputs`: A `Tensor` of type `float32`. +* `min`: A `Tensor` of type `float32`. +* `max`: A `Tensor` of type `float32`. +* `name`: A name for the operation (optional). + +##### Returns: + + A `Tensor` of type `float32`. + + +- - - + +### `tf.fake_quant_with_min_max_vars_gradient(gradients, inputs, min, max, name=None)` {#fake_quant_with_min_max_vars_gradient} + +Compute gradients for a FakeQuantWithMinMaxVars operation. + +##### Args: + + +* `gradients`: A `Tensor` of type `float32`. + Backpropagated gradients above the FakeQuantWithMinMaxVars operation. +* `inputs`: A `Tensor` of type `float32`. + Values passed as inputs to the FakeQuantWithMinMaxVars operation. + min, max: Quantization interval, scalar floats. +* `min`: A `Tensor` of type `float32`. +* `max`: A `Tensor` of type `float32`. +* `name`: A name for the operation (optional). + +##### Returns: + + A tuple of `Tensor` objects (backprops_wrt_input, backprop_wrt_min, backprop_wrt_max). + +* `backprops_wrt_input`: A `Tensor` of type `float32`. Backpropagated gradients w.r.t. inputs: + `gradients * (inputs >= min && inputs <= max)`. +* `backprop_wrt_min`: A `Tensor` of type `float32`. Backpropagated gradients w.r.t. min parameter: + `sum(gradients * (inputs < min))`. +* `backprop_wrt_max`: A `Tensor` of type `float32`. Backpropagated gradients w.r.t. max parameter: + `sum(gradients * (inputs > max))`. + + +- - - + +### `tf.fake_quant_with_min_max_vars_per_channel(inputs, min, max, name=None)` {#fake_quant_with_min_max_vars_per_channel} + +Fake-quantize the 'inputs' tensor of type float and one of the shapes: `[d]`, + +`[b, d]` `[b, h, w, d]` via per-channel floats `min` and `max` of shape `[d]` +to 'outputs' tensor of same shape as `inputs`. + +[min; max] is the clamping range for the 'inputs' data in the corresponding +depth channel. Op divides this range into 255 steps (total of 256 values), then +replaces each 'inputs' value with the closest of the quantized step values. + +This operation has a gradient and thus allows for training `min` and `max` values. + +##### Args: + + +* `inputs`: A `Tensor` of type `float32`. +* `min`: A `Tensor` of type `float32`. +* `max`: A `Tensor` of type `float32`. +* `name`: A name for the operation (optional). + +##### Returns: + + A `Tensor` of type `float32`. + + +- - - + +### `tf.fake_quant_with_min_max_vars_per_channel_gradient(gradients, inputs, min, max, name=None)` {#fake_quant_with_min_max_vars_per_channel_gradient} + +Compute gradients for a FakeQuantWithMinMaxVarsPerChannel operation. + +##### Args: + + +* `gradients`: A `Tensor` of type `float32`. + Backpropagated gradients above the FakeQuantWithMinMaxVars operation, + shape one of: `[d]`, `[b, d]`, `[b, h, w, d]`. +* `inputs`: A `Tensor` of type `float32`. + Values passed as inputs to the FakeQuantWithMinMaxVars operation, shape + same as `gradients`. + min, max: Quantization interval, floats of shape `[d]`. +* `min`: A `Tensor` of type `float32`. +* `max`: A `Tensor` of type `float32`. +* `name`: A name for the operation (optional). + +##### Returns: + + A tuple of `Tensor` objects (backprops_wrt_input, backprop_wrt_min, backprop_wrt_max). + +* `backprops_wrt_input`: A `Tensor` of type `float32`. Backpropagated gradients w.r.t. 
inputs, shape same as + `inputs`: + `gradients * (inputs >= min && inputs <= max)`. +* `backprop_wrt_min`: A `Tensor` of type `float32`. Backpropagated gradients w.r.t. min parameter, shape `[d]`: + `sum_per_d(gradients * (inputs < min))`. +* `backprop_wrt_max`: A `Tensor` of type `float32`. Backpropagated gradients w.r.t. max parameter, shape `[d]`: + `sum_per_d(gradients * (inputs > max))`. + + diff --git a/tensorflow/g3doc/api_docs/python/contrib.bayesflow.stochastic_tensor.md b/tensorflow/g3doc/api_docs/python/contrib.bayesflow.stochastic_tensor.md index 98881fc13ad..04f2e5ae7e6 100644 --- a/tensorflow/g3doc/api_docs/python/contrib.bayesflow.stochastic_tensor.md +++ b/tensorflow/g3doc/api_docs/python/contrib.bayesflow.stochastic_tensor.md @@ -41,13 +41,6 @@ Base Class for Tensor-like objects that emit stochastic values. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BaseStochasticTensor.input_dict` {#BaseStochasticTensor.input_dict} - - - - - - - #### `tf.contrib.bayesflow.stochastic_tensor.BaseStochasticTensor.loss(sample_loss)` {#BaseStochasticTensor.loss} @@ -92,14 +85,14 @@ constant with respect to the input for purposes of the gradient. StochasticTensor is a BaseStochasticTensor backed by a distribution. - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.__init__(dist_cls, name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#StochasticTensor.__init__} +#### `tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.__init__(dist, name='StochasticTensor', dist_value_type=None, loss_fn=score_function)` {#StochasticTensor.__init__} Construct a `StochasticTensor`. -`StochasticTensor` will instantiate a distribution from `dist_cls` and -`dist_args` and its `value` method will return the same value each time -it is called. What `value` is returned is controlled by the -`dist_value_type` (defaults to `SampleAndReshapeValue`). +`StochasticTensor` is backed by the `dist` distribution and its `value` +method will return the same value each time it is called. What `value` is +returned is controlled by the `dist_value_type` (defaults to +`SampleAndReshapeValue`). Some distributions' sample functions are not differentiable (e.g. a sample from a discrete distribution like a Bernoulli) and so to differentiate @@ -117,34 +110,26 @@ reparameterized distributions; it will also return None if the value type is ##### Args: -* `dist_cls`: a `Distribution` class. +* `dist`: an instance of `Distribution`. * `name`: a name for this `StochasticTensor` and its ops. * `dist_value_type`: a `_StochasticValueType`, which will determine what the `value` of this `StochasticTensor` will be. If not provided, the value type set with the `value_type` context manager will be used. -* `loss_fn`: callable that takes `(st, st.value(), influenced_loss)`, where +* `loss_fn`: callable that takes + `(st, st.value(), influenced_loss)`, where `st` is this `StochasticTensor`, and returns a `Tensor` loss. By default, `loss_fn` is the `score_function`, or more precisely, the integral of the score function, such that when the gradient is taken, the score function results. See the `stochastic_gradient_estimators` module for additional loss functions and baselines. -* `**dist_args`: keyword arguments to be passed through to `dist_cls` on - construction. ##### Raises: -* `TypeError`: if `dist_cls` is not a `Distribution`. +* `TypeError`: if `dist` is not an instance of `Distribution`. * `TypeError`: if `loss_fn` is not `callable`. 
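A short sketch of the constructor change above: a constructed `Distribution` instance is now passed in, rather than a distribution class plus `**dist_args`. This is illustrative only; the `Normal(mu=..., sigma=...)` arguments and module paths assume the contrib API of this release.

```python
# Before: sg.StochasticTensor(distributions.Normal, mu=mu, sigma=sigma)
# After: construct the distribution first and pass the instance directly.
import tensorflow as tf
from tensorflow.contrib import distributions
from tensorflow.contrib.bayesflow import stochastic_tensor as sg

mu = tf.zeros([2, 3])
sigma = tf.ones([2, 3])
st = sg.StochasticTensor(distributions.Normal(mu=mu, sigma=sigma))

with tf.Session() as sess:
  # With the default SampleAndReshapeValue type, value() has the batch shape.
  print(sess.run(st.value()).shape)  # (2, 3)
```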
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.clone(name=None, **dist_args)` {#StochasticTensor.clone} - - - - - - - #### `tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.distribution` {#StochasticTensor.distribution} @@ -173,13 +158,6 @@ reparameterized distributions; it will also return None if the value type is -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.input_dict` {#StochasticTensor.input_dict} - - - - - - - #### `tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.loss(final_loss, name='Loss')` {#StochasticTensor.loss} @@ -359,8 +337,8 @@ with sg.value_type(sg.SampleAndReshapeValue(n=2)): st_value = st.value() assertEqual(st_value.get_shape(), (4, 3)) -dt_value_val = sess.run([st_value])[0] # or e.g. run([tf.identity(st)])[0] -assertEqual(dt_value_val.shape, (4, 3)) +st_value_val = sess.run([st_value])[0] # or e.g. run([tf.identity(st)])[0] +assertEqual(st_value_val.shape, (4, 3)) ``` - - - @@ -458,3340 +436,6 @@ in a `stop_gradients` call to disable any possible backpropagation. - -## Automatically Generated StochasticTensors - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor` {#BernoulliTensor} - -`BernoulliTensor` is a `StochasticTensor` backed by the distribution `Bernoulli`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#BernoulliTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.clone(name=None, **dist_args)` {#BernoulliTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.distribution` {#BernoulliTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.dtype` {#BernoulliTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.entropy(name='entropy')` {#BernoulliTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.graph` {#BernoulliTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.input_dict` {#BernoulliTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.loss(final_loss, name='Loss')` {#BernoulliTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.mean(name='mean')` {#BernoulliTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.name` {#BernoulliTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.value(name='value')` {#BernoulliTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.value_type` {#BernoulliTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor` {#BernoulliWithSigmoidPTensor} - -`BernoulliWithSigmoidPTensor` is a `StochasticTensor` backed by the distribution `BernoulliWithSigmoidP`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#BernoulliWithSigmoidPTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.clone(name=None, **dist_args)` {#BernoulliWithSigmoidPTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.distribution` {#BernoulliWithSigmoidPTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.dtype` {#BernoulliWithSigmoidPTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.entropy(name='entropy')` {#BernoulliWithSigmoidPTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.graph` {#BernoulliWithSigmoidPTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.input_dict` {#BernoulliWithSigmoidPTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.loss(final_loss, name='Loss')` {#BernoulliWithSigmoidPTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.mean(name='mean')` {#BernoulliWithSigmoidPTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.name` {#BernoulliWithSigmoidPTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.value(name='value')` {#BernoulliWithSigmoidPTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.value_type` {#BernoulliWithSigmoidPTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.BetaTensor` {#BetaTensor} - -`BetaTensor` is a `StochasticTensor` backed by the distribution `Beta`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#BetaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.clone(name=None, **dist_args)` {#BetaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.distribution` {#BetaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.dtype` {#BetaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.entropy(name='entropy')` {#BetaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.graph` {#BetaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.input_dict` {#BetaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.loss(final_loss, name='Loss')` {#BetaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.mean(name='mean')` {#BetaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.name` {#BetaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.value(name='value')` {#BetaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.value_type` {#BetaTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor` {#BetaWithSoftplusABTensor} - -`BetaWithSoftplusABTensor` is a `StochasticTensor` backed by the distribution `BetaWithSoftplusAB`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#BetaWithSoftplusABTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.clone(name=None, **dist_args)` {#BetaWithSoftplusABTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.distribution` {#BetaWithSoftplusABTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.dtype` {#BetaWithSoftplusABTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.entropy(name='entropy')` {#BetaWithSoftplusABTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.graph` {#BetaWithSoftplusABTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.input_dict` {#BetaWithSoftplusABTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.loss(final_loss, name='Loss')` {#BetaWithSoftplusABTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.mean(name='mean')` {#BetaWithSoftplusABTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.name` {#BetaWithSoftplusABTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.value(name='value')` {#BetaWithSoftplusABTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.value_type` {#BetaWithSoftplusABTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.BinomialTensor` {#BinomialTensor} - -`BinomialTensor` is a `StochasticTensor` backed by the distribution 
`Binomial`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#BinomialTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.clone(name=None, **dist_args)` {#BinomialTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.distribution` {#BinomialTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.dtype` {#BinomialTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.entropy(name='entropy')` {#BinomialTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.graph` {#BinomialTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.input_dict` {#BinomialTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.loss(final_loss, name='Loss')` {#BinomialTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.mean(name='mean')` {#BinomialTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.name` {#BinomialTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.value(name='value')` {#BinomialTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.value_type` {#BinomialTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor` {#CategoricalTensor} - -`CategoricalTensor` is a `StochasticTensor` backed by the distribution `Categorical`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#CategoricalTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.clone(name=None, **dist_args)` {#CategoricalTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.distribution` {#CategoricalTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.dtype` {#CategoricalTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.entropy(name='entropy')` {#CategoricalTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.graph` {#CategoricalTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.input_dict` {#CategoricalTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.loss(final_loss, name='Loss')` {#CategoricalTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.mean(name='mean')` {#CategoricalTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.name` {#CategoricalTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.value(name='value')` {#CategoricalTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.value_type` {#CategoricalTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor` {#Chi2Tensor} - -`Chi2Tensor` is a `StochasticTensor` backed by the distribution `Chi2`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#Chi2Tensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.clone(name=None, **dist_args)` {#Chi2Tensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.distribution` {#Chi2Tensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.dtype` {#Chi2Tensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.entropy(name='entropy')` {#Chi2Tensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.graph` {#Chi2Tensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.input_dict` {#Chi2Tensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.loss(final_loss, name='Loss')` {#Chi2Tensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.mean(name='mean')` {#Chi2Tensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.name` {#Chi2Tensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.value(name='value')` {#Chi2Tensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.value_type` {#Chi2Tensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor` {#Chi2WithAbsDfTensor} - -`Chi2WithAbsDfTensor` is a `StochasticTensor` backed by the distribution `Chi2WithAbsDf`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#Chi2WithAbsDfTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.clone(name=None, **dist_args)` {#Chi2WithAbsDfTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.distribution` {#Chi2WithAbsDfTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.dtype` {#Chi2WithAbsDfTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.entropy(name='entropy')` {#Chi2WithAbsDfTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.graph` {#Chi2WithAbsDfTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.input_dict` {#Chi2WithAbsDfTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.loss(final_loss, name='Loss')` {#Chi2WithAbsDfTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.mean(name='mean')` {#Chi2WithAbsDfTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.name` {#Chi2WithAbsDfTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.value(name='value')` {#Chi2WithAbsDfTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.value_type` {#Chi2WithAbsDfTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.DirichletTensor` {#DirichletTensor} - -`DirichletTensor` is a `StochasticTensor` backed by the distribution `Dirichlet`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#DirichletTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.clone(name=None, **dist_args)` {#DirichletTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.distribution` {#DirichletTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.dtype` {#DirichletTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.entropy(name='entropy')` {#DirichletTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.graph` {#DirichletTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.input_dict` {#DirichletTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.loss(final_loss, name='Loss')` {#DirichletTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.mean(name='mean')` {#DirichletTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.name` {#DirichletTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.value(name='value')` {#DirichletTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.value_type` {#DirichletTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor` {#DirichletMultinomialTensor} - -`DirichletMultinomialTensor` is a `StochasticTensor` backed by the distribution `DirichletMultinomial`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#DirichletMultinomialTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.clone(name=None, **dist_args)` {#DirichletMultinomialTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.distribution` {#DirichletMultinomialTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.dtype` {#DirichletMultinomialTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.entropy(name='entropy')` {#DirichletMultinomialTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.graph` {#DirichletMultinomialTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.input_dict` {#DirichletMultinomialTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.loss(final_loss, name='Loss')` {#DirichletMultinomialTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.mean(name='mean')` {#DirichletMultinomialTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.name` {#DirichletMultinomialTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.value(name='value')` {#DirichletMultinomialTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.value_type` {#DirichletMultinomialTensor.value_type} - - - - 
- -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor` {#ExponentialTensor} - -`ExponentialTensor` is a `StochasticTensor` backed by the distribution `Exponential`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#ExponentialTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.clone(name=None, **dist_args)` {#ExponentialTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.distribution` {#ExponentialTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.dtype` {#ExponentialTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.entropy(name='entropy')` {#ExponentialTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.graph` {#ExponentialTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.input_dict` {#ExponentialTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.loss(final_loss, name='Loss')` {#ExponentialTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.mean(name='mean')` {#ExponentialTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.name` {#ExponentialTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.value(name='value')` {#ExponentialTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.value_type` {#ExponentialTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor` {#ExponentialWithSoftplusLamTensor} - -`ExponentialWithSoftplusLamTensor` is a `StochasticTensor` backed by the distribution `ExponentialWithSoftplusLam`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#ExponentialWithSoftplusLamTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.clone(name=None, **dist_args)` {#ExponentialWithSoftplusLamTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.distribution` {#ExponentialWithSoftplusLamTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.dtype` {#ExponentialWithSoftplusLamTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.entropy(name='entropy')` {#ExponentialWithSoftplusLamTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.graph` {#ExponentialWithSoftplusLamTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.input_dict` {#ExponentialWithSoftplusLamTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.loss(final_loss, name='Loss')` {#ExponentialWithSoftplusLamTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.mean(name='mean')` {#ExponentialWithSoftplusLamTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.name` {#ExponentialWithSoftplusLamTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.value(name='value')` {#ExponentialWithSoftplusLamTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.value_type` {#ExponentialWithSoftplusLamTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.GammaTensor` {#GammaTensor} - -`GammaTensor` is a `StochasticTensor` backed by the distribution `Gamma`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#GammaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.clone(name=None, **dist_args)` {#GammaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.distribution` {#GammaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.dtype` {#GammaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.entropy(name='entropy')` {#GammaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.graph` {#GammaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.input_dict` {#GammaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.loss(final_loss, name='Loss')` {#GammaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.mean(name='mean')` {#GammaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.name` {#GammaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.value(name='value')` {#GammaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.value_type` {#GammaTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor` {#GammaWithSoftplusAlphaBetaTensor} - -`GammaWithSoftplusAlphaBetaTensor` is a `StochasticTensor` backed by the distribution `GammaWithSoftplusAlphaBeta`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#GammaWithSoftplusAlphaBetaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.clone(name=None, **dist_args)` {#GammaWithSoftplusAlphaBetaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.distribution` {#GammaWithSoftplusAlphaBetaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.dtype` {#GammaWithSoftplusAlphaBetaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.entropy(name='entropy')` {#GammaWithSoftplusAlphaBetaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.graph` {#GammaWithSoftplusAlphaBetaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.input_dict` {#GammaWithSoftplusAlphaBetaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.loss(final_loss, name='Loss')` {#GammaWithSoftplusAlphaBetaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.mean(name='mean')` {#GammaWithSoftplusAlphaBetaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.name` {#GammaWithSoftplusAlphaBetaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.value(name='value')` {#GammaWithSoftplusAlphaBetaTensor.value} - - - - -- - - - -#### 
`tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.value_type` {#GammaWithSoftplusAlphaBetaTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor` {#InverseGammaTensor} - -`InverseGammaTensor` is a `StochasticTensor` backed by the distribution `InverseGamma`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#InverseGammaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.clone(name=None, **dist_args)` {#InverseGammaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.distribution` {#InverseGammaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.dtype` {#InverseGammaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.entropy(name='entropy')` {#InverseGammaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.graph` {#InverseGammaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.input_dict` {#InverseGammaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.loss(final_loss, name='Loss')` {#InverseGammaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.mean(name='mean')` {#InverseGammaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.name` {#InverseGammaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.value(name='value')` {#InverseGammaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.value_type` {#InverseGammaTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor` {#InverseGammaWithSoftplusAlphaBetaTensor} - -`InverseGammaWithSoftplusAlphaBetaTensor` is a `StochasticTensor` backed by the distribution `InverseGammaWithSoftplusAlphaBeta`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#InverseGammaWithSoftplusAlphaBetaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.clone(name=None, **dist_args)` {#InverseGammaWithSoftplusAlphaBetaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.distribution` {#InverseGammaWithSoftplusAlphaBetaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.dtype` {#InverseGammaWithSoftplusAlphaBetaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.entropy(name='entropy')` {#InverseGammaWithSoftplusAlphaBetaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.graph` {#InverseGammaWithSoftplusAlphaBetaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.input_dict` {#InverseGammaWithSoftplusAlphaBetaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.loss(final_loss, name='Loss')` {#InverseGammaWithSoftplusAlphaBetaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.mean(name='mean')` {#InverseGammaWithSoftplusAlphaBetaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.name` {#InverseGammaWithSoftplusAlphaBetaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.value(name='value')` {#InverseGammaWithSoftplusAlphaBetaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.value_type` {#InverseGammaWithSoftplusAlphaBetaTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor` {#LaplaceTensor} - -`LaplaceTensor` is a `StochasticTensor` backed by the distribution `Laplace`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#LaplaceTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.clone(name=None, **dist_args)` {#LaplaceTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.distribution` {#LaplaceTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.dtype` {#LaplaceTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.entropy(name='entropy')` {#LaplaceTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.graph` {#LaplaceTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.input_dict` {#LaplaceTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.loss(final_loss, name='Loss')` {#LaplaceTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.mean(name='mean')` {#LaplaceTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.name` {#LaplaceTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.value(name='value')` {#LaplaceTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.value_type` {#LaplaceTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor` {#LaplaceWithSoftplusScaleTensor} - -`LaplaceWithSoftplusScaleTensor` is a `StochasticTensor` backed by the distribution `LaplaceWithSoftplusScale`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#LaplaceWithSoftplusScaleTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.clone(name=None, **dist_args)` {#LaplaceWithSoftplusScaleTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.distribution` {#LaplaceWithSoftplusScaleTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.dtype` {#LaplaceWithSoftplusScaleTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.entropy(name='entropy')` {#LaplaceWithSoftplusScaleTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.graph` {#LaplaceWithSoftplusScaleTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.input_dict` {#LaplaceWithSoftplusScaleTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.loss(final_loss, name='Loss')` {#LaplaceWithSoftplusScaleTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.mean(name='mean')` {#LaplaceWithSoftplusScaleTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.name` {#LaplaceWithSoftplusScaleTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.value(name='value')` {#LaplaceWithSoftplusScaleTensor.value} - - - - -- - - - -#### 
`tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.value_type` {#LaplaceWithSoftplusScaleTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.MixtureTensor` {#MixtureTensor} - -`MixtureTensor` is a `StochasticTensor` backed by the distribution `Mixture`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MixtureTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.clone(name=None, **dist_args)` {#MixtureTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.distribution` {#MixtureTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.dtype` {#MixtureTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.entropy(name='entropy')` {#MixtureTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.graph` {#MixtureTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.input_dict` {#MixtureTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.loss(final_loss, name='Loss')` {#MixtureTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.mean(name='mean')` {#MixtureTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.name` {#MixtureTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.value(name='value')` {#MixtureTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.value_type` {#MixtureTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor` {#MultinomialTensor} - -`MultinomialTensor` is a `StochasticTensor` backed by the distribution `Multinomial`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MultinomialTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.clone(name=None, **dist_args)` {#MultinomialTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.distribution` {#MultinomialTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.dtype` {#MultinomialTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.entropy(name='entropy')` {#MultinomialTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.graph` {#MultinomialTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.input_dict` {#MultinomialTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.loss(final_loss, name='Loss')` {#MultinomialTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.mean(name='mean')` {#MultinomialTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.name` {#MultinomialTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.value(name='value')` {#MultinomialTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.value_type` {#MultinomialTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor` {#MultivariateNormalCholeskyTensor} - -`MultivariateNormalCholeskyTensor` is a `StochasticTensor` backed by the distribution `MultivariateNormalCholesky`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MultivariateNormalCholeskyTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.clone(name=None, **dist_args)` {#MultivariateNormalCholeskyTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.distribution` {#MultivariateNormalCholeskyTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.dtype` {#MultivariateNormalCholeskyTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.entropy(name='entropy')` {#MultivariateNormalCholeskyTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.graph` {#MultivariateNormalCholeskyTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.input_dict` {#MultivariateNormalCholeskyTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.loss(final_loss, name='Loss')` {#MultivariateNormalCholeskyTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.mean(name='mean')` {#MultivariateNormalCholeskyTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.name` {#MultivariateNormalCholeskyTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.value(name='value')` {#MultivariateNormalCholeskyTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.value_type` {#MultivariateNormalCholeskyTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor` {#MultivariateNormalDiagTensor} - -`MultivariateNormalDiagTensor` is a `StochasticTensor` backed by the distribution `MultivariateNormalDiag`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MultivariateNormalDiagTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.clone(name=None, **dist_args)` {#MultivariateNormalDiagTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.distribution` {#MultivariateNormalDiagTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.dtype` {#MultivariateNormalDiagTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.entropy(name='entropy')` {#MultivariateNormalDiagTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.graph` {#MultivariateNormalDiagTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.input_dict` {#MultivariateNormalDiagTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.loss(final_loss, name='Loss')` {#MultivariateNormalDiagTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.mean(name='mean')` {#MultivariateNormalDiagTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.name` {#MultivariateNormalDiagTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.value(name='value')` {#MultivariateNormalDiagTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.value_type` {#MultivariateNormalDiagTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor` {#MultivariateNormalDiagPlusVDVTTensor} - -`MultivariateNormalDiagPlusVDVTTensor` is a `StochasticTensor` backed by the distribution `MultivariateNormalDiagPlusVDVT`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MultivariateNormalDiagPlusVDVTTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.clone(name=None, **dist_args)` {#MultivariateNormalDiagPlusVDVTTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.distribution` {#MultivariateNormalDiagPlusVDVTTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.dtype` {#MultivariateNormalDiagPlusVDVTTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.entropy(name='entropy')` {#MultivariateNormalDiagPlusVDVTTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.graph` {#MultivariateNormalDiagPlusVDVTTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.input_dict` {#MultivariateNormalDiagPlusVDVTTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.loss(final_loss, name='Loss')` {#MultivariateNormalDiagPlusVDVTTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.mean(name='mean')` {#MultivariateNormalDiagPlusVDVTTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.name` {#MultivariateNormalDiagPlusVDVTTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.value(name='value')` {#MultivariateNormalDiagPlusVDVTTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.value_type` {#MultivariateNormalDiagPlusVDVTTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor` {#MultivariateNormalDiagWithSoftplusStDevTensor} - -`MultivariateNormalDiagWithSoftplusStDevTensor` is a `StochasticTensor` backed by the distribution `MultivariateNormalDiagWithSoftplusStDev`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MultivariateNormalDiagWithSoftplusStDevTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.clone(name=None, **dist_args)` {#MultivariateNormalDiagWithSoftplusStDevTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.distribution` {#MultivariateNormalDiagWithSoftplusStDevTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.dtype` {#MultivariateNormalDiagWithSoftplusStDevTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.entropy(name='entropy')` {#MultivariateNormalDiagWithSoftplusStDevTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.graph` {#MultivariateNormalDiagWithSoftplusStDevTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.input_dict` {#MultivariateNormalDiagWithSoftplusStDevTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.loss(final_loss, name='Loss')` {#MultivariateNormalDiagWithSoftplusStDevTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.mean(name='mean')` {#MultivariateNormalDiagWithSoftplusStDevTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.name` {#MultivariateNormalDiagWithSoftplusStDevTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.value(name='value')` {#MultivariateNormalDiagWithSoftplusStDevTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.value_type` {#MultivariateNormalDiagWithSoftplusStDevTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor` {#MultivariateNormalFullTensor} - -`MultivariateNormalFullTensor` is a `StochasticTensor` backed by the distribution `MultivariateNormalFull`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MultivariateNormalFullTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.clone(name=None, **dist_args)` {#MultivariateNormalFullTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.distribution` {#MultivariateNormalFullTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.dtype` {#MultivariateNormalFullTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.entropy(name='entropy')` {#MultivariateNormalFullTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.graph` {#MultivariateNormalFullTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.input_dict` {#MultivariateNormalFullTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.loss(final_loss, name='Loss')` {#MultivariateNormalFullTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.mean(name='mean')` {#MultivariateNormalFullTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.name` {#MultivariateNormalFullTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.value(name='value')` {#MultivariateNormalFullTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.value_type` {#MultivariateNormalFullTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.NormalTensor` {#NormalTensor} - -`NormalTensor` is a `StochasticTensor` backed by the distribution `Normal`. 
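The `value_type` property that recurs in every class above is set by a context manager in the same module. A short sketch, assuming the era's `value_type`/`MeanValue` helpers, of how it changes what `value()` yields (shapes and names are illustrative):

```python
import tensorflow as tf

st = tf.contrib.bayesflow.stochastic_tensor

mu = tf.zeros([2])
sigma = tf.ones([2])

# By default, value() is a sample drawn from Normal(mu, sigma).
x_sample = st.NormalTensor(mu=mu, sigma=sigma)

# Inside a value_type block, value() can instead be the distribution's
# mean: a common choice for a deterministic forward pass.
with st.value_type(st.MeanValue()):
    x_mean = st.NormalTensor(mu=mu, sigma=sigma)

print(x_sample.value_type)  # the default sampling value type
print(x_mean.value_type)    # MeanValue
```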
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#NormalTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.clone(name=None, **dist_args)` {#NormalTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.distribution` {#NormalTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.dtype` {#NormalTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.entropy(name='entropy')` {#NormalTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.graph` {#NormalTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.input_dict` {#NormalTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.loss(final_loss, name='Loss')` {#NormalTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.mean(name='mean')` {#NormalTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.name` {#NormalTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.value(name='value')` {#NormalTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.value_type` {#NormalTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor` {#NormalWithSoftplusSigmaTensor} - -`NormalWithSoftplusSigmaTensor` is a `StochasticTensor` backed by the distribution `NormalWithSoftplusSigma`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#NormalWithSoftplusSigmaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.clone(name=None, **dist_args)` {#NormalWithSoftplusSigmaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.distribution` {#NormalWithSoftplusSigmaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.dtype` {#NormalWithSoftplusSigmaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.entropy(name='entropy')` {#NormalWithSoftplusSigmaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.graph` {#NormalWithSoftplusSigmaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.input_dict` {#NormalWithSoftplusSigmaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.loss(final_loss, name='Loss')` {#NormalWithSoftplusSigmaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.mean(name='mean')` {#NormalWithSoftplusSigmaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.name` {#NormalWithSoftplusSigmaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.value(name='value')` {#NormalWithSoftplusSigmaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.value_type` 
{#NormalWithSoftplusSigmaTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.PoissonTensor` {#PoissonTensor} - -`PoissonTensor` is a `StochasticTensor` backed by the distribution `Poisson`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#PoissonTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.clone(name=None, **dist_args)` {#PoissonTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.distribution` {#PoissonTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.dtype` {#PoissonTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.entropy(name='entropy')` {#PoissonTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.graph` {#PoissonTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.input_dict` {#PoissonTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.loss(final_loss, name='Loss')` {#PoissonTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.mean(name='mean')` {#PoissonTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.name` {#PoissonTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.value(name='value')` {#PoissonTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.value_type` {#PoissonTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor` {#QuantizedDistributionTensor} - -`QuantizedDistributionTensor` is a `StochasticTensor` backed by the distribution `QuantizedDistribution`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#QuantizedDistributionTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.clone(name=None, **dist_args)` {#QuantizedDistributionTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.distribution` {#QuantizedDistributionTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.dtype` {#QuantizedDistributionTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.entropy(name='entropy')` {#QuantizedDistributionTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.graph` {#QuantizedDistributionTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.input_dict` {#QuantizedDistributionTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.loss(final_loss, name='Loss')` {#QuantizedDistributionTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.mean(name='mean')` {#QuantizedDistributionTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.name` {#QuantizedDistributionTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.value(name='value')` {#QuantizedDistributionTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.value_type` {#QuantizedDistributionTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.StudentTTensor` {#StudentTTensor} - -`StudentTTensor` is a `StochasticTensor` backed by the distribution `StudentT`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#StudentTTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.clone(name=None, **dist_args)` {#StudentTTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.distribution` {#StudentTTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.dtype` {#StudentTTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.entropy(name='entropy')` {#StudentTTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.graph` {#StudentTTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.input_dict` {#StudentTTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.loss(final_loss, name='Loss')` {#StudentTTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.mean(name='mean')` {#StudentTTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.name` {#StudentTTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.value(name='value')` {#StudentTTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.value_type` {#StudentTTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor` {#StudentTWithAbsDfSoftplusSigmaTensor} - -`StudentTWithAbsDfSoftplusSigmaTensor` is a `StochasticTensor` backed by the distribution `StudentTWithAbsDfSoftplusSigma`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#StudentTWithAbsDfSoftplusSigmaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.clone(name=None, **dist_args)` {#StudentTWithAbsDfSoftplusSigmaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.distribution` {#StudentTWithAbsDfSoftplusSigmaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.dtype` {#StudentTWithAbsDfSoftplusSigmaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.entropy(name='entropy')` {#StudentTWithAbsDfSoftplusSigmaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.graph` {#StudentTWithAbsDfSoftplusSigmaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.input_dict` {#StudentTWithAbsDfSoftplusSigmaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.loss(final_loss, name='Loss')` {#StudentTWithAbsDfSoftplusSigmaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.mean(name='mean')` {#StudentTWithAbsDfSoftplusSigmaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.name` {#StudentTWithAbsDfSoftplusSigmaTensor.name} - - - - -- - - - -#### 
`tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.value(name='value')` {#StudentTWithAbsDfSoftplusSigmaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.value_type` {#StudentTWithAbsDfSoftplusSigmaTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor` {#TransformedDistributionTensor} - -`TransformedDistributionTensor` is a `StochasticTensor` backed by the distribution `TransformedDistribution`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#TransformedDistributionTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.clone(name=None, **dist_args)` {#TransformedDistributionTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.distribution` {#TransformedDistributionTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.dtype` {#TransformedDistributionTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.entropy(name='entropy')` {#TransformedDistributionTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.graph` {#TransformedDistributionTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.input_dict` {#TransformedDistributionTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.loss(final_loss, name='Loss')` {#TransformedDistributionTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.mean(name='mean')` {#TransformedDistributionTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.name` {#TransformedDistributionTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.value(name='value')` {#TransformedDistributionTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.value_type` {#TransformedDistributionTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.UniformTensor` {#UniformTensor} - -`UniformTensor` is a `StochasticTensor` backed by the distribution `Uniform`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#UniformTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.clone(name=None, **dist_args)` {#UniformTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.distribution` {#UniformTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.dtype` {#UniformTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.entropy(name='entropy')` {#UniformTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.graph` {#UniformTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.input_dict` {#UniformTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.loss(final_loss, name='Loss')` {#UniformTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.mean(name='mean')` {#UniformTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.name` {#UniformTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.value(name='value')` {#UniformTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.value_type` {#UniformTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor` {#WishartCholeskyTensor} - -`WishartCholeskyTensor` is a `StochasticTensor` backed by the distribution `WishartCholesky`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#WishartCholeskyTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.clone(name=None, **dist_args)` {#WishartCholeskyTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.distribution` {#WishartCholeskyTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.dtype` {#WishartCholeskyTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.entropy(name='entropy')` {#WishartCholeskyTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.graph` {#WishartCholeskyTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.input_dict` {#WishartCholeskyTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.loss(final_loss, name='Loss')` {#WishartCholeskyTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.mean(name='mean')` {#WishartCholeskyTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.name` {#WishartCholeskyTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.value(name='value')` {#WishartCholeskyTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.value_type` {#WishartCholeskyTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor` {#WishartFullTensor} - -`WishartFullTensor` is a `StochasticTensor` backed by the distribution 
`WishartFull`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#WishartFullTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.clone(name=None, **dist_args)` {#WishartFullTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.distribution` {#WishartFullTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.dtype` {#WishartFullTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.entropy(name='entropy')` {#WishartFullTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.graph` {#WishartFullTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.input_dict` {#WishartFullTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.loss(final_loss, name='Loss')` {#WishartFullTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.mean(name='mean')` {#WishartFullTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.name` {#WishartFullTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.value(name='value')` {#WishartFullTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.value_type` {#WishartFullTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor` {#beta_aaTensor} - -`beta_aaTensor` is a `StochasticTensor` backed by the distribution `beta_aa`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#beta_aaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.clone(name=None, **dist_args)` {#beta_aaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.distribution` {#beta_aaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.dtype` {#beta_aaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.entropy(name='entropy')` {#beta_aaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.graph` {#beta_aaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.input_dict` {#beta_aaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.loss(final_loss, name='Loss')` {#beta_aaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.mean(name='mean')` {#beta_aaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.name` {#beta_aaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.value(name='value')` {#beta_aaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.value_type` {#beta_aaTensor.value_type} - - - - - -- - - - -### `class tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor` {#beta_bbTensor} - -`beta_bbTensor` is a `StochasticTensor` backed by the distribution `beta_bb`. 
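The recurring `loss(final_loss)` member is what makes these sampled values trainable: by default each class contributes a score-function surrogate term (`loss_fn=score_function` in the constructors above). A hedged sketch of the intended wiring, assuming the companion `stochastic_graph.surrogate_loss` helper from the same era; all names and constants are illustrative:

```python
import tensorflow as tf

st = tf.contrib.bayesflow.stochastic_tensor
sg = tf.contrib.bayesflow.stochastic_graph

# A stochastic node whose parameter we want to learn.
mu = tf.Variable(0.0)
x = st.NormalTensor(mu=mu, sigma=1.0)

# Downstream loss computed from the sampled value of x.
final_loss = tf.square(tf.identity(x) - 3.0)

# surrogate_loss collects the score-function terms produced by each
# StochasticTensor's loss(final_loss), so gradients with respect to mu
# exist even though the sampling step itself is not differentiable.
total_loss = sg.surrogate_loss([final_loss])
train_op = tf.train.GradientDescentOptimizer(0.1).minimize(total_loss)
```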
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#beta_bbTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.clone(name=None, **dist_args)` {#beta_bbTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.distribution` {#beta_bbTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.dtype` {#beta_bbTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.entropy(name='entropy')` {#beta_bbTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.graph` {#beta_bbTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.input_dict` {#beta_bbTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.loss(final_loss, name='Loss')` {#beta_bbTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.mean(name='mean')` {#beta_bbTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.name` {#beta_bbTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.value(name='value')` {#beta_bbTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.value_type` {#beta_bbTensor.value_type} - - - - - - ## Other Functions and Classes - - - @@ -3800,38 +444,29 @@ in a `stop_gradients` call to disable any possible backpropagation. A StochasticTensor with an observed value. - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.__init__(dist_cls, value, name=None, **dist_args)` {#ObservedStochasticTensor.__init__} +#### `tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.__init__(dist, value, name=None)` {#ObservedStochasticTensor.__init__} Construct an `ObservedStochasticTensor`. -`ObservedStochasticTensor` will instantiate a distribution from `dist_cls` -and `dist_args` but use the provided value instead of sampling from the -distribution. The provided value argument must be appropriately shaped -to have come from the constructed distribution. +`ObservedStochasticTensor` is backed by distribution `dist` and uses the +provided value instead of using the current value type to draw a value from +the distribution. The provided value argument must be appropriately shaped +to have come from the distribution. ##### Args: -* `dist_cls`: a `Distribution` class. +* `dist`: an instance of `Distribution`. * `value`: a Tensor containing the observed value * `name`: a name for this `ObservedStochasticTensor` and its ops. -* `**dist_args`: keyword arguments to be passed through to `dist_cls` on - construction. ##### Raises: -* `TypeError`: if `dist_cls` is not a `Distribution`. +* `TypeError`: if `dist` is not an instance of `Distribution`. * `ValueError`: if `value` is not compatible with the distribution. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.clone(name=None, **dist_args)` {#ObservedStochasticTensor.clone} - - - - - - - #### `tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.distribution` {#ObservedStochasticTensor.distribution} @@ -3860,13 +495,6 @@ to have come from the constructed distribution. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.input_dict` {#ObservedStochasticTensor.input_dict} - - - - - - - #### `tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.loss(final_loss, name=None)` {#ObservedStochasticTensor.loss} diff --git a/tensorflow/g3doc/api_docs/python/contrib.distributions.md b/tensorflow/g3doc/api_docs/python/contrib.distributions.md index bc4a79cf85f..a86285a0196 100644 --- a/tensorflow/g3doc/api_docs/python/contrib.distributions.md +++ b/tensorflow/g3doc/api_docs/python/contrib.distributions.md @@ -17325,62 +17325,6 @@ Variance. -- - - - -### `tf.contrib.distributions.matrix_diag_transform(matrix, transform=None, name=None)` {#matrix_diag_transform} - -Transform diagonal of [batch-]matrix, leave rest of matrix unchanged. - -Create a trainable covariance defined by a Cholesky factor: - -```python -# Transform network layer into 2 x 2 array. -matrix_values = tf.contrib.layers.fully_connected(activations, 4) -matrix = tf.reshape(matrix_values, (batch_size, 2, 2)) - -# Make the diagonal positive. If the upper triangle was zero, this would be a -# valid Cholesky factor. -chol = matrix_diag_transform(matrix, transform=tf.nn.softplus) - -# OperatorPDCholesky ignores the upper triangle. -operator = OperatorPDCholesky(chol) -``` - -Example of heteroskedastic 2-D linear regression. - -```python -# Get a trainable Cholesky factor. -matrix_values = tf.contrib.layers.fully_connected(activations, 4) -matrix = tf.reshape(matrix_values, (batch_size, 2, 2)) -chol = matrix_diag_transform(matrix, transform=tf.nn.softplus) - -# Get a trainable mean. -mu = tf.contrib.layers.fully_connected(activations, 2) - -# This is a fully trainable multivariate normal! -dist = tf.contrib.distributions.MVNCholesky(mu, chol) - -# Standard log loss. Minimizing this will "train" mu and chol, and then dist -# will be a distribution predicting labels as multivariate Gaussians. -loss = -1 * tf.reduce_mean(dist.log_pdf(labels)) -``` - -##### Args: - - -* `matrix`: Rank `R` `Tensor`, `R >= 2`, where the last two dimensions are - equal. -* `transform`: Element-wise function mapping `Tensors` to `Tensors`. To - be applied to the diagonal of `matrix`. If `None`, `matrix` is returned - unchanged. Defaults to `None`. -* `name`: A name to give created ops. - Defaults to "matrix_diag_transform". - -##### Returns: - - A `Tensor` with same shape and `dtype` as `matrix`. - - ### Other multivariate distributions @@ -20793,6 +20737,65 @@ Variance. +### Multivariate Utilities + +- - - + +### `tf.contrib.distributions.matrix_diag_transform(matrix, transform=None, name=None)` {#matrix_diag_transform} + +Transform diagonal of [batch-]matrix, leave rest of matrix unchanged. + +Create a trainable covariance defined by a Cholesky factor: + +```python +# Transform network layer into 2 x 2 array. +matrix_values = tf.contrib.layers.fully_connected(activations, 4) +matrix = tf.reshape(matrix_values, (batch_size, 2, 2)) + +# Make the diagonal positive. If the upper triangle was zero, this would be a +# valid Cholesky factor. +chol = matrix_diag_transform(matrix, transform=tf.nn.softplus) + +# OperatorPDCholesky ignores the upper triangle. +operator = OperatorPDCholesky(chol) +``` + +Example of heteroskedastic 2-D linear regression. + +```python +# Get a trainable Cholesky factor. 
+matrix_values = tf.contrib.layers.fully_connected(activations, 4)
+matrix = tf.reshape(matrix_values, (batch_size, 2, 2))
+chol = matrix_diag_transform(matrix, transform=tf.nn.softplus)
+
+# Get a trainable mean.
+mu = tf.contrib.layers.fully_connected(activations, 2)
+
+# This is a fully trainable multivariate normal!
+dist = tf.contrib.distributions.MVNCholesky(mu, chol)
+
+# Standard log loss. Minimizing this will "train" mu and chol, and then dist
+# will be a distribution predicting labels as multivariate Gaussians.
+loss = -1 * tf.reduce_mean(dist.log_pdf(labels))
+```
+
+##### Args:
+
+
+* `matrix`: Rank `R` `Tensor`, `R >= 2`, where the last two dimensions are
+  equal.
+* `transform`: Element-wise function mapping `Tensors` to `Tensors`. To
+  be applied to the diagonal of `matrix`. If `None`, `matrix` is returned
+  unchanged. Defaults to `None`.
+* `name`: A name to give created ops.
+  Defaults to "matrix_diag_transform".
+
+##### Returns:
+
+  A `Tensor` with same shape and `dtype` as `matrix`.
+
+
 ## Transformed distributions

 - - -

@@ -23052,7 +23055,7 @@ will broadcast in the case of multidimensional sets of parameters.

-## Kullback Leibler Divergence
+## Kullback-Leibler Divergence

 - - -

diff --git a/tensorflow/g3doc/api_docs/python/contrib.integrate.md b/tensorflow/g3doc/api_docs/python/contrib.integrate.md
new file mode 100644
index 00000000000..dc2c16a0dac
--- /dev/null
+++ b/tensorflow/g3doc/api_docs/python/contrib.integrate.md
@@ -0,0 +1,135 @@
+
+
+# Integrate (contrib)
+[TOC]
+
+Integration and ODE solvers for TensorFlow.
+
+## Example: Lorenz attractor
+
+We can use `odeint` to solve the
+[Lorenz system](https://en.wikipedia.org/wiki/Lorenz_system) of ordinary
+differential equations, a prototypical example of chaotic dynamics:
+
+```python
+rho = 28.0
+sigma = 10.0
+beta = 8.0/3.0
+
+def lorenz_equation(state, t):
+  x, y, z = tf.unpack(state)
+  dx = sigma * (y - x)
+  dy = x * (rho - z) - y
+  dz = x * y - beta * z
+  return tf.pack([dx, dy, dz])
+
+init_state = tf.constant([0, 2, 20], dtype=tf.float64)
+t = np.linspace(0, 50, num=5000)
+tensor_state, tensor_info = tf.contrib.integrate.odeint(
+    lorenz_equation, init_state, t, full_output=True)
+
+sess = tf.Session()
+state, info = sess.run([tensor_state, tensor_info])
+x, y, z = state.T
+plt.plot(x, z)
+```
+
+*(Figure: the resulting Lorenz attractor trajectory, shown as its (x, z)
+projection.)*
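+The snippet assumes the conventional aliases are already in scope; a minimal
+preamble (a sketch, not part of the example as shipped) would be:
+
+```python
+import numpy as np               # np.linspace builds the time grid `t`
+import matplotlib.pyplot as plt  # plt.plot draws the (x, z) projection
+import tensorflow as tf          # tf.unpack/tf.pack, as named in this release
+```
+
+After `sess.run(...)` returns, `plt.show()` renders the trajectory.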
+
+## Ops
+
+- - -
+
+### `tf.contrib.integrate.odeint(func, y0, t, rtol=1e-06, atol=1e-12, method=None, options=None, full_output=False, name=None)` {#odeint}
+
+Integrate a system of ordinary differential equations.
+
+Solves the initial value problem for a non-stiff system of first order ode-s:
+
+  ```
+  dy/dt = func(y, t), y(t[0]) = y0
+  ```
+
+where y is a Tensor of any shape.
+
+For example:
+
+  ```
+  # solve `dy/dt = -y`, corresponding to exponential decay
+  tf.contrib.integrate.odeint(lambda y, _: -y, 1.0, [0, 1, 2])
+  => [1, exp(-1), exp(-2)]
+  ```
+
+Output dtypes and numerical precision are based on the dtypes of the inputs
+`y0` and `t`.
+
+Currently, implements 5th order Runge-Kutta with adaptive step size control
+and dense output, using the Dormand-Prince method. Similar to the 'dopri5'
+method of `scipy.integrate.ode` and MATLAB's `ode45`.
+
+Based on: Shampine, Lawrence F. (1986), "Some Practical Runge-Kutta Formulas",
+Mathematics of Computation, American Mathematical Society, 46 (173): 135-150,
+doi:10.2307/2008219
+
+##### Args:
+
+
+* `func`: Function that maps a Tensor holding the state `y` and a scalar Tensor
+  `t` into a Tensor of state derivatives with respect to time.
+* `y0`: N-D Tensor giving starting value of `y` at time point `t[0]`. May
+  have any floating point or complex dtype.
+* `t`: 1-D Tensor holding a sequence of time points for which to solve for
+  `y`. The initial time point should be the first element of this sequence,
+  and each time must be larger than the previous time. May have any floating
+  point dtype. If not provided as a Tensor, converted to a Tensor with
+  float64 dtype.
+* `rtol`: optional float64 Tensor specifying an upper bound on relative error,
+  per element of `y`.
+* `atol`: optional float64 Tensor specifying an upper bound on absolute error,
+  per element of `y`.
+* `method`: optional string indicating the integration method to use. Currently,
+  the only valid option is `'dopri5'`.
+* `options`: optional dict of configuring options for the indicated integration
+  method. Can only be provided if a `method` is explicitly set. For
+  `'dopri5'`, valid options include:
+  * first_step: an initial guess for the size of the first integration
+    (current default: 1.0, but may later be changed to use heuristics based
+    on the gradient).
+  * safety: safety factor for adaptive step control, generally a constant
+    in the range 0.8-1 (default: 0.9).
+  * ifactor: maximum factor by which the adaptive step may be increased
+    (default: 10.0).
+  * dfactor: maximum factor by which the adaptive step may be decreased
+    (default: 0.2).
+  * max_num_steps: integer maximum number of integrate steps between time
+    points in `t` (default: 1000).
+* `full_output`: optional boolean. If True, `odeint` returns a tuple
+  `(y, info_dict)` describing the integration process.
+* `name`: Optional name for this operation.
+
+##### Returns:
+
+
+* `y`: (N+1)-D tensor, where the first dimension corresponds to different
+  time points. Contains the solved value of y for each desired time point in
+  `t`, with the initial value `y0` being the first element along the first
+  dimension.
+* `info_dict`: only if `full_output == True`. A dict with the following values:
+  * num_func_evals: integer Tensor counting the number of function
+    evaluations.
+  * integrate_points: 1D float64 Tensor with the upper bound of each
+    integration time step.
+  * error_ratio: 1D float Tensor with the estimated ratio of the integration
+    error to the error tolerance at each integration step. A ratio greater
+    than 1 corresponds to rejected steps.
+
+##### Raises:
+
+
+* `ValueError`: if an invalid `method` is provided.
+* `TypeError`: if `options` is supplied without `method`, or if `t` or `y0` has
+  an invalid dtype.
+
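+As a usage sketch (illustrative, not part of the reference itself), the
+exponential-decay example above can be evaluated end to end:
+
+```python
+import tensorflow as tf
+
+# Solve dy/dt = -y with y(0) = 1; the exact solution is y(t) = exp(-t).
+y = tf.contrib.integrate.odeint(lambda y, _: -y, 1.0, [0., 1., 2.])
+with tf.Session() as sess:
+  print(sess.run(y))  # approximately [1.0, 0.3679, 0.1353]
+```
+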
diff --git a/tensorflow/g3doc/api_docs/python/contrib.learn.md b/tensorflow/g3doc/api_docs/python/contrib.learn.md
index 8d55f807aed..30f6bbee6d4 100644
--- a/tensorflow/g3doc/api_docs/python/contrib.learn.md
+++ b/tensorflow/g3doc/api_docs/python/contrib.learn.md
@@ -1265,21 +1265,18 @@ classes. When number of possible classes is 2, this is binary classification.
 Example:

 ```python
-education = sparse_column_with_hash_bucket(column_name="education",
-                                           hash_bucket_size=1000)
-occupation = sparse_column_with_hash_bucket(column_name="occupation",
-                                            hash_bucket_size=1000)
+sparse_column_a = sparse_column_with_hash_bucket(...)
+sparse_column_b = sparse_column_with_hash_bucket(...)

-education_x_occupation = crossed_column(columns=[education, occupation],
-                                        hash_bucket_size=10000)
+sparse_feature_a_x_sparse_feature_b = crossed_column(...)

 # Estimator using the default optimizer.
 estimator = LinearClassifier(
-    feature_columns=[occupation, education_x_occupation])
+    feature_columns=[sparse_column_a, sparse_feature_a_x_sparse_feature_b])

 # Or estimator using the FTRL optimizer with regularization.
 estimator = LinearClassifier(
-    feature_columns=[occupation, education_x_occupation],
+    feature_columns=[sparse_column_a, sparse_feature_a_x_sparse_feature_b],
     optimizer=tf.train.FtrlOptimizer(
       learning_rate=0.1,
       l1_regularization_strength=0.001
@@ -1287,7 +1284,7 @@ estimator = LinearClassifier(

 # Or estimator using the SDCAOptimizer.
 estimator = LinearClassifier(
-   feature_columns=[occupation, education_x_occupation],
+   feature_columns=[sparse_column_a, sparse_feature_a_x_sparse_feature_b],
    optimizer=tf.contrib.linear_optimizer.SDCAOptimizer(
      example_id_column='example_id',
      num_loss_partitions=...,
@@ -1483,16 +1480,13 @@ feature values.
 Example:

 ```python
-education = sparse_column_with_hash_bucket(column_name="education",
-                                           hash_bucket_size=1000)
-occupation = sparse_column_with_hash_bucket(column_name="occupation",
-                                            hash_bucket_size=1000)
+sparse_column_a = sparse_column_with_hash_bucket(...)
+sparse_column_b = sparse_column_with_hash_bucket(...)

-education_x_occupation = crossed_column(columns=[education, occupation],
-                                        hash_bucket_size=10000)
+sparse_feature_a_x_sparse_feature_b = crossed_column(...)

 estimator = LinearRegressor(
-    feature_columns=[occupation, education_x_occupation])
+    feature_columns=[sparse_column_a, sparse_feature_a_x_sparse_feature_b])

 # Input builders
 def input_fn_train: # returns x, y
diff --git a/tensorflow/g3doc/api_docs/python/contrib.metrics.md b/tensorflow/g3doc/api_docs/python/contrib.metrics.md
index 326a90b2c40..856be448660 100644
--- a/tensorflow/g3doc/api_docs/python/contrib.metrics.md
+++ b/tensorflow/g3doc/api_docs/python/contrib.metrics.md
@@ -300,7 +305,12 @@ This value is ultimately returned as `auc`, an idempotent operation that
 computes the area under a discretized curve of precision versus recall values
 (computed using the aforementioned variables). The `num_thresholds` variable
 controls the degree of discretization with larger numbers of thresholds more
-closely approximating the true AUC.
+closely approximating the true AUC. The quality of the approximation may vary
+dramatically depending on `num_thresholds`.
+ +For best results, `predictions` should be distributed approximately uniformly +in the range [0, 1] and not peaked around 0 or 1. The quality of the AUC +approximation may be poor if this is not the case. For estimation of the metric over a stream of data, the function creates an `update_op` operation that updates these variables and returns the `auc`. diff --git a/tensorflow/g3doc/api_docs/python/framework.md b/tensorflow/g3doc/api_docs/python/framework.md index 498e7d999f3..86de039e7bd 100644 --- a/tensorflow/g3doc/api_docs/python/framework.md +++ b/tensorflow/g3doc/api_docs/python/framework.md @@ -2845,10 +2845,18 @@ variables. The following standard keys are defined: -* `VARIABLES`: the `Variable` objects that comprise a model, and - must be saved and restored together. See - [`tf.all_variables()`](../../api_docs/python/state_ops.md#all_variables) +* `GLOBAL_VARIABLES`: the default collection of `Variable` objects, shared + across distributed environment (model variables are subset of these). See + [`tf.global_variables()`](../../api_docs/python/state_ops.md#global_variables) for more details. + Commonly, all `TRAINABLE_VARIABLES` variables will be in `MODEL_VARIABLES`, + and all `MODEL_VARIABLES` variables will be in `GLOBAL_VARIABLES`. +* `LOCAL_VARIABLES`: the subset of `Variable` objects that are local to each + machine. Usually used for temporarily variables, like counters. + Note: use `tf.contrib.framework.local_variable` to add to this collection. +* `MODEL_VARIABLES`: the subset of `Variable` objects that are used in the + model for inference (feed forward). Note: use + `tf.contrib.framework.model_variable` to add to this collection. * `TRAINABLE_VARIABLES`: the subset of `Variable` objects that will be trained by an optimizer. See [`tf.trainable_variables()`](../../api_docs/python/state_ops.md#trainable_variables) diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.md deleted file mode 100644 index 380b9d2c7f2..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`BetaWithSoftplusABTensor` is a `StochasticTensor` backed by the distribution `BetaWithSoftplusAB`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#BetaWithSoftplusABTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.clone(name=None, **dist_args)` {#BetaWithSoftplusABTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.distribution` {#BetaWithSoftplusABTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.dtype` {#BetaWithSoftplusABTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.entropy(name='entropy')` {#BetaWithSoftplusABTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.graph` {#BetaWithSoftplusABTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.input_dict` {#BetaWithSoftplusABTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.loss(final_loss, name='Loss')` {#BetaWithSoftplusABTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.mean(name='mean')` {#BetaWithSoftplusABTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.name` {#BetaWithSoftplusABTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.value(name='value')` {#BetaWithSoftplusABTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaWithSoftplusABTensor.value_type` {#BetaWithSoftplusABTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.md deleted file mode 100644 index 874892f110f..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`GammaWithSoftplusAlphaBetaTensor` is a `StochasticTensor` backed by the distribution `GammaWithSoftplusAlphaBeta`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#GammaWithSoftplusAlphaBetaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.clone(name=None, **dist_args)` {#GammaWithSoftplusAlphaBetaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.distribution` {#GammaWithSoftplusAlphaBetaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.dtype` {#GammaWithSoftplusAlphaBetaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.entropy(name='entropy')` {#GammaWithSoftplusAlphaBetaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.graph` {#GammaWithSoftplusAlphaBetaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.input_dict` {#GammaWithSoftplusAlphaBetaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.loss(final_loss, name='Loss')` {#GammaWithSoftplusAlphaBetaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.mean(name='mean')` {#GammaWithSoftplusAlphaBetaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.name` {#GammaWithSoftplusAlphaBetaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.value(name='value')` {#GammaWithSoftplusAlphaBetaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaWithSoftplusAlphaBetaTensor.value_type` {#GammaWithSoftplusAlphaBetaTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.md deleted file mode 100644 index 7be941bb9a5..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`MultivariateNormalDiagPlusVDVTTensor` is a `StochasticTensor` backed by the distribution `MultivariateNormalDiagPlusVDVT`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MultivariateNormalDiagPlusVDVTTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.clone(name=None, **dist_args)` {#MultivariateNormalDiagPlusVDVTTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.distribution` {#MultivariateNormalDiagPlusVDVTTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.dtype` {#MultivariateNormalDiagPlusVDVTTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.entropy(name='entropy')` {#MultivariateNormalDiagPlusVDVTTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.graph` {#MultivariateNormalDiagPlusVDVTTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.input_dict` {#MultivariateNormalDiagPlusVDVTTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.loss(final_loss, name='Loss')` {#MultivariateNormalDiagPlusVDVTTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.mean(name='mean')` {#MultivariateNormalDiagPlusVDVTTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.name` {#MultivariateNormalDiagPlusVDVTTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.value(name='value')` {#MultivariateNormalDiagPlusVDVTTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagPlusVDVTTensor.value_type` {#MultivariateNormalDiagPlusVDVTTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.md index dc1975bf123..da7082ffb65 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.md @@ -1,38 +1,29 @@ A StochasticTensor with an observed value. - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.__init__(dist_cls, value, name=None, **dist_args)` {#ObservedStochasticTensor.__init__} +#### `tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.__init__(dist, value, name=None)` {#ObservedStochasticTensor.__init__} Construct an `ObservedStochasticTensor`. -`ObservedStochasticTensor` will instantiate a distribution from `dist_cls` -and `dist_args` but use the provided value instead of sampling from the -distribution. The provided value argument must be appropriately shaped -to have come from the constructed distribution. +`ObservedStochasticTensor` is backed by distribution `dist` and uses the +provided value instead of using the current value type to draw a value from +the distribution. 
The provided value argument must be appropriately shaped +to have come from the distribution. ##### Args: -* `dist_cls`: a `Distribution` class. +* `dist`: an instance of `Distribution`. * `value`: a Tensor containing the observed value * `name`: a name for this `ObservedStochasticTensor` and its ops. -* `**dist_args`: keyword arguments to be passed through to `dist_cls` on - construction. ##### Raises: -* `TypeError`: if `dist_cls` is not a `Distribution`. +* `TypeError`: if `dist` is not an instance of `Distribution`. * `ValueError`: if `value` is not compatible with the distribution. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.clone(name=None, **dist_args)` {#ObservedStochasticTensor.clone} - - - - - - - #### `tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.distribution` {#ObservedStochasticTensor.distribution} @@ -61,13 +52,6 @@ to have come from the constructed distribution. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.input_dict` {#ObservedStochasticTensor.input_dict} - - - - - - - #### `tf.contrib.bayesflow.stochastic_tensor.ObservedStochasticTensor.loss(final_loss, name=None)` {#ObservedStochasticTensor.loss} diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.SampleAndReshapeValue.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.SampleAndReshapeValue.md index 6d12b859ffe..6b564c36b9f 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.SampleAndReshapeValue.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.SampleAndReshapeValue.md @@ -23,8 +23,8 @@ with sg.value_type(sg.SampleAndReshapeValue(n=2)): st_value = st.value() assertEqual(st_value.get_shape(), (4, 3)) -dt_value_val = sess.run([st_value])[0] # or e.g. run([tf.identity(st)])[0] -assertEqual(dt_value_val.shape, (4, 3)) +st_value_val = sess.run([st_value])[0] # or e.g. run([tf.identity(st)])[0] +assertEqual(st_value_val.shape, (4, 3)) ``` - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.md deleted file mode 100644 index 52493288601..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`TransformedDistributionTensor` is a `StochasticTensor` backed by the distribution `TransformedDistribution`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#TransformedDistributionTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.clone(name=None, **dist_args)` {#TransformedDistributionTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.distribution` {#TransformedDistributionTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.dtype` {#TransformedDistributionTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.entropy(name='entropy')` {#TransformedDistributionTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.graph` {#TransformedDistributionTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.input_dict` {#TransformedDistributionTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.loss(final_loss, name='Loss')` {#TransformedDistributionTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.mean(name='mean')` {#TransformedDistributionTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.name` {#TransformedDistributionTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.value(name='value')` {#TransformedDistributionTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.TransformedDistributionTensor.value_type` {#TransformedDistributionTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.learn.LinearRegressor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.learn.LinearRegressor.md index bdeab9de13c..2352b13897a 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.learn.LinearRegressor.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.contrib.learn.LinearRegressor.md @@ -6,16 +6,13 @@ feature values. Example: ```python -education = sparse_column_with_hash_bucket(column_name="education", - hash_bucket_size=1000) -occupation = sparse_column_with_hash_bucket(column_name="occupation", - hash_bucket_size=1000) +sparse_column_a = sparse_column_with_hash_bucket(...) +sparse_column_b = sparse_column_with_hash_bucket(...) -education_x_occupation = crossed_column(columns=[education, occupation], - hash_bucket_size=10000) +sparse_feature_a_x_sparse_feature_b = crossed_column(...) 
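+# (Illustrative only, not part of the original example: with concrete
+# arguments the elided calls above might read
+#   sparse_column_a = sparse_column_with_hash_bucket("feature_a",
+#                                                    hash_bucket_size=1000)
+#   sparse_feature_a_x_sparse_feature_b = crossed_column(
+#       [sparse_column_a, sparse_column_b], hash_bucket_size=10000)
+# mirroring the deleted education/occupation lines in this hunk.)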
estimator = LinearRegressor( - feature_columns=[occupation, education_x_occupation]) + feature_columns=[sparse_column_a, sparse_feature_a_x_sparse_feature_b]) # Input builders def input_fn_train: # returns x, y diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.fake_quant_with_min_max_vars_gradient.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.fake_quant_with_min_max_vars_gradient.md new file mode 100644 index 00000000000..b363afe7cef --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.fake_quant_with_min_max_vars_gradient.md @@ -0,0 +1,27 @@ +### `tf.fake_quant_with_min_max_vars_gradient(gradients, inputs, min, max, name=None)` {#fake_quant_with_min_max_vars_gradient} + +Compute gradients for a FakeQuantWithMinMaxVars operation. + +##### Args: + + +* `gradients`: A `Tensor` of type `float32`. + Backpropagated gradients above the FakeQuantWithMinMaxVars operation. +* `inputs`: A `Tensor` of type `float32`. + Values passed as inputs to the FakeQuantWithMinMaxVars operation. + min, max: Quantization interval, scalar floats. +* `min`: A `Tensor` of type `float32`. +* `max`: A `Tensor` of type `float32`. +* `name`: A name for the operation (optional). + +##### Returns: + + A tuple of `Tensor` objects (backprops_wrt_input, backprop_wrt_min, backprop_wrt_max). + +* `backprops_wrt_input`: A `Tensor` of type `float32`. Backpropagated gradients w.r.t. inputs: + `gradients * (inputs >= min && inputs <= max)`. +* `backprop_wrt_min`: A `Tensor` of type `float32`. Backpropagated gradients w.r.t. min parameter: + `sum(gradients * (inputs < min))`. +* `backprop_wrt_max`: A `Tensor` of type `float32`. Backpropagated gradients w.r.t. max parameter: + `sum(gradients * (inputs > max))`. + diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.fake_quant_with_min_max_vars_per_channel_gradient.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.fake_quant_with_min_max_vars_per_channel_gradient.md new file mode 100644 index 00000000000..a7a62e29b31 --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard0/tf.fake_quant_with_min_max_vars_per_channel_gradient.md @@ -0,0 +1,30 @@ +### `tf.fake_quant_with_min_max_vars_per_channel_gradient(gradients, inputs, min, max, name=None)` {#fake_quant_with_min_max_vars_per_channel_gradient} + +Compute gradients for a FakeQuantWithMinMaxVarsPerChannel operation. + +##### Args: + + +* `gradients`: A `Tensor` of type `float32`. + Backpropagated gradients above the FakeQuantWithMinMaxVars operation, + shape one of: `[d]`, `[b, d]`, `[b, h, w, d]`. +* `inputs`: A `Tensor` of type `float32`. + Values passed as inputs to the FakeQuantWithMinMaxVars operation, shape + same as `gradients`. + min, max: Quantization interval, floats of shape `[d]`. +* `min`: A `Tensor` of type `float32`. +* `max`: A `Tensor` of type `float32`. +* `name`: A name for the operation (optional). + +##### Returns: + + A tuple of `Tensor` objects (backprops_wrt_input, backprop_wrt_min, backprop_wrt_max). + +* `backprops_wrt_input`: A `Tensor` of type `float32`. Backpropagated gradients w.r.t. inputs, shape same as + `inputs`: + `gradients * (inputs >= min && inputs <= max)`. +* `backprop_wrt_min`: A `Tensor` of type `float32`. Backpropagated gradients w.r.t. min parameter, shape `[d]`: + `sum_per_d(gradients * (inputs < min))`. +* `backprop_wrt_max`: A `Tensor` of type `float32`. Backpropagated gradients w.r.t. 
max parameter, shape `[d]`: + `sum_per_d(gradients * (inputs > max))`. + diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.all_variables.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.all_variables.md index 904b99f321a..a64640478ff 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.all_variables.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.all_variables.md @@ -1,12 +1,8 @@ -### `tf.all_variables()` {#all_variables} +### `tf.all_variables(*args, **kwargs)` {#all_variables} -Returns all variables that must be saved/restored. +See `tf.global_variables`. (deprecated) -The `Variable()` constructor automatically adds new variables to the graph -collection `GraphKeys.VARIABLES`. This convenience function returns the -contents of that collection. - -##### Returns: - - A list of `Variable` objects. +THIS FUNCTION IS DEPRECATED. It will be removed after 2016-03-02. +Instructions for updating: +Please use tf.global_variables instead. diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.bayesflow.stochastic_tensor.BaseStochasticTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.bayesflow.stochastic_tensor.BaseStochasticTensor.md index 8e1c5a98864..0bee637f4d2 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.bayesflow.stochastic_tensor.BaseStochasticTensor.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.bayesflow.stochastic_tensor.BaseStochasticTensor.md @@ -20,13 +20,6 @@ Base Class for Tensor-like objects that emit stochastic values. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BaseStochasticTensor.input_dict` {#BaseStochasticTensor.input_dict} - - - - - - - #### `tf.contrib.bayesflow.stochastic_tensor.BaseStochasticTensor.loss(sample_loss)` {#BaseStochasticTensor.loss} diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.bayesflow.stochastic_tensor.BetaTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.bayesflow.stochastic_tensor.BetaTensor.md deleted file mode 100644 index 12f015573d2..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.bayesflow.stochastic_tensor.BetaTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`BetaTensor` is a `StochasticTensor` backed by the distribution `Beta`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#BetaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.clone(name=None, **dist_args)` {#BetaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.distribution` {#BetaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.dtype` {#BetaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.entropy(name='entropy')` {#BetaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.graph` {#BetaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.input_dict` {#BetaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.loss(final_loss, name='Loss')` {#BetaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.mean(name='mean')` {#BetaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.name` {#BetaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.value(name='value')` {#BetaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BetaTensor.value_type` {#BetaTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.md deleted file mode 100644 index 3354de85c9c..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`LaplaceWithSoftplusScaleTensor` is a `StochasticTensor` backed by the distribution `LaplaceWithSoftplusScale`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#LaplaceWithSoftplusScaleTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.clone(name=None, **dist_args)` {#LaplaceWithSoftplusScaleTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.distribution` {#LaplaceWithSoftplusScaleTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.dtype` {#LaplaceWithSoftplusScaleTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.entropy(name='entropy')` {#LaplaceWithSoftplusScaleTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.graph` {#LaplaceWithSoftplusScaleTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.input_dict` {#LaplaceWithSoftplusScaleTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.loss(final_loss, name='Loss')` {#LaplaceWithSoftplusScaleTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.mean(name='mean')` {#LaplaceWithSoftplusScaleTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.name` {#LaplaceWithSoftplusScaleTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.value(name='value')` {#LaplaceWithSoftplusScaleTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceWithSoftplusScaleTensor.value_type` {#LaplaceWithSoftplusScaleTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.integrate.odeint.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.integrate.odeint.md new file mode 100644 index 00000000000..25b2709be88 --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.integrate.odeint.md @@ -0,0 +1,90 @@ +### `tf.contrib.integrate.odeint(func, y0, t, rtol=1e-06, atol=1e-12, method=None, options=None, full_output=False, name=None)` {#odeint} + +Integrate a system of ordinary differential equations. + +Solves the initial value problem for a non-stiff system of first order ode-s: + + ``` + dy/dt = func(y, t), y(t[0]) = y0 + ``` + +where y is a Tensor of any shape. + +For example: + + ``` + # solve `dy/dt = -y`, corresponding to exponential decay + tf.contrib.integrate.odeint(lambda y, _: -y, 1.0, [0, 1, 2]) + => [1, exp(-1), exp(-2)] + ``` + +Output dtypes and numerical precision are based on the dtypes of the inputs +`y0` and `t`. + +Currently, implements 5th order Runge-Kutta with adaptive step size control +and dense output, using the Dormand-Prince method. Similar to the 'dopri5' +method of `scipy.integrate.ode` and MATLAB's `ode45`. + +Based on: Shampine, Lawrence F. (1986), "Some Practical Runge-Kutta Formulas", +Mathematics of Computation, American Mathematical Society, 46 (173): 135-150, +doi:10.2307/2008219 + +##### Args: + + +* `func`: Function that maps a Tensor holding the state `y` and a scalar Tensor + `t` into a Tensor of state derivatives with respect to time. +* `y0`: N-D Tensor giving starting value of `y` at time point `t[0]`. 
May
+  have any floating point or complex dtype.
+* `t`: 1-D Tensor holding a sequence of time points for which to solve for
+  `y`. The initial time point should be the first element of this sequence,
+  and each time must be larger than the previous time. May have any floating
+  point dtype. If not provided as a Tensor, converted to a Tensor with
+  float64 dtype.
+* `rtol`: optional float64 Tensor specifying an upper bound on relative error,
+  per element of `y`.
+* `atol`: optional float64 Tensor specifying an upper bound on absolute error,
+  per element of `y`.
+* `method`: optional string indicating the integration method to use. Currently,
+  the only valid option is `'dopri5'`.
+* `options`: optional dict of configuring options for the indicated integration
+  method. Can only be provided if a `method` is explicitly set. For
+  `'dopri5'`, valid options include:
+  * first_step: an initial guess for the size of the first integration
+    (current default: 1.0, but may later be changed to use heuristics based
+    on the gradient).
+  * safety: safety factor for adaptive step control, generally a constant
+    in the range 0.8-1 (default: 0.9).
+  * ifactor: maximum factor by which the adaptive step may be increased
+    (default: 10.0).
+  * dfactor: maximum factor by which the adaptive step may be decreased
+    (default: 0.2).
+  * max_num_steps: integer maximum number of integrate steps between time
+    points in `t` (default: 1000).
+* `full_output`: optional boolean. If True, `odeint` returns a tuple
+  `(y, info_dict)` describing the integration process.
+* `name`: Optional name for this operation.
+
+##### Returns:
+
+
+* `y`: (N+1)-D tensor, where the first dimension corresponds to different
+  time points. Contains the solved value of y for each desired time point in
+  `t`, with the initial value `y0` being the first element along the first
+  dimension.
+* `info_dict`: only if `full_output == True`. A dict with the following values:
+  * num_func_evals: integer Tensor counting the number of function
+    evaluations.
+  * integrate_points: 1D float64 Tensor with the upper bound of each
+    integration time step.
+  * error_ratio: 1D float Tensor with the estimated ratio of the integration
+    error to the error tolerance at each integration step. A ratio greater
+    than 1 corresponds to rejected steps.
+
+##### Raises:
+
+
+* `ValueError`: if an invalid `method` is provided.
+* `TypeError`: if `options` is supplied without `method`, or if `t` or `y0` has
+  an invalid dtype.
+
diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.learn.LinearClassifier.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.learn.LinearClassifier.md
index 9327ccc2c1f..3f6584c1f82 100644
--- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.learn.LinearClassifier.md
+++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.contrib.learn.LinearClassifier.md
@@ -6,21 +6,18 @@ classes. When number of possible classes is 2, this is binary classification.
 Example:

 ```python
-education = sparse_column_with_hash_bucket(column_name="education",
-                                           hash_bucket_size=1000)
-occupation = sparse_column_with_hash_bucket(column_name="occupation",
-                                            hash_bucket_size=1000)
+sparse_column_a = sparse_column_with_hash_bucket(...)
+sparse_column_b = sparse_column_with_hash_bucket(...)

-education_x_occupation = crossed_column(columns=[education, occupation],
-                                        hash_bucket_size=10000)
+sparse_feature_a_x_sparse_feature_b = crossed_column(...)
# Estimator using the default optimizer. estimator = LinearClassifier( - feature_columns=[occupation, education_x_occupation]) + feature_columns=[sparse_column_a, sparse_feature_a_x_sparse_feature_b]) # Or estimator using the FTRL optimizer with regularization. estimator = LinearClassifier( - feature_columns=[occupation, education_x_occupation], + feature_columns=[sparse_column_a, sparse_feature_a_x_sparse_feature_b], optimizer=tf.train.FtrlOptimizer( learning_rate=0.1, l1_regularization_strength=0.001 @@ -28,7 +25,7 @@ estimator = LinearClassifier( # Or estimator using the SDCAOptimizer. estimator = LinearClassifier( - feature_columns=[occupation, education_x_occupation], + feature_columns=[sparse_column_a, sparse_feature_a_x_sparse_feature_b], optimizer=tf.contrib.linear_optimizer.SDCAOptimizer( example_id_column='example_id', num_loss_partitions=..., diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.fake_quant_with_min_max_args_gradient.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.fake_quant_with_min_max_args_gradient.md new file mode 100644 index 00000000000..5c93c3e0468 --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.fake_quant_with_min_max_args_gradient.md @@ -0,0 +1,21 @@ +### `tf.fake_quant_with_min_max_args_gradient(gradients, inputs, min=None, max=None, name=None)` {#fake_quant_with_min_max_args_gradient} + +Compute gradients for a FakeQuantWithMinMaxArgs operation. + +##### Args: + + +* `gradients`: A `Tensor` of type `float32`. + Backpropagated gradients above the FakeQuantWithMinMaxArgs operation. +* `inputs`: A `Tensor` of type `float32`. + Values passed as inputs to the FakeQuantWithMinMaxArgs operation. +* `min`: An optional `float`. Defaults to `-6`. +* `max`: An optional `float`. Defaults to `6`. +* `name`: A name for the operation (optional). + +##### Returns: + + A `Tensor` of type `float32`. + Backpropagated gradients below the FakeQuantWithMinMaxArgs operation: + `gradients * (inputs >= min && inputs <= max)`. + diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.sparse_minimum.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.sparse_minimum.md index 4419f736b94..1455e3e533e 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.sparse_minimum.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard1/tf.sparse_minimum.md @@ -6,8 +6,8 @@ Assumes the two SparseTensors have the same shape, i.e., no broadcasting. Example: ```python -sp_zero = ops.SparseTensor([[0]], [0], [7]) -sp_one = ops.SparseTensor([[1]], [1], [7]) +sp_zero = sparse_tensor.SparseTensor([[0]], [0], [7]) +sp_one = sparse_tensor.SparseTensor([[1]], [1], [7]) res = tf.sparse_minimum(sp_zero, sp_one).eval() # "res" should be equal to SparseTensor([[0], [1]], [0, 0], [7]). ``` diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.md deleted file mode 100644 index 9628ddbb8bb..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`MultivariateNormalDiagTensor` is a `StochasticTensor` backed by the distribution `MultivariateNormalDiag`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MultivariateNormalDiagTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.clone(name=None, **dist_args)` {#MultivariateNormalDiagTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.distribution` {#MultivariateNormalDiagTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.dtype` {#MultivariateNormalDiagTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.entropy(name='entropy')` {#MultivariateNormalDiagTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.graph` {#MultivariateNormalDiagTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.input_dict` {#MultivariateNormalDiagTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.loss(final_loss, name='Loss')` {#MultivariateNormalDiagTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.mean(name='mean')` {#MultivariateNormalDiagTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.name` {#MultivariateNormalDiagTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.value(name='value')` {#MultivariateNormalDiagTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagTensor.value_type` {#MultivariateNormalDiagTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.md deleted file mode 100644 index 9e831a2b508..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`MultivariateNormalDiagWithSoftplusStDevTensor` is a `StochasticTensor` backed by the distribution `MultivariateNormalDiagWithSoftplusStDev`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MultivariateNormalDiagWithSoftplusStDevTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.clone(name=None, **dist_args)` {#MultivariateNormalDiagWithSoftplusStDevTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.distribution` {#MultivariateNormalDiagWithSoftplusStDevTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.dtype` {#MultivariateNormalDiagWithSoftplusStDevTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.entropy(name='entropy')` {#MultivariateNormalDiagWithSoftplusStDevTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.graph` {#MultivariateNormalDiagWithSoftplusStDevTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.input_dict` {#MultivariateNormalDiagWithSoftplusStDevTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.loss(final_loss, name='Loss')` {#MultivariateNormalDiagWithSoftplusStDevTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.mean(name='mean')` {#MultivariateNormalDiagWithSoftplusStDevTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.name` {#MultivariateNormalDiagWithSoftplusStDevTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.value(name='value')` {#MultivariateNormalDiagWithSoftplusStDevTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalDiagWithSoftplusStDevTensor.value_type` {#MultivariateNormalDiagWithSoftplusStDevTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.md deleted file mode 100644 index fdf5e0f7f6e..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`PoissonTensor` is a `StochasticTensor` backed by the distribution `Poisson`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#PoissonTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.clone(name=None, **dist_args)` {#PoissonTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.distribution` {#PoissonTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.dtype` {#PoissonTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.entropy(name='entropy')` {#PoissonTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.graph` {#PoissonTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.input_dict` {#PoissonTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.loss(final_loss, name='Loss')` {#PoissonTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.mean(name='mean')` {#PoissonTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.name` {#PoissonTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.value(name='value')` {#PoissonTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.PoissonTensor.value_type` {#PoissonTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.md deleted file mode 100644 index 460980870ba..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`WishartFullTensor` is a `StochasticTensor` backed by the distribution `WishartFull`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#WishartFullTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.clone(name=None, **dist_args)` {#WishartFullTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.distribution` {#WishartFullTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.dtype` {#WishartFullTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.entropy(name='entropy')` {#WishartFullTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.graph` {#WishartFullTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.input_dict` {#WishartFullTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.loss(final_loss, name='Loss')` {#WishartFullTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.mean(name='mean')` {#WishartFullTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.name` {#WishartFullTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.value(name='value')` {#WishartFullTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartFullTensor.value_type` {#WishartFullTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.metrics.streaming_auc.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.metrics.streaming_auc.md index 8912eee3d40..aba3101a9f7 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.metrics.streaming_auc.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.contrib.metrics.streaming_auc.md @@ -14,7 +14,12 @@ This value is ultimately returned as `auc`, an idempotent operation that computes the area under a discretized curve of precision versus recall values (computed using the aforementioned variables). The `num_thresholds` variable controls the degree of discretization with larger numbers of thresholds more -closely approximating the true AUC. +closely approximating the true AUC. The quality of the approximation may vary +dramatically depending on `num_thresholds`. + +For best results, `predictions` should be distributed approximately uniformly +in the range [0, 1] and not peaked around 0 or 1. The quality of the AUC +approximation may be poor if this is not the case. For estimation of the metric over a stream of data, the function creates an `update_op` operation that updates these variables and returns the `auc`. diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.global_variables_initializer.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.global_variables_initializer.md new file mode 100644 index 00000000000..b1ebdcc3270 --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.global_variables_initializer.md @@ -0,0 +1,10 @@ +### `tf.global_variables_initializer()` {#global_variables_initializer} + +Returns an Op that initializes global variables. + +This is just a shortcut for `variables_initializer(global_variables())` + +##### Returns: + + An Op that initializes global variables in the graph.
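As a migration note for the renamed initializer documented above, here is a minimal usage sketch; the two variables `w` and `b` are illustrative, not part of the original docs:

```python
import tensorflow as tf

# Two illustrative variables; both land in GraphKeys.GLOBAL_VARIABLES.
w = tf.Variable(tf.zeros([2, 2]), name="w")
b = tf.Variable(tf.zeros([2]), name="b")

init_op = tf.global_variables_initializer()  # replaces tf.initialize_all_variables()

with tf.Session() as sess:
    sess.run(init_op)   # runs all collected initializers in parallel
    print(sess.run(b))  # -> [0., 0.]
```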
+ diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.initialize_all_variables.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.initialize_all_variables.md index 9a0e5d8261b..ec240fc6088 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.initialize_all_variables.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.initialize_all_variables.md @@ -1,10 +1,8 @@ -### `tf.initialize_all_variables()` {#initialize_all_variables} +### `tf.initialize_all_variables(*args, **kwargs)` {#initialize_all_variables} -Returns an Op that initializes all variables. +See `tf.global_variables_initializer`. (deprecated) -This is just a shortcut for `initialize_variables(all_variables())` - -##### Returns: - - An Op that initializes all variables in the graph. +THIS FUNCTION IS DEPRECATED. It will be removed after 2017-03-02. +Instructions for updating: +Use `tf.global_variables_initializer` instead. diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.initialize_local_variables.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.initialize_local_variables.md index 2a56dbb9d69..a6c1395e918 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.initialize_local_variables.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.initialize_local_variables.md @@ -1,10 +1,8 @@ -### `tf.initialize_local_variables()` {#initialize_local_variables} +### `tf.initialize_local_variables(*args, **kwargs)` {#initialize_local_variables} -Returns an Op that initializes all local variables. +See `tf.local_variables_initializer`. (deprecated) -This is just a shortcut for `initialize_variables(local_variables())` - -##### Returns: - - An Op that initializes all local variables in the graph. +THIS FUNCTION IS DEPRECATED. It will be removed after 2017-03-02. +Instructions for updating: +Use `tf.local_variables_initializer` instead. diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.local_variables_initializer.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.local_variables_initializer.md new file mode 100644 index 00000000000..3f726bdf7ad --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.local_variables_initializer.md @@ -0,0 +1,10 @@ +### `tf.local_variables_initializer()` {#local_variables_initializer} + +Returns an Op that initializes all local variables. + +This is just a shortcut for `variables_initializer(local_variables())` + +##### Returns: + + An Op that initializes all local variables in the graph. + diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.report_uninitialized_variables.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.report_uninitialized_variables.md index 59c1394a4aa..e3ecdf7733b 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.report_uninitialized_variables.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.report_uninitialized_variables.md @@ -9,7 +9,7 @@ variables if there are any, or an empty array if there are none. * `var_list`: List of `Variable` objects to check. Defaults to the - value of `all_variables() + local_variables()` + value of `global_variables() + local_variables()` * `name`: Optional name of the `Operation`.
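A minimal sketch of how `tf.report_uninitialized_variables` behaves around initialization; the variable name is illustrative:

```python
import tensorflow as tf

v = tf.Variable(tf.ones([3]), name="v")  # illustrative variable

with tf.Session() as sess:
    # Before initialization the variable's name is reported...
    print(sess.run(tf.report_uninitialized_variables()))  # e.g. ['v']
    sess.run(tf.global_variables_initializer())
    # ...afterwards the report is an empty array.
    print(sess.run(tf.report_uninitialized_variables()))  # []
```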
##### Returns: diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.scatter_nd_sub.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.scatter_nd_sub.md new file mode 100644 index 00000000000..c64e3793754 --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.scatter_nd_sub.md @@ -0,0 +1,52 @@ +### `tf.scatter_nd_sub(ref, indices, updates, use_locking=None, name=None)` {#scatter_nd_sub} + +Applies sparse subtraction between `updates` and individual values or slices within a given variable according to `indices`. + +`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`. + +`indices` must be an integer tensor, containing indices into `ref`. +It must be of shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`. + +The innermost dimension of `indices` (with length `K`) corresponds to +indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th +dimension of `ref`. + +`updates` is a `Tensor` of rank `Q-1+P-K` with shape: + +``` +[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]]. +``` + +For example, say we want to subtract 4 scattered elements from a rank-1 tensor with 8 elements. In Python, that subtraction would look like this: + ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8]) + indices = tf.constant([[4], [3], [1], [7]]) + updates = tf.constant([9, 10, 11, 12]) + sub = tf.scatter_nd_sub(ref, indices, updates) + with tf.Session() as sess: + print sess.run(sub) + +The resulting update to ref would look like this: + + [1, -9, 3, -6, -4, 6, 7, -4] + +See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices. + +##### Args: + + +* `ref`: A mutable `Tensor`. Must be one of the following types: `float32`, `float64`, `int64`, `int32`, `uint8`, `uint16`, `int16`, `int8`, `complex64`, `complex128`, `qint8`, `quint8`, `qint32`, `half`. + Should be from a `Variable` node. +* `indices`: A `Tensor`. Must be one of the following types: `int32`, `int64`. + A tensor of indices into `ref`. +* `updates`: A `Tensor`. Must have the same type as `ref`. + A tensor of updated values to subtract from `ref`. +* `use_locking`: An optional `bool`. Defaults to `False`. + If `True`, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention. +* `name`: A name for the operation (optional). + +##### Returns: + + A mutable `Tensor`. Has the same type as `ref`. + Same as `ref`. Returned as a convenience for operations that want to use the updated values after the update is done. + diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.variables_initializer.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.variables_initializer.md new file mode 100644 index 00000000000..ec779e79f66 --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard2/tf.variables_initializer.md @@ -0,0 +1,24 @@ +### `tf.variables_initializer(var_list, name='init')` {#variables_initializer} + +Returns an Op that initializes a list of variables. + +After you launch the graph in a session, you can run the returned Op to +initialize all the variables in `var_list`. This Op runs all the +initializers of the variables in `var_list` in parallel. + +Calling `variables_initializer()` is equivalent to passing the list of +initializers to `Group()`.
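To make the `Group()` equivalence above concrete, here is a small sketch; the variables are illustrative, and `tf.group` is the public spelling of the grouping op:

```python
import tensorflow as tf

v1 = tf.Variable(tf.zeros([2]), name="v1")
v2 = tf.Variable(tf.ones([2]), name="v2")

# These two ops do the same work: run both initializers, in parallel.
init_a = tf.variables_initializer([v1, v2])
init_b = tf.group(v1.initializer, v2.initializer)

with tf.Session() as sess:
    sess.run(init_a)  # sess.run(init_b) would be equivalent
```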
+ +If `var_list` is empty, however, the function still returns an Op that can +be run. That Op just has no effect. + +##### Args: + + +* `var_list`: List of `Variable` objects to initialize. +* `name`: Optional name for the returned operation. + +##### Returns: + + An Op that run the initializers of all the specified variables. + diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.SparseTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.SparseTensor.md index 4bead96bc9d..d89b4e70c4c 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.SparseTensor.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.SparseTensor.md @@ -73,6 +73,17 @@ Creates a `SparseTensor`. A `SparseTensor` +- - - + +#### `tf.SparseTensor.get_shape()` {#SparseTensor.get_shape} + +Get the `TensorShape` that represents the shape of the dense tensor. + +##### Returns: + + A `TensorShape` object. + + - - - #### `tf.SparseTensor.indices` {#SparseTensor.indices} diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.md deleted file mode 100644 index 3280f5a9448..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`MixtureTensor` is a `StochasticTensor` backed by the distribution `Mixture`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MixtureTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.clone(name=None, **dist_args)` {#MixtureTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.distribution` {#MixtureTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.dtype` {#MixtureTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.entropy(name='entropy')` {#MixtureTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.graph` {#MixtureTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.input_dict` {#MixtureTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.loss(final_loss, name='Loss')` {#MixtureTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.mean(name='mean')` {#MixtureTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.name` {#MixtureTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.value(name='value')` {#MixtureTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MixtureTensor.value_type` {#MixtureTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.md deleted file mode 100644 index 3f29186182b..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.md +++ 
/dev/null @@ -1,85 +0,0 @@ -`MultivariateNormalCholeskyTensor` is a `StochasticTensor` backed by the distribution `MultivariateNormalCholesky`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MultivariateNormalCholeskyTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.clone(name=None, **dist_args)` {#MultivariateNormalCholeskyTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.distribution` {#MultivariateNormalCholeskyTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.dtype` {#MultivariateNormalCholeskyTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.entropy(name='entropy')` {#MultivariateNormalCholeskyTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.graph` {#MultivariateNormalCholeskyTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.input_dict` {#MultivariateNormalCholeskyTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.loss(final_loss, name='Loss')` {#MultivariateNormalCholeskyTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.mean(name='mean')` {#MultivariateNormalCholeskyTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.name` {#MultivariateNormalCholeskyTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.value(name='value')` {#MultivariateNormalCholeskyTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalCholeskyTensor.value_type` {#MultivariateNormalCholeskyTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.md deleted file mode 100644 index 60976c962bb..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`NormalWithSoftplusSigmaTensor` is a `StochasticTensor` backed by the distribution `NormalWithSoftplusSigma`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#NormalWithSoftplusSigmaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.clone(name=None, **dist_args)` {#NormalWithSoftplusSigmaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.distribution` {#NormalWithSoftplusSigmaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.dtype` {#NormalWithSoftplusSigmaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.entropy(name='entropy')` {#NormalWithSoftplusSigmaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.graph` {#NormalWithSoftplusSigmaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.input_dict` {#NormalWithSoftplusSigmaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.loss(final_loss, name='Loss')` {#NormalWithSoftplusSigmaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.mean(name='mean')` {#NormalWithSoftplusSigmaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.name` {#NormalWithSoftplusSigmaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.value(name='value')` {#NormalWithSoftplusSigmaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalWithSoftplusSigmaTensor.value_type` {#NormalWithSoftplusSigmaTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.fake_quant_with_min_max_vars.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.fake_quant_with_min_max_vars.md new file mode 100644 index 00000000000..d7815f04146 --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.fake_quant_with_min_max_vars.md @@ -0,0 +1,25 @@ +### `tf.fake_quant_with_min_max_vars(inputs, min, max, name=None)` {#fake_quant_with_min_max_vars} + +Fake-quantize the 'inputs' tensor of type float and shape `[b, h, w, d]` via + +global float scalars `min` and `max` to 'outputs' tensor of same shape as +`inputs`. + +[min; max] is the clamping range for the 'inputs' data. Op divides this range +into 255 steps (total of 256 values), then replaces each 'inputs' value with the +closest of the quantized step values. + +This operation has a gradient and thus allows for training `min` and `max` values. + +##### Args: + + +* `inputs`: A `Tensor` of type `float32`. +* `min`: A `Tensor` of type `float32`. +* `max`: A `Tensor` of type `float32`. +* `name`: A name for the operation (optional). + +##### Returns: + + A `Tensor` of type `float32`. 
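A minimal sketch of the fake-quantization op on a `[b, h, w, d]`-shaped input, assuming the 256-step behavior described above; the input values and the range variables are illustrative:

```python
import tensorflow as tf

# A 1x1x1x4 activation tensor and a trainable clamping range [0, 1].
inputs = tf.constant([[[[0.0, 0.3, 0.52, 1.0]]]])
min_var = tf.Variable(0.0)
max_var = tf.Variable(1.0)

outputs = tf.fake_quant_with_min_max_vars(inputs, min_var, max_var)

with tf.Session() as sess:
    sess.run(tf.global_variables_initializer())
    # Each value is snapped to the nearest of 256 steps spanning [min, max].
    print(sess.run(outputs))
```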
+ diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.fake_quant_with_min_max_vars_per_channel.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.fake_quant_with_min_max_vars_per_channel.md new file mode 100644 index 00000000000..bc39cf9570a --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.fake_quant_with_min_max_vars_per_channel.md @@ -0,0 +1,25 @@ +### `tf.fake_quant_with_min_max_vars_per_channel(inputs, min, max, name=None)` {#fake_quant_with_min_max_vars_per_channel} + +Fake-quantize the 'inputs' tensor of type float, having one of the shapes `[d]`, +`[b, d]`, or `[b, h, w, d]`, via per-channel floats `min` and `max` of shape `[d]` +to an 'outputs' tensor of the same shape as `inputs`. + +[min; max] is the clamping range for the 'inputs' data in the corresponding +depth channel. The op divides this range into 255 steps (a total of 256 values), then +replaces each 'inputs' value with the closest of the quantized step values. + +This operation has a gradient and thus allows for training the `min` and `max` values. + +##### Args: + + +* `inputs`: A `Tensor` of type `float32`. +* `min`: A `Tensor` of type `float32`. +* `max`: A `Tensor` of type `float32`. +* `name`: A name for the operation (optional). + +##### Returns: + + A `Tensor` of type `float32`. + diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.global_variables.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.global_variables.md new file mode 100644 index 00000000000..1939f422248 --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.global_variables.md @@ -0,0 +1,17 @@ +### `tf.global_variables()` {#global_variables} + +Returns global variables. + +Global variables are variables that are shared across machines in a +distributed environment. The `Variable()` constructor or `get_variable()` +automatically adds new variables to the graph collection +`GraphKeys.GLOBAL_VARIABLES`. +This convenience function returns the contents of that collection. + +An alternative to global variables is local variables. See +[`tf.local_variables()`](../../api_docs/python/state_ops.md#local_variables) + +##### Returns: + + A list of `Variable` objects. + diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.local_variables.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.local_variables.md index b3612c7cbf3..26b4d127af5 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.local_variables.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.local_variables.md @@ -1,8 +1,19 @@ ### `tf.local_variables()` {#local_variables} -Returns all variables created with collection=[LOCAL_VARIABLES]. +Returns local variables. + +Local variables are per-process variables, usually not saved or restored to +checkpoint, and used for temporary or intermediate values. +For example, they can be used as counters for metrics computation or for the +number of epochs this machine has read data. +The `local_variable()` helper automatically adds a new variable to +`GraphKeys.LOCAL_VARIABLES`. +This convenience function returns the contents of that collection. + +An alternative to local variables is global variables. See +[`tf.global_variables()`](../../api_docs/python/state_ops.md#global_variables) ##### Returns: - A list of local Variable objects. + A list of local `Variable` objects.
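The global/local collection split described above can be seen directly; a sketch with illustrative variable names, assuming `tf.GraphKeys.LOCAL_VARIABLES` as the target collection:

```python
import tensorflow as tf

step = tf.Variable(0, name="step")  # default: GraphKeys.GLOBAL_VARIABLES
epochs = tf.Variable(0, name="epochs_read",
                     collections=[tf.GraphKeys.LOCAL_VARIABLES])

print([v.op.name for v in tf.global_variables()])  # ['step']
print([v.op.name for v in tf.local_variables()])   # ['epochs_read']

# Each collection has its own initializer shortcut.
init = tf.group(tf.global_variables_initializer(),
                tf.local_variables_initializer())
```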
diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.scatter_nd_add.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.scatter_nd_add.md new file mode 100644 index 00000000000..59eb4dcb020 --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.scatter_nd_add.md @@ -0,0 +1,52 @@ +### `tf.scatter_nd_add(ref, indices, updates, use_locking=None, name=None)` {#scatter_nd_add} + +Applies sparse addition between `updates` and individual values or slices within a given variable according to `indices`. + +`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`. + +`indices` must be an integer tensor, containing indices into `ref`. +It must be of shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`. + +The innermost dimension of `indices` (with length `K`) corresponds to +indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th +dimension of `ref`. + +`updates` is a `Tensor` of rank `Q-1+P-K` with shape: + +``` +[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]]. +``` + +For example, say we want to add 4 scattered elements to a rank-1 tensor with 8 elements. In Python, that addition would look like this: + ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8]) + indices = tf.constant([[4], [3], [1], [7]]) + updates = tf.constant([9, 10, 11, 12]) + add = tf.scatter_nd_add(ref, indices, updates) + with tf.Session() as sess: + print sess.run(add) + +The resulting update to ref would look like this: + + [1, 13, 3, 14, 14, 6, 7, 20] + +See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices. + +##### Args: + + +* `ref`: A mutable `Tensor`. Must be one of the following types: `float32`, `float64`, `int64`, `int32`, `uint8`, `uint16`, `int16`, `int8`, `complex64`, `complex128`, `qint8`, `quint8`, `qint32`, `half`. + Should be from a `Variable` node. +* `indices`: A `Tensor`. Must be one of the following types: `int32`, `int64`. + A tensor of indices into `ref`. +* `updates`: A `Tensor`. Must have the same type as `ref`. + A tensor of updated values to add to `ref`. +* `use_locking`: An optional `bool`. Defaults to `False`. + If `True`, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention. +* `name`: A name for the operation (optional). + +##### Returns: + + A mutable `Tensor`. Has the same type as `ref`. + Same as `ref`. Returned as a convenience for operations that want to use the updated values after the update is done. + diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.scatter_nd_div.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.scatter_nd_div.md new file mode 100644 index 00000000000..803dcbdb820 --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.scatter_nd_div.md @@ -0,0 +1,52 @@ +### `tf.scatter_nd_div(ref, indices, updates, use_locking=None, name=None)` {#scatter_nd_div} + +Applies sparse division between `updates` and individual values or slices within a given variable according to `indices`. + +`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`. + +`indices` must be an integer tensor, containing indices into `ref`. +It must be of shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.
+ +The innermost dimension of `indices` (with length `K`) corresponds to +indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th +dimension of `ref`. + +`updates` is a `Tensor` of rank `Q-1+P-K` with shape: + +``` +[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]]. +``` + +For example, say we want to divide a rank-1 tensor with 8 elements by 4 scattered elements. In Python, that division would look like this: + ref = tf.Variable([10, 20, 30, 40, 50, 60, 70, 80]) + indices = tf.constant([[4], [3], [1], [7]]) + updates = tf.constant([2, 3, 4, 5]) + div = tf.scatter_nd_div(ref, indices, updates) + with tf.Session() as sess: + print sess.run(div) + +The resulting update to ref would look like this: + + [10, 5, 30, 13, 25, 60, 70, 16] + +See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices. + +##### Args: + + +* `ref`: A mutable `Tensor`. Must be one of the following types: `float32`, `float64`, `int64`, `int32`, `uint8`, `uint16`, `int16`, `int8`, `complex64`, `complex128`, `qint8`, `quint8`, `qint32`, `half`. + Should be from a `Variable` node. +* `indices`: A `Tensor`. Must be one of the following types: `int32`, `int64`. + A tensor of indices into `ref`. +* `updates`: A `Tensor`. Must have the same type as `ref`. + A tensor of values to divide `ref` by. +* `use_locking`: An optional `bool`. Defaults to `False`. + If `True`, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention. +* `name`: A name for the operation (optional). + +##### Returns: + + A mutable `Tensor`. Has the same type as `ref`. + Same as `ref`. Returned as a convenience for operations that want to use the updated values after the update is done. + diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.svd.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.svd.md index a11df39a136..b985bd7e581 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.svd.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard3/tf.svd.md @@ -1,4 +1,4 @@ -### `tf.svd(tensor, compute_uv=True, full_matrices=False, name=None)` {#svd} +### `tf.svd(tensor, full_matrices=False, compute_uv=True, name=None)` {#svd} Computes the singular value decompositions of one or more matrices. @@ -20,12 +20,12 @@ s = svd(a, compute_uv=False) * `matrix`: `Tensor` of shape `[..., M, N]`. Let `P` be the minimum of `M` and `N`. -* `compute_uv`: If `True` then left and right singular vectors will be - computed and returned in `u` and `v`, respectively. Otherwise, only the - singular values will be computed, which can be significantly faster. * `full_matrices`: If true, compute full-sized `u` and `v`. If false (the default), compute only the leading `P` singular vectors. Ignored if `compute_uv` is `False`. +* `compute_uv`: If `True` then left and right singular vectors will be + computed and returned in `u` and `v`, respectively. Otherwise, only the + singular values will be computed, which can be significantly faster. * `name`: string, optional name of the operation.
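Because this change reorders the positional arguments of `tf.svd`, call sites are safest passing the flags by keyword; a short sketch with an illustrative matrix:

```python
import tensorflow as tf

a = tf.random_normal([5, 3])  # illustrative [M, N] matrix

# Keyword arguments stay correct across the argument reorder.
s = tf.svd(a, compute_uv=False)            # singular values only (faster)
s2, u, v = tf.svd(a, full_matrices=False)  # values plus leading singular vectors
```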
##### Returns: diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.md deleted file mode 100644 index df77e8c03a6..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`BinomialTensor` is a `StochasticTensor` backed by the distribution `Binomial`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#BinomialTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.clone(name=None, **dist_args)` {#BinomialTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.distribution` {#BinomialTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.dtype` {#BinomialTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.entropy(name='entropy')` {#BinomialTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.graph` {#BinomialTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.input_dict` {#BinomialTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.loss(final_loss, name='Loss')` {#BinomialTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.mean(name='mean')` {#BinomialTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.name` {#BinomialTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.value(name='value')` {#BinomialTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BinomialTensor.value_type` {#BinomialTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.md deleted file mode 100644 index 233ece8e1fe..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`DirichletMultinomialTensor` is a `StochasticTensor` backed by the distribution `DirichletMultinomial`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#DirichletMultinomialTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.clone(name=None, **dist_args)` {#DirichletMultinomialTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.distribution` {#DirichletMultinomialTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.dtype` {#DirichletMultinomialTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.entropy(name='entropy')` {#DirichletMultinomialTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.graph` {#DirichletMultinomialTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.input_dict` {#DirichletMultinomialTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.loss(final_loss, name='Loss')` {#DirichletMultinomialTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.mean(name='mean')` {#DirichletMultinomialTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.name` {#DirichletMultinomialTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.value(name='value')` {#DirichletMultinomialTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletMultinomialTensor.value_type` {#DirichletMultinomialTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.md deleted file mode 100644 index bbc0f007b4e..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`InverseGammaTensor` is a `StochasticTensor` backed by the distribution `InverseGamma`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#InverseGammaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.clone(name=None, **dist_args)` {#InverseGammaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.distribution` {#InverseGammaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.dtype` {#InverseGammaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.entropy(name='entropy')` {#InverseGammaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.graph` {#InverseGammaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.input_dict` {#InverseGammaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.loss(final_loss, name='Loss')` {#InverseGammaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.mean(name='mean')` {#InverseGammaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.name` {#InverseGammaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.value(name='value')` {#InverseGammaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaTensor.value_type` {#InverseGammaTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.md index d92f209f877..71d1af5add2 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.md @@ -1,14 +1,14 @@ StochasticTensor is a BaseStochasticTensor backed by a distribution. - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.__init__(dist_cls, name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#StochasticTensor.__init__} +#### `tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.__init__(dist, name='StochasticTensor', dist_value_type=None, loss_fn=score_function)` {#StochasticTensor.__init__} Construct a `StochasticTensor`. -`StochasticTensor` will instantiate a distribution from `dist_cls` and -`dist_args` and its `value` method will return the same value each time -it is called. What `value` is returned is controlled by the -`dist_value_type` (defaults to `SampleAndReshapeValue`). +`StochasticTensor` is backed by the `dist` distribution and its `value` +method will return the same value each time it is called. What `value` is +returned is controlled by the `dist_value_type` (defaults to +`SampleAndReshapeValue`). Some distributions' sample functions are not differentiable (e.g. a sample from a discrete distribution like a Bernoulli) and so to differentiate @@ -26,34 +26,26 @@ reparameterized distributions; it will also return None if the value type is ##### Args: -* `dist_cls`: a `Distribution` class. +* `dist`: an instance of `Distribution`. * `name`: a name for this `StochasticTensor` and its ops. 
* `dist_value_type`: a `_StochasticValueType`, which will determine what the `value` of this `StochasticTensor` will be. If not provided, the value type set with the `value_type` context manager will be used. -* `loss_fn`: callable that takes `(st, st.value(), influenced_loss)`, where +* `loss_fn`: callable that takes + `(st, st.value(), influenced_loss)`, where `st` is this `StochasticTensor`, and returns a `Tensor` loss. By default, `loss_fn` is the `score_function`, or more precisely, the integral of the score function, such that when the gradient is taken, the score function results. See the `stochastic_gradient_estimators` module for additional loss functions and baselines. -* `**dist_args`: keyword arguments to be passed through to `dist_cls` on - construction. ##### Raises: -* `TypeError`: if `dist_cls` is not a `Distribution`. +* `TypeError`: if `dist` is not an instance of `Distribution`. * `TypeError`: if `loss_fn` is not `callable`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.clone(name=None, **dist_args)` {#StochasticTensor.clone} - - - - - - - #### `tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.distribution` {#StochasticTensor.distribution} @@ -82,13 +74,6 @@ reparameterized distributions; it will also return None if the value type is -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.input_dict` {#StochasticTensor.input_dict} - - - - - - - #### `tf.contrib.bayesflow.stochastic_tensor.StochasticTensor.loss(final_loss, name='Loss')` {#StochasticTensor.loss} diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.md deleted file mode 100644 index 855391fdcfa..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`beta_aaTensor` is a `StochasticTensor` backed by the distribution `beta_aa`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#beta_aaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.clone(name=None, **dist_args)` {#beta_aaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.distribution` {#beta_aaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.dtype` {#beta_aaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.entropy(name='entropy')` {#beta_aaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.graph` {#beta_aaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.input_dict` {#beta_aaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.loss(final_loss, name='Loss')` {#beta_aaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.mean(name='mean')` {#beta_aaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.name` {#beta_aaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.value(name='value')` {#beta_aaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_aaTensor.value_type` {#beta_aaTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.initialize_variables.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.initialize_variables.md index 8941ab48535..3ab51c4b3c6 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.initialize_variables.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.initialize_variables.md @@ -1,24 +1,8 @@ -### `tf.initialize_variables(var_list, name='init')` {#initialize_variables} +### `tf.initialize_variables(*args, **kwargs)` {#initialize_variables} -Returns an Op that initializes a list of variables. +See `tf.variables_initializer`. (deprecated) -After you launch the graph in a session, you can run the returned Op to -initialize all the variables in `var_list`. This Op runs all the -initializers of the variables in `var_list` in parallel. - -Calling `initialize_variables()` is equivalent to passing the list of -initializers to `Group()`. - -If `var_list` is empty, however, the function still returns an Op that can -be run. That Op just has no effect. - -##### Args: - - -* `var_list`: List of `Variable` objects to initialize. -* `name`: Optional name for the returned operation. - -##### Returns: - - An Op that run the initializers of all the specified variables. +THIS FUNCTION IS DEPRECATED. It will be removed after 2017-03-02. +Instructions for updating: +Use `tf.variables_initializer` instead. diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.python_io.TFRecordCompressionType.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.python_io.TFRecordCompressionType.md new file mode 100644 index 00000000000..8b9cbe04451 --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard4/tf.python_io.TFRecordCompressionType.md @@ -0,0 +1 @@ +The type of compression for the record. 
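For context, the compression type is consumed through `TFRecordOptions` when writing or reading record files; a sketch, assuming the `GZIP` member and the `options` keyword as in contemporaneous TensorFlow releases (the path and payload are illustrative):

```python
import tensorflow as tf

options = tf.python_io.TFRecordOptions(
    tf.python_io.TFRecordCompressionType.GZIP)

# Write one gzip-compressed record.
writer = tf.python_io.TFRecordWriter("/tmp/example.tfrecord.gz", options=options)
writer.write(b"serialized-example-bytes")
writer.close()
```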
diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.md deleted file mode 100644 index b4e5a7b8d88..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`BernoulliWithSigmoidPTensor` is a `StochasticTensor` backed by the distribution `BernoulliWithSigmoidP`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#BernoulliWithSigmoidPTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.clone(name=None, **dist_args)` {#BernoulliWithSigmoidPTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.distribution` {#BernoulliWithSigmoidPTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.dtype` {#BernoulliWithSigmoidPTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.entropy(name='entropy')` {#BernoulliWithSigmoidPTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.graph` {#BernoulliWithSigmoidPTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.input_dict` {#BernoulliWithSigmoidPTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.loss(final_loss, name='Loss')` {#BernoulliWithSigmoidPTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.mean(name='mean')` {#BernoulliWithSigmoidPTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.name` {#BernoulliWithSigmoidPTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.value(name='value')` {#BernoulliWithSigmoidPTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliWithSigmoidPTensor.value_type` {#BernoulliWithSigmoidPTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.md deleted file mode 100644 index 0e3bf1e8af4..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`Chi2Tensor` is a `StochasticTensor` backed by the distribution `Chi2`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#Chi2Tensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.clone(name=None, **dist_args)` {#Chi2Tensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.distribution` {#Chi2Tensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.dtype` {#Chi2Tensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.entropy(name='entropy')` {#Chi2Tensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.graph` {#Chi2Tensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.input_dict` {#Chi2Tensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.loss(final_loss, name='Loss')` {#Chi2Tensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.mean(name='mean')` {#Chi2Tensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.name` {#Chi2Tensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.value(name='value')` {#Chi2Tensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2Tensor.value_type` {#Chi2Tensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.md deleted file mode 100644 index 6647401eca6..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`LaplaceTensor` is a `StochasticTensor` backed by the distribution `Laplace`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#LaplaceTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.clone(name=None, **dist_args)` {#LaplaceTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.distribution` {#LaplaceTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.dtype` {#LaplaceTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.entropy(name='entropy')` {#LaplaceTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.graph` {#LaplaceTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.input_dict` {#LaplaceTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.loss(final_loss, name='Loss')` {#LaplaceTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.mean(name='mean')` {#LaplaceTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.name` {#LaplaceTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.value(name='value')` {#LaplaceTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.LaplaceTensor.value_type` {#LaplaceTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.scatter_nd.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.scatter_nd.md new file mode 100644 index 00000000000..c169dab876f --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.scatter_nd.md @@ -0,0 +1,83 @@ +### `tf.scatter_nd(indices, updates, shape, name=None)` {#scatter_nd} + +Creates a new tensor by applying sparse `updates` to individual values or slices within a zero tensor of the given `shape` tensor according to indices. + +This operator is the inverse of the [tf.gather_nd](#gather_nd) operator which extracts values or slices from a given tensor. + +TODO(simister): Add a link to Variable.__getitem__ documentation on slice syntax. + +`shape` is a `TensorShape` with rank `P` and `indices` is a `Tensor` of rank `Q`. + +`indices` must be integer tensor, containing indices into `shape`. +It must be shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`. + +The innermost dimension of `indices` (with length `K`) corresponds to +indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th +dimension of `shape`. + +`updates` is Tensor of rank `Q-1+P-K` with shape: + +``` +[d_0, ..., d_{Q-2}, shape[K], ..., shape[P-1]]. +``` + +The simplest form of scatter is to insert individual elements in a tensor by index. For example, say we want to insert 4 scattered elements in a rank-1 tensor with 8 elements. + +
+ +
+ +In Python, this scatter operation would look like this: + + indices = tf.constant([[4], [3], [1], [7]]) + updates = tf.constant([9, 10, 11, 12]) + shape = tf.constant([8]) + scatter = tf.scatter_nd(indices, updates, shape) + with tf.Session() as sess: + print sess.run(scatter) + +The resulting tensor would look like this: + + [0, 11, 0, 10, 9, 0, 0, 12] + +We can also insert entire slices of a higher-rank tensor all at once. For example, we can insert two slices in the first dimension of a rank-3 tensor with two matrices of new values. + +
+ +
+ +In Python, this scatter operation would look like this: + + indices = tf.constant([[0], [2]]) + updates = tf.constant([[[5, 5, 5, 5], [6, 6, 6, 6], + [7, 7, 7, 7], [8, 8, 8, 8]], + [[5, 5, 5, 5], [6, 6, 6, 6], + [7, 7, 7, 7], [8, 8, 8, 8]]]) + shape = tf.constant([4, 4, 4]) + scatter = tf.scatter_nd(indices, updates, shape) + with tf.Session() as sess: + print sess.run(scatter) + +The resulting tensor would look like this: + + [[[5, 5, 5, 5], [6, 6, 6, 6], [7, 7, 7, 7], [8, 8, 8, 8]], + [[0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0]], + [[5, 5, 5, 5], [6, 6, 6, 6], [7, 7, 7, 7], [8, 8, 8, 8]], + [[0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0], [0, 0, 0, 0]]] + +##### Args: + + +* `indices`: A `Tensor`. Must be one of the following types: `int32`, `int64`. + A Tensor. Must be one of the following types: int32, int64. A tensor of indices into ref. +* `updates`: A `Tensor`. + A Tensor. Must have the same type as tensor. A tensor of updated values to store in ref. +* `shape`: A `Tensor`. Must have the same type as `indices`. + A vector. The shape of the resulting tensor. +* `name`: A name for the operation (optional). + +##### Returns: + + A `Tensor`. Has the same type as `updates`. + A new tensor with the given shape and updates applied according to the indices. + diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.sparse_maximum.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.sparse_maximum.md index b934c3b1cdb..2f2759f2c64 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.sparse_maximum.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.sparse_maximum.md @@ -6,8 +6,8 @@ Assumes the two SparseTensors have the same shape, i.e., no broadcasting. Example: ```python -sp_zero = ops.SparseTensor([[0]], [0], [7]) -sp_one = ops.SparseTensor([[1]], [1], [7]) +sp_zero = sparse_tensor.SparseTensor([[0]], [0], [7]) +sp_one = sparse_tensor.SparseTensor([[1]], [1], [7]) res = tf.sparse_maximum(sp_zero, sp_one).eval() # "res" should be equal to SparseTensor([[0], [1]], [0, 1], [7]). ``` diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.train.Saver.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.train.Saver.md index 8ce093840f0..cacfed94d2e 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.train.Saver.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard5/tf.train.Saver.md @@ -305,7 +305,7 @@ Builds saver_def. - - - -#### `tf.train.Saver.export_meta_graph(filename=None, collection_list=None, as_text=False, export_scope=None)` {#Saver.export_meta_graph} +#### `tf.train.Saver.export_meta_graph(filename=None, collection_list=None, as_text=False, export_scope=None, clear_devices=False)` {#Saver.export_meta_graph} Writes `MetaGraphDef` to save_path/filename. @@ -316,6 +316,8 @@ Writes `MetaGraphDef` to save_path/filename. * `collection_list`: List of string keys to collect. * `as_text`: If `True`, writes the meta_graph as an ASCII proto. * `export_scope`: Optional `string`. Name scope to remove. +* `clear_devices`: Whether or not to clear the device field for an `Operation` + or `Tensor` during export. 
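A sketch of the new `clear_devices` flag in use; the path and the variable are illustrative:

```python
import tensorflow as tf

v = tf.Variable(1, name="v")  # illustrative variable so Saver has state to track
saver = tf.train.Saver()

with tf.Session() as sess:
    sess.run(tf.global_variables_initializer())
    # Strip device placements so the graph can be re-imported anywhere.
    saver.export_meta_graph("/tmp/model.meta", clear_devices=True)
```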
##### Returns: diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.md deleted file mode 100644 index cf1bd14d49a..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`ExponentialWithSoftplusLamTensor` is a `StochasticTensor` backed by the distribution `ExponentialWithSoftplusLam`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#ExponentialWithSoftplusLamTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.clone(name=None, **dist_args)` {#ExponentialWithSoftplusLamTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.distribution` {#ExponentialWithSoftplusLamTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.dtype` {#ExponentialWithSoftplusLamTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.entropy(name='entropy')` {#ExponentialWithSoftplusLamTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.graph` {#ExponentialWithSoftplusLamTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.input_dict` {#ExponentialWithSoftplusLamTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.loss(final_loss, name='Loss')` {#ExponentialWithSoftplusLamTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.mean(name='mean')` {#ExponentialWithSoftplusLamTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.name` {#ExponentialWithSoftplusLamTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.value(name='value')` {#ExponentialWithSoftplusLamTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialWithSoftplusLamTensor.value_type` {#ExponentialWithSoftplusLamTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.GammaTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.GammaTensor.md deleted file mode 100644 index a6a8a6d88ab..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.GammaTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`GammaTensor` is a `StochasticTensor` backed by the distribution `Gamma`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#GammaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.clone(name=None, **dist_args)` {#GammaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.distribution` {#GammaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.dtype` {#GammaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.entropy(name='entropy')` {#GammaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.graph` {#GammaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.input_dict` {#GammaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.loss(final_loss, name='Loss')` {#GammaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.mean(name='mean')` {#GammaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.name` {#GammaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.value(name='value')` {#GammaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.GammaTensor.value_type` {#GammaTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.md deleted file mode 100644 index 03f39cd501a..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`InverseGammaWithSoftplusAlphaBetaTensor` is a `StochasticTensor` backed by the distribution `InverseGammaWithSoftplusAlphaBeta`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#InverseGammaWithSoftplusAlphaBetaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.clone(name=None, **dist_args)` {#InverseGammaWithSoftplusAlphaBetaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.distribution` {#InverseGammaWithSoftplusAlphaBetaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.dtype` {#InverseGammaWithSoftplusAlphaBetaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.entropy(name='entropy')` {#InverseGammaWithSoftplusAlphaBetaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.graph` {#InverseGammaWithSoftplusAlphaBetaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.input_dict` {#InverseGammaWithSoftplusAlphaBetaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.loss(final_loss, name='Loss')` {#InverseGammaWithSoftplusAlphaBetaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.mean(name='mean')` {#InverseGammaWithSoftplusAlphaBetaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.name` {#InverseGammaWithSoftplusAlphaBetaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.value(name='value')` {#InverseGammaWithSoftplusAlphaBetaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.InverseGammaWithSoftplusAlphaBetaTensor.value_type` {#InverseGammaWithSoftplusAlphaBetaTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.md deleted file mode 100644 index 7ee10de96a0..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`MultivariateNormalFullTensor` is a `StochasticTensor` backed by the distribution `MultivariateNormalFull`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MultivariateNormalFullTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.clone(name=None, **dist_args)` {#MultivariateNormalFullTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.distribution` {#MultivariateNormalFullTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.dtype` {#MultivariateNormalFullTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.entropy(name='entropy')` {#MultivariateNormalFullTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.graph` {#MultivariateNormalFullTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.input_dict` {#MultivariateNormalFullTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.loss(final_loss, name='Loss')` {#MultivariateNormalFullTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.mean(name='mean')` {#MultivariateNormalFullTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.name` {#MultivariateNormalFullTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.value(name='value')` {#MultivariateNormalFullTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultivariateNormalFullTensor.value_type` {#MultivariateNormalFullTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.NormalTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.NormalTensor.md deleted file mode 100644 index 7140c36d319..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.NormalTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`NormalTensor` is a `StochasticTensor` backed by the distribution `Normal`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#NormalTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.clone(name=None, **dist_args)` {#NormalTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.distribution` {#NormalTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.dtype` {#NormalTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.entropy(name='entropy')` {#NormalTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.graph` {#NormalTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.input_dict` {#NormalTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.loss(final_loss, name='Loss')` {#NormalTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.mean(name='mean')` {#NormalTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.name` {#NormalTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.value(name='value')` {#NormalTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.NormalTensor.value_type` {#NormalTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.md deleted file mode 100644 index 30b3c95e02a..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`StudentTTensor` is a `StochasticTensor` backed by the distribution `StudentT`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#StudentTTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.clone(name=None, **dist_args)` {#StudentTTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.distribution` {#StudentTTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.dtype` {#StudentTTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.entropy(name='entropy')` {#StudentTTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.graph` {#StudentTTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.input_dict` {#StudentTTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.loss(final_loss, name='Loss')` {#StudentTTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.mean(name='mean')` {#StudentTTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.name` {#StudentTTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.value(name='value')` {#StudentTTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTTensor.value_type` {#StudentTTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.md deleted file mode 100644 index 8bdef9250e0..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`beta_bbTensor` is a `StochasticTensor` backed by the distribution `beta_bb`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#beta_bbTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.clone(name=None, **dist_args)` {#beta_bbTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.distribution` {#beta_bbTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.dtype` {#beta_bbTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.entropy(name='entropy')` {#beta_bbTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.graph` {#beta_bbTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.input_dict` {#beta_bbTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.loss(final_loss, name='Loss')` {#beta_bbTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.mean(name='mean')` {#beta_bbTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.name` {#beta_bbTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.value(name='value')` {#beta_bbTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.beta_bbTensor.value_type` {#beta_bbTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.fake_quant_with_min_max_args.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.fake_quant_with_min_max_args.md new file mode 100644 index 00000000000..fcad8cb5001 --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard6/tf.fake_quant_with_min_max_args.md @@ -0,0 +1,22 @@ +### `tf.fake_quant_with_min_max_args(inputs, min=None, max=None, name=None)` {#fake_quant_with_min_max_args} + +Fake-quantize the 'inputs' tensor, type float to 'outputs' tensor of same type. + +Attributes [min; max] define the clamping range for the 'inputs' data. Op +divides this range into 255 steps (total of 256 values), then replaces each +'inputs' value with the closest of the quantized step values. + +Quantization is called fake since the output is still in floating point. + +##### Args: + + +* `inputs`: A `Tensor` of type `float32`. +* `min`: An optional `float`. Defaults to `-6`. +* `max`: An optional `float`. Defaults to `6`. +* `name`: A name for the operation (optional). + +##### Returns: + + A `Tensor` of type `float32`. + diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.assert_variables_initialized.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.assert_variables_initialized.md index ef61848aa87..ac8604579de 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.assert_variables_initialized.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.assert_variables_initialized.md @@ -16,7 +16,7 @@ logged by the C++ runtime. This is expected. * `var_list`: List of `Variable` objects to check. 
Defaults to the - value of `all_variables().` + value of `global_variables().` ##### Returns: diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.md deleted file mode 100644 index 68ff0573cfd..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`StudentTWithAbsDfSoftplusSigmaTensor` is a `StochasticTensor` backed by the distribution `StudentTWithAbsDfSoftplusSigma`. -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#StudentTWithAbsDfSoftplusSigmaTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.clone(name=None, **dist_args)` {#StudentTWithAbsDfSoftplusSigmaTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.distribution` {#StudentTWithAbsDfSoftplusSigmaTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.dtype` {#StudentTWithAbsDfSoftplusSigmaTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.entropy(name='entropy')` {#StudentTWithAbsDfSoftplusSigmaTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.graph` {#StudentTWithAbsDfSoftplusSigmaTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.input_dict` {#StudentTWithAbsDfSoftplusSigmaTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.loss(final_loss, name='Loss')` {#StudentTWithAbsDfSoftplusSigmaTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.mean(name='mean')` {#StudentTWithAbsDfSoftplusSigmaTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.name` {#StudentTWithAbsDfSoftplusSigmaTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.value(name='value')` {#StudentTWithAbsDfSoftplusSigmaTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.StudentTWithAbsDfSoftplusSigmaTensor.value_type` {#StudentTWithAbsDfSoftplusSigmaTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.scatter_nd_update.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.scatter_nd_update.md new file mode 100644 index 00000000000..ab1e83ae145 --- /dev/null +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.scatter_nd_update.md @@ -0,0 +1,51 @@ +### `tf.scatter_nd_update(ref, indices, updates, use_locking=None, name=None)` {#scatter_nd_update} + +Applies sparse `updates` to individual values or slices within a given variable according to `indices`. + +`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`. + +`indices` must be integer tensor, containing indices into `ref`. 
+It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.
+
+The innermost dimension of `indices` (with length `K`) corresponds to
+indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th
+dimension of `ref`.
+
+`updates` is a `Tensor` of rank `Q-1+P-K` with shape:
+
+```
+[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]].
+```
+
+For example, say we want to update 4 scattered elements of a rank-1 tensor with 8 elements. In Python, that update would look like this:
+
+    ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8])
+    indices = tf.constant([[4], [3], [1], [7]])
+    updates = tf.constant([9, 10, 11, 12])
+    update = tf.scatter_nd_update(ref, indices, updates)
+    with tf.Session() as sess:
+        print(sess.run(update))
+
+The resulting update to ref would look like this:
+
+    [1, 11, 3, 10, 9, 6, 7, 12]
+
+See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices.
+
+##### Args:
+
+
+* `ref`: A mutable `Tensor`. Should be from a `Variable` node.
+* `indices`: A `Tensor`. Must be one of the following types: `int32`, `int64`.
+  A tensor of indices into `ref`.
+* `updates`: A `Tensor`. Must have the same type as `ref`.
+  A tensor of updated values to store in `ref`.
+* `use_locking`: An optional `bool`. Defaults to `True`.
+  If `True`, the assignment will be protected by a lock; otherwise the
+  behavior is undefined, but may exhibit less contention.
+* `name`: A name for the operation (optional).
+
+##### Returns:
+
+  A mutable `Tensor`. Has the same type as `ref`.
+  Same as `ref`. Returned as a convenience for operations that want to use the updated values after the update is done.
+
diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.train.export_meta_graph.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.train.export_meta_graph.md
index fcd666bac0a..dd318197593 100644
--- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.train.export_meta_graph.md
+++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard7/tf.train.export_meta_graph.md
@@ -1,4 +1,4 @@
-### `tf.train.export_meta_graph(filename=None, meta_info_def=None, graph_def=None, saver_def=None, collection_list=None, as_text=False, graph=None, export_scope=None, **kwargs)` {#export_meta_graph}
+### `tf.train.export_meta_graph(filename=None, meta_info_def=None, graph_def=None, saver_def=None, collection_list=None, as_text=False, graph=None, export_scope=None, clear_devices=False, **kwargs)` {#export_meta_graph}
 
 Returns `MetaGraphDef` proto. Optionally writes it to filename.
 
@@ -22,6 +22,8 @@ a subgraph.
   the subgraph. The scope name will be striped from the node definitions
   for easy import later into new name scopes. If `None`, the whole graph
   is exported. graph_def and export_scope cannot both be specified.
+* `clear_devices`: Whether or not to clear the device field for an `Operation`
+  or `Tensor` during export.
 * `**kwargs`: Optional keyed arguments.
 
 ##### Returns:
diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.GraphKeys.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.GraphKeys.md
index 1d656f40180..965097f2b00 100644
--- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.GraphKeys.md
+++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.GraphKeys.md
@@ -9,10 +9,18 @@ variables.
 The following standard keys are defined:
 
-* `VARIABLES`: the `Variable` objects that comprise a model, and
-  must be saved and restored together. See
-  [`tf.all_variables()`](../../api_docs/python/state_ops.md#all_variables)
+* `GLOBAL_VARIABLES`: the default collection of `Variable` objects, shared
+  across a distributed environment (model variables are a subset of these). See
+  [`tf.global_variables()`](../../api_docs/python/state_ops.md#global_variables)
   for more details.
+  Commonly, all `TRAINABLE_VARIABLES` variables will be in `MODEL_VARIABLES`,
+  and all `MODEL_VARIABLES` variables will be in `GLOBAL_VARIABLES`.
+* `LOCAL_VARIABLES`: the subset of `Variable` objects that are local to each
+  machine. Usually used for temporary variables, like counters.
+  Note: use `tf.contrib.framework.local_variable` to add to this collection.
+* `MODEL_VARIABLES`: the subset of `Variable` objects that are used in the
+  model for inference (feed forward). Note: use
+  `tf.contrib.framework.model_variable` to add to this collection.
 * `TRAINABLE_VARIABLES`: the subset of `Variable` objects that will
   be trained by an optimizer. See
   [`tf.trainable_variables()`](../../api_docs/python/state_ops.md#trainable_variables)
diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.Variable.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.Variable.md
index 44fac742c80..777d56be50d 100644
--- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.Variable.md
+++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.Variable.md
@@ -51,16 +51,16 @@ with tf.Session() as sess:
 ```
 
 The most common initialization pattern is to use the convenience function
-`initialize_all_variables()` to add an Op to the graph that initializes
+`global_variables_initializer()` to add an Op to the graph that initializes
 all the variables. You then run that Op after launching the graph.
 
 ```python
-# Add an Op to initialize all variables.
-init_op = tf.initialize_all_variables()
+# Add an Op to initialize global variables.
+init_op = tf.global_variables_initializer()
 
 # Launch the graph in a session.
 with tf.Session() as sess:
-  # Run the Op that initializes all variables.
+  # Run the Op that initializes global variables.
   sess.run(init_op)
   # ...you can now run any Op that uses variable values...
 ```
@@ -71,8 +71,8 @@ variables are initialized in the right order.
 
 All variables are automatically collected in the graph where they are
 created. By default, the constructor adds the new variable to the graph
-collection `GraphKeys.VARIABLES`. The convenience function
-`all_variables()` returns the contents of that collection.
+collection `GraphKeys.GLOBAL_VARIABLES`. The convenience function
+`global_variables()` returns the contents of that collection.
 
 When building a machine learning model it is often convenient to distinguish
 between variables holding the trainable model parameters and other variables
@@ -94,7 +94,7 @@ Creating a variable.
 
 Creates a new variable with value `initial_value`.
 The new variable is added to the graph collections listed in `collections`,
-which defaults to `[GraphKeys.VARIABLES]`.
+which defaults to `[GraphKeys.GLOBAL_VARIABLES]`.
 
 If `trainable` is `True` the variable is also added to the graph collection
 `GraphKeys.TRAINABLE_VARIABLES`.
@@ -115,7 +115,7 @@ variable to its initial value.
     collection `GraphKeys.TRAINABLE_VARIABLES`. This collection is used as
     the default list of variables to use by the `Optimizer` classes.
 * `collections`: List of graph collections keys. The new variable is added to
-    these collections. Defaults to `[GraphKeys.VARIABLES]`.
+    these collections. Defaults to `[GraphKeys.GLOBAL_VARIABLES]`.
 * `validate_shape`: If `False`, allows the variable to be initialized with a
     value of unknown shape. If `True`, the default, the shape of
     `initial_value` must be known.
@@ -301,7 +301,7 @@ more information on launching a graph and on sessions.
 
 ```python
 v = tf.Variable([1, 2])
-init = tf.initialize_all_variables()
+init = tf.global_variables_initializer()
 
 with tf.Session() as sess:
     sess.run(init)
diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.md
deleted file mode 100644
index 8386eea649e..00000000000
--- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.md
+++ /dev/null
@@ -1,85 +0,0 @@
-`ExponentialTensor` is a `StochasticTensor` backed by the distribution `Exponential`.
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#ExponentialTensor.__init__}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.clone(name=None, **dist_args)` {#ExponentialTensor.clone}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.distribution` {#ExponentialTensor.distribution}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.dtype` {#ExponentialTensor.dtype}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.entropy(name='entropy')` {#ExponentialTensor.entropy}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.graph` {#ExponentialTensor.graph}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.input_dict` {#ExponentialTensor.input_dict}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.loss(final_loss, name='Loss')` {#ExponentialTensor.loss}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.mean(name='mean')` {#ExponentialTensor.mean}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.name` {#ExponentialTensor.name}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.value(name='value')` {#ExponentialTensor.value}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.ExponentialTensor.value_type` {#ExponentialTensor.value_type}
-
-
-
-
diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.md
deleted file mode 100644
index 2f00dfa7d30..00000000000
--- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.md
+++ /dev/null
@@ -1,85 +0,0 @@
-`MultinomialTensor` is a `StochasticTensor` backed by the distribution `Multinomial`.
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#MultinomialTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.clone(name=None, **dist_args)` {#MultinomialTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.distribution` {#MultinomialTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.dtype` {#MultinomialTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.entropy(name='entropy')` {#MultinomialTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.graph` {#MultinomialTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.input_dict` {#MultinomialTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.loss(final_loss, name='Loss')` {#MultinomialTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.mean(name='mean')` {#MultinomialTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.name` {#MultinomialTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.value(name='value')` {#MultinomialTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.MultinomialTensor.value_type` {#MultinomialTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.md deleted file mode 100644 index f35b05859c1..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`QuantizedDistributionTensor` is a `StochasticTensor` backed by the distribution `QuantizedDistribution`. 
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#QuantizedDistributionTensor.__init__}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.clone(name=None, **dist_args)` {#QuantizedDistributionTensor.clone}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.distribution` {#QuantizedDistributionTensor.distribution}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.dtype` {#QuantizedDistributionTensor.dtype}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.entropy(name='entropy')` {#QuantizedDistributionTensor.entropy}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.graph` {#QuantizedDistributionTensor.graph}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.input_dict` {#QuantizedDistributionTensor.input_dict}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.loss(final_loss, name='Loss')` {#QuantizedDistributionTensor.loss}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.mean(name='mean')` {#QuantizedDistributionTensor.mean}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.name` {#QuantizedDistributionTensor.name}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.value(name='value')` {#QuantizedDistributionTensor.value}
-
-
-
-
-- - -
-
-#### `tf.contrib.bayesflow.stochastic_tensor.QuantizedDistributionTensor.value_type` {#QuantizedDistributionTensor.value_type}
-
-
-
-
diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.python_io.TFRecordOptions.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.python_io.TFRecordOptions.md
new file mode 100644
index 00000000000..3c05efe8343
--- /dev/null
+++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.python_io.TFRecordOptions.md
@@ -0,0 +1,15 @@
+Options used for manipulating TFRecord files.
+- - -
+
+#### `tf.python_io.TFRecordOptions.__init__(compression_type)` {#TFRecordOptions.__init__}
+
+
+
+
+- - -
+
+#### `tf.python_io.TFRecordOptions.get_compression_type_string(cls, options)` {#TFRecordOptions.get_compression_type_string}
+
+
+
+
diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.scatter_nd_mul.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.scatter_nd_mul.md
new file mode 100644
index 00000000000..734dfa8d1b7
--- /dev/null
+++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard8/tf.scatter_nd_mul.md
@@ -0,0 +1,52 @@
+### `tf.scatter_nd_mul(ref, indices, updates, use_locking=None, name=None)` {#scatter_nd_mul}
+
+Applies sparse multiplication between `updates` and individual values or slices within a given variable according to `indices`.
+
+`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`.
+
+`indices` must be an integer tensor, containing indices into `ref`.
+It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`.
+
+The innermost dimension of `indices` (with length `K`) corresponds to
+indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th
+dimension of `ref`.
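+
+As an illustrative shape check (an editorial example, not part of the
+generated op documentation):
+
+    # ref.shape     = [4, 4]   => P = 2
+    # indices.shape = [2, 1]   => Q = 2, K = 1
+    # K < P, so each row of `indices` selects a row slice of shape [4],
+    # and `updates` must have shape [2, 4] (see the formula below).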
+
+`updates` is a `Tensor` of rank `Q-1+P-K` with shape:
+
+```
+[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]].
+```
+
+For example, say we want to multiply 4 scattered elements of a rank-1 tensor with 8 elements. In Python, that multiplication would look like this:
+
+    ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8])
+    indices = tf.constant([[4], [3], [1], [7]])
+    updates = tf.constant([9, 10, 11, 12])
+    mul = tf.scatter_nd_mul(ref, indices, updates)
+    with tf.Session() as sess:
+        print(sess.run(mul))
+
+The resulting update to ref would look like this:
+
+    [1, 22, 3, 40, 45, 6, 7, 96]
+
+See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices.
+
+##### Args:
+
+
+* `ref`: A mutable `Tensor`. Must be one of the following types: `float32`, `float64`, `int64`, `int32`, `uint8`, `uint16`, `int16`, `int8`, `complex64`, `complex128`, `qint8`, `quint8`, `qint32`, `half`.
+  Should be from a `Variable` node.
+* `indices`: A `Tensor`. Must be one of the following types: `int32`, `int64`.
+  A tensor of indices into `ref`.
+* `updates`: A `Tensor`. Must have the same type as `ref`.
+  A tensor of updated values to multiply with `ref`.
+* `use_locking`: An optional `bool`. Defaults to `False`.
+  If `True`, the assignment will be protected by a lock; otherwise the
+  behavior is undefined, but may exhibit less contention.
+* `name`: A name for the operation (optional).
+
+##### Returns:
+
+  A mutable `Tensor`. Has the same type as `ref`.
+  Same as `ref`. Returned as a convenience for operations that want to use the updated values after the update is done.
+
diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.md
deleted file mode 100644
index 328f8e79833..00000000000
--- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.md
+++ /dev/null
@@ -1,85 +0,0 @@
-`BernoulliTensor` is a `StochasticTensor` backed by the distribution `Bernoulli`.
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#BernoulliTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.clone(name=None, **dist_args)` {#BernoulliTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.distribution` {#BernoulliTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.dtype` {#BernoulliTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.entropy(name='entropy')` {#BernoulliTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.graph` {#BernoulliTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.input_dict` {#BernoulliTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.loss(final_loss, name='Loss')` {#BernoulliTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.mean(name='mean')` {#BernoulliTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.name` {#BernoulliTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.value(name='value')` {#BernoulliTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.BernoulliTensor.value_type` {#BernoulliTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.md deleted file mode 100644 index 2e1217b686f..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`CategoricalTensor` is a `StochasticTensor` backed by the distribution `Categorical`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#CategoricalTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.clone(name=None, **dist_args)` {#CategoricalTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.distribution` {#CategoricalTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.dtype` {#CategoricalTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.entropy(name='entropy')` {#CategoricalTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.graph` {#CategoricalTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.input_dict` {#CategoricalTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.loss(final_loss, name='Loss')` {#CategoricalTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.mean(name='mean')` {#CategoricalTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.name` {#CategoricalTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.value(name='value')` {#CategoricalTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.CategoricalTensor.value_type` {#CategoricalTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.md deleted file mode 100644 index bec5b175269..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`Chi2WithAbsDfTensor` is a `StochasticTensor` backed by the distribution `Chi2WithAbsDf`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#Chi2WithAbsDfTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.clone(name=None, **dist_args)` {#Chi2WithAbsDfTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.distribution` {#Chi2WithAbsDfTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.dtype` {#Chi2WithAbsDfTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.entropy(name='entropy')` {#Chi2WithAbsDfTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.graph` {#Chi2WithAbsDfTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.input_dict` {#Chi2WithAbsDfTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.loss(final_loss, name='Loss')` {#Chi2WithAbsDfTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.mean(name='mean')` {#Chi2WithAbsDfTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.name` {#Chi2WithAbsDfTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.value(name='value')` {#Chi2WithAbsDfTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.Chi2WithAbsDfTensor.value_type` {#Chi2WithAbsDfTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.md deleted file mode 100644 index 0d6792f7538..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`DirichletTensor` is a `StochasticTensor` backed by the distribution `Dirichlet`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#DirichletTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.clone(name=None, **dist_args)` {#DirichletTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.distribution` {#DirichletTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.dtype` {#DirichletTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.entropy(name='entropy')` {#DirichletTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.graph` {#DirichletTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.input_dict` {#DirichletTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.loss(final_loss, name='Loss')` {#DirichletTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.mean(name='mean')` {#DirichletTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.name` {#DirichletTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.value(name='value')` {#DirichletTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.DirichletTensor.value_type` {#DirichletTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.UniformTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.UniformTensor.md deleted file mode 100644 index a09a7ea3ae6..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.UniformTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`UniformTensor` is a `StochasticTensor` backed by the distribution `Uniform`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#UniformTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.clone(name=None, **dist_args)` {#UniformTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.distribution` {#UniformTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.dtype` {#UniformTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.entropy(name='entropy')` {#UniformTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.graph` {#UniformTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.input_dict` {#UniformTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.loss(final_loss, name='Loss')` {#UniformTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.mean(name='mean')` {#UniformTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.name` {#UniformTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.value(name='value')` {#UniformTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.UniformTensor.value_type` {#UniformTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.md deleted file mode 100644 index 2284a252691..00000000000 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.md +++ /dev/null @@ -1,85 +0,0 @@ -`WishartCholeskyTensor` is a `StochasticTensor` backed by the distribution `WishartCholesky`. 
-- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.__init__(name=None, dist_value_type=None, loss_fn=score_function, **dist_args)` {#WishartCholeskyTensor.__init__} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.clone(name=None, **dist_args)` {#WishartCholeskyTensor.clone} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.distribution` {#WishartCholeskyTensor.distribution} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.dtype` {#WishartCholeskyTensor.dtype} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.entropy(name='entropy')` {#WishartCholeskyTensor.entropy} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.graph` {#WishartCholeskyTensor.graph} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.input_dict` {#WishartCholeskyTensor.input_dict} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.loss(final_loss, name='Loss')` {#WishartCholeskyTensor.loss} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.mean(name='mean')` {#WishartCholeskyTensor.mean} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.name` {#WishartCholeskyTensor.name} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.value(name='value')` {#WishartCholeskyTensor.value} - - - - -- - - - -#### `tf.contrib.bayesflow.stochastic_tensor.WishartCholeskyTensor.value_type` {#WishartCholeskyTensor.value_type} - - - - diff --git a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.nn.raw_rnn.md b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.nn.raw_rnn.md index 9d892d1ecb6..8c0d9bd027b 100644 --- a/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.nn.raw_rnn.md +++ b/tensorflow/g3doc/api_docs/python/functions_and_classes/shard9/tf.nn.raw_rnn.md @@ -29,8 +29,8 @@ while not all(finished): time=time + 1, cell_output=output, cell_state=cell_state, loop_state=loop_state) # Emit zeros and copy forward state for minibatch entries that are finished. - state = tf.select(finished, state, next_state) - emit = tf.select(finished, tf.zeros_like(emit), emit) + state = tf.where(finished, state, next_state) + emit = tf.where(finished, tf.zeros_like(emit), emit) emit_ta = emit_ta.write(time, emit) # If any new minibatch entries are marked as finished, mark these. 
finished = tf.logical_or(finished, next_finished) diff --git a/tensorflow/g3doc/api_docs/python/index.md b/tensorflow/g3doc/api_docs/python/index.md index 3f5c7f83413..3e5f2807658 100644 --- a/tensorflow/g3doc/api_docs/python/index.md +++ b/tensorflow/g3doc/api_docs/python/index.md @@ -85,6 +85,8 @@ * [`get_checkpoint_state`](../../api_docs/python/state_ops.md#get_checkpoint_state) * [`get_variable`](../../api_docs/python/state_ops.md#get_variable) * [`get_variable_scope`](../../api_docs/python/state_ops.md#get_variable_scope) + * [`global_variables`](../../api_docs/python/state_ops.md#global_variables) + * [`global_variables_initializer`](../../api_docs/python/state_ops.md#global_variables_initializer) * [`import_meta_graph`](../../api_docs/python/state_ops.md#import_meta_graph) * [`IndexedSlices`](../../api_docs/python/state_ops.md#IndexedSlices) * [`initialize_all_tables`](../../api_docs/python/state_ops.md#initialize_all_tables) @@ -94,6 +96,7 @@ * [`is_variable_initialized`](../../api_docs/python/state_ops.md#is_variable_initialized) * [`latest_checkpoint`](../../api_docs/python/state_ops.md#latest_checkpoint) * [`local_variables`](../../api_docs/python/state_ops.md#local_variables) + * [`local_variables_initializer`](../../api_docs/python/state_ops.md#local_variables_initializer) * [`make_template`](../../api_docs/python/state_ops.md#make_template) * [`min_max_variable_partitioner`](../../api_docs/python/state_ops.md#min_max_variable_partitioner) * [`model_variables`](../../api_docs/python/state_ops.md#model_variables) @@ -107,6 +110,11 @@ * [`scatter_add`](../../api_docs/python/state_ops.md#scatter_add) * [`scatter_div`](../../api_docs/python/state_ops.md#scatter_div) * [`scatter_mul`](../../api_docs/python/state_ops.md#scatter_mul) + * [`scatter_nd_add`](../../api_docs/python/state_ops.md#scatter_nd_add) + * [`scatter_nd_div`](../../api_docs/python/state_ops.md#scatter_nd_div) + * [`scatter_nd_mul`](../../api_docs/python/state_ops.md#scatter_nd_mul) + * [`scatter_nd_sub`](../../api_docs/python/state_ops.md#scatter_nd_sub) + * [`scatter_nd_update`](../../api_docs/python/state_ops.md#scatter_nd_update) * [`scatter_sub`](../../api_docs/python/state_ops.md#scatter_sub) * [`scatter_update`](../../api_docs/python/state_ops.md#scatter_update) * [`sparse_mask`](../../api_docs/python/state_ops.md#sparse_mask) @@ -118,6 +126,7 @@ * [`variable_axis_size_partitioner`](../../api_docs/python/state_ops.md#variable_axis_size_partitioner) * [`variable_op_scope`](../../api_docs/python/state_ops.md#variable_op_scope) * [`variable_scope`](../../api_docs/python/state_ops.md#variable_scope) + * [`variables_initializer`](../../api_docs/python/state_ops.md#variables_initializer) * [`VariableScope`](../../api_docs/python/state_ops.md#VariableScope) * [`zeros_initializer`](../../api_docs/python/state_ops.md#zeros_initializer) @@ -134,6 +143,12 @@ * [`dynamic_stitch`](../../api_docs/python/array_ops.md#dynamic_stitch) * [`expand_dims`](../../api_docs/python/array_ops.md#expand_dims) * [`extract_image_patches`](../../api_docs/python/array_ops.md#extract_image_patches) + * [`fake_quant_with_min_max_args`](../../api_docs/python/array_ops.md#fake_quant_with_min_max_args) + * [`fake_quant_with_min_max_args_gradient`](../../api_docs/python/array_ops.md#fake_quant_with_min_max_args_gradient) + * [`fake_quant_with_min_max_vars`](../../api_docs/python/array_ops.md#fake_quant_with_min_max_vars) + * [`fake_quant_with_min_max_vars_gradient`](../../api_docs/python/array_ops.md#fake_quant_with_min_max_vars_gradient) + * 
[`fake_quant_with_min_max_vars_per_channel`](../../api_docs/python/array_ops.md#fake_quant_with_min_max_vars_per_channel) + * [`fake_quant_with_min_max_vars_per_channel_gradient`](../../api_docs/python/array_ops.md#fake_quant_with_min_max_vars_per_channel_gradient) * [`gather`](../../api_docs/python/array_ops.md#gather) * [`gather_nd`](../../api_docs/python/array_ops.md#gather_nd) * [`meshgrid`](../../api_docs/python/array_ops.md#meshgrid) @@ -148,6 +163,7 @@ * [`reverse`](../../api_docs/python/array_ops.md#reverse) * [`reverse_sequence`](../../api_docs/python/array_ops.md#reverse_sequence) * [`saturate_cast`](../../api_docs/python/array_ops.md#saturate_cast) + * [`scatter_nd`](../../api_docs/python/array_ops.md#scatter_nd) * [`sequence_mask`](../../api_docs/python/array_ops.md#sequence_mask) * [`setdiff1d`](../../api_docs/python/array_ops.md#setdiff1d) * [`shape`](../../api_docs/python/array_ops.md#shape) @@ -454,6 +470,8 @@ * **[Data IO (Python functions)](../../api_docs/python/python_io.md)**: * [`tf_record_iterator`](../../api_docs/python/python_io.md#tf_record_iterator) + * [`TFRecordCompressionType`](../../api_docs/python/python_io.md#TFRecordCompressionType) + * [`TFRecordOptions`](../../api_docs/python/python_io.md#TFRecordOptions) * [`TFRecordWriter`](../../api_docs/python/python_io.md#TFRecordWriter) * **[Neural Network](../../api_docs/python/nn.md)**: @@ -678,50 +696,13 @@ * **[BayesFlow Stochastic Tensors (contrib)](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md)**: * [`BaseStochasticTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#BaseStochasticTensor) - * [`BernoulliTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#BernoulliTensor) - * [`BernoulliWithSigmoidPTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#BernoulliWithSigmoidPTensor) - * [`beta_aaTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#beta_aaTensor) - * [`beta_bbTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#beta_bbTensor) - * [`BetaTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#BetaTensor) - * [`BetaWithSoftplusABTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#BetaWithSoftplusABTensor) - * [`BinomialTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#BinomialTensor) - * [`CategoricalTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#CategoricalTensor) - * [`Chi2Tensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#Chi2Tensor) - * [`Chi2WithAbsDfTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#Chi2WithAbsDfTensor) - * [`DirichletMultinomialTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#DirichletMultinomialTensor) - * [`DirichletTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#DirichletTensor) - * [`ExponentialTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#ExponentialTensor) - * [`ExponentialWithSoftplusLamTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#ExponentialWithSoftplusLamTensor) - * [`GammaTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#GammaTensor) - * [`GammaWithSoftplusAlphaBetaTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#GammaWithSoftplusAlphaBetaTensor) * [`get_current_value_type`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#get_current_value_type) - * 
[`InverseGammaTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#InverseGammaTensor) - * [`InverseGammaWithSoftplusAlphaBetaTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#InverseGammaWithSoftplusAlphaBetaTensor) - * [`LaplaceTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#LaplaceTensor) - * [`LaplaceWithSoftplusScaleTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#LaplaceWithSoftplusScaleTensor) * [`MeanValue`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#MeanValue) - * [`MixtureTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#MixtureTensor) - * [`MultinomialTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#MultinomialTensor) - * [`MultivariateNormalCholeskyTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#MultivariateNormalCholeskyTensor) - * [`MultivariateNormalDiagPlusVDVTTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#MultivariateNormalDiagPlusVDVTTensor) - * [`MultivariateNormalDiagTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#MultivariateNormalDiagTensor) - * [`MultivariateNormalDiagWithSoftplusStDevTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#MultivariateNormalDiagWithSoftplusStDevTensor) - * [`MultivariateNormalFullTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#MultivariateNormalFullTensor) - * [`NormalTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#NormalTensor) - * [`NormalWithSoftplusSigmaTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#NormalWithSoftplusSigmaTensor) * [`ObservedStochasticTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#ObservedStochasticTensor) - * [`PoissonTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#PoissonTensor) - * [`QuantizedDistributionTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#QuantizedDistributionTensor) * [`SampleAndReshapeValue`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#SampleAndReshapeValue) * [`SampleValue`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#SampleValue) * [`StochasticTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#StochasticTensor) - * [`StudentTTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#StudentTTensor) - * [`StudentTWithAbsDfSoftplusSigmaTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#StudentTWithAbsDfSoftplusSigmaTensor) - * [`TransformedDistributionTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#TransformedDistributionTensor) - * [`UniformTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#UniformTensor) * [`value_type`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#value_type) - * [`WishartCholeskyTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#WishartCholeskyTensor) - * [`WishartFullTensor`](../../api_docs/python/contrib.bayesflow.stochastic_tensor.md#WishartFullTensor) * **[BayesFlow Variational Inference (contrib)](../../api_docs/python/contrib.bayesflow.variational_inference.md)**: * [`elbo`](../../api_docs/python/contrib.bayesflow.variational_inference.md#elbo) @@ -911,6 +892,9 @@ * [`Transformer`](../../api_docs/python/contrib.graph_editor.md#Transformer) * [`ts`](../../api_docs/python/contrib.graph_editor.md#ts) +* **[Integrate 
(contrib)](../../api_docs/python/contrib.integrate.md)**: + * [`odeint`](../../api_docs/python/contrib.integrate.md#odeint) + * **[Layers (contrib)](../../api_docs/python/contrib.layers.md)**: * [`apply_regularization`](../../api_docs/python/contrib.layers.md#apply_regularization) * [`avg_pool2d`](../../api_docs/python/contrib.layers.md#avg_pool2d) diff --git a/tensorflow/g3doc/api_docs/python/math_ops.md b/tensorflow/g3doc/api_docs/python/math_ops.md index 71e6b9a26f7..bc40bfa4043 100644 --- a/tensorflow/g3doc/api_docs/python/math_ops.md +++ b/tensorflow/g3doc/api_docs/python/math_ops.md @@ -1832,7 +1832,7 @@ Computes the eigenvalues of one or more self-adjoint matrices. - - - -### `tf.svd(tensor, compute_uv=True, full_matrices=False, name=None)` {#svd} +### `tf.svd(tensor, full_matrices=False, compute_uv=True, name=None)` {#svd} Computes the singular value decompositions of one or more matrices. @@ -1854,12 +1854,12 @@ s = svd(a, compute_uv=False) * `matrix`: `Tensor` of shape `[..., M, N]`. Let `P` be the minimum of `M` and `N`. -* `compute_uv`: If `True` then left and right singular vectors will be - computed and returned in `u` and `v`, respectively. Otherwise, only the - singular values will be computed, which can be significantly faster. * `full_matrices`: If true, compute full-sized `u` and `v`. If false (the default), compute only the leading `P` singular vectors. Ignored if `compute_uv` is `False`. +* `compute_uv`: If `True` then left and right singular vectors will be + computed and returned in `u` and `v`, respectively. Otherwise, only the + singular values will be computed, which can be significantly faster. * `name`: string, optional name of the operation. ##### Returns: diff --git a/tensorflow/g3doc/api_docs/python/nn.md b/tensorflow/g3doc/api_docs/python/nn.md index eaf42b9de5b..dde5c9c3752 100644 --- a/tensorflow/g3doc/api_docs/python/nn.md +++ b/tensorflow/g3doc/api_docs/python/nn.md @@ -2418,8 +2418,8 @@ while not all(finished): time=time + 1, cell_output=output, cell_state=cell_state, loop_state=loop_state) # Emit zeros and copy forward state for minibatch entries that are finished. - state = tf.select(finished, state, next_state) - emit = tf.select(finished, tf.zeros_like(emit), emit) + state = tf.where(finished, state, next_state) + emit = tf.where(finished, tf.zeros_like(emit), emit) emit_ta = emit_ta.write(time, emit) # If any new minibatch entries are marked as finished, mark these. finished = tf.logical_or(finished, next_finished) diff --git a/tensorflow/g3doc/api_docs/python/python_io.md b/tensorflow/g3doc/api_docs/python/python_io.md index f8cc23caf0d..d9dd38bcd60 100644 --- a/tensorflow/g3doc/api_docs/python/python_io.md +++ b/tensorflow/g3doc/api_docs/python/python_io.md @@ -94,6 +94,32 @@ An iterator that reads the records from a TFRecords file. * `IOError`: If `path` cannot be opened for reading. +- - - + +### `class tf.python_io.TFRecordCompressionType` {#TFRecordCompressionType} + +The type of compression for the record. + +- - - + +### `class tf.python_io.TFRecordOptions` {#TFRecordOptions} + +Options used for manipulating TFRecord files.
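To make the relationship between these two classes concrete, here is a minimal usage sketch (the file path and record payloads are placeholders, and it is assumed that passing the same `options` to `tf_record_iterator` selects the matching decompression):

```python
import tensorflow as tf

# Write a GZIP-compressed TFRecords file.
options = tf.python_io.TFRecordOptions(
    tf.python_io.TFRecordCompressionType.GZIP)
writer = tf.python_io.TFRecordWriter("/tmp/example.tfrecords", options=options)
writer.write(b"first record")
writer.write(b"second record")
writer.close()

# Read the records back using the same compression options.
for record in tf.python_io.tf_record_iterator("/tmp/example.tfrecords",
                                              options=options):
    print(record)
```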
+- - - + +#### `tf.python_io.TFRecordOptions.__init__(compression_type)` {#TFRecordOptions.__init__} + + + + +- - - + +#### `tf.python_io.TFRecordOptions.get_compression_type_string(cls, options)` {#TFRecordOptions.get_compression_type_string} + + + + + - - - diff --git a/tensorflow/g3doc/api_docs/python/sparse_ops.md b/tensorflow/g3doc/api_docs/python/sparse_ops.md index f3f241672df..51968de26f7 100644 --- a/tensorflow/g3doc/api_docs/python/sparse_ops.md +++ b/tensorflow/g3doc/api_docs/python/sparse_ops.md @@ -93,6 +93,17 @@ Creates a `SparseTensor`. A `SparseTensor` +- - - + +#### `tf.SparseTensor.get_shape()` {#SparseTensor.get_shape} + +Get the `TensorShape` that represents the shape of the dense tensor. + +##### Returns: + + A `TensorShape` object. + + - - - #### `tf.SparseTensor.indices` {#SparseTensor.indices} @@ -1368,8 +1379,8 @@ Assumes the two SparseTensors have the same shape, i.e., no broadcasting. Example: ```python -sp_zero = ops.SparseTensor([[0]], [0], [7]) -sp_one = ops.SparseTensor([[1]], [1], [7]) +sp_zero = sparse_tensor.SparseTensor([[0]], [0], [7]) +sp_one = sparse_tensor.SparseTensor([[1]], [1], [7]) res = tf.sparse_maximum(sp_zero, sp_one).eval() # "res" should be equal to SparseTensor([[0], [1]], [0, 1], [7]). ``` @@ -1399,8 +1410,8 @@ Assumes the two SparseTensors have the same shape, i.e., no broadcasting. Example: ```python -sp_zero = ops.SparseTensor([[0]], [0], [7]) -sp_one = ops.SparseTensor([[1]], [1], [7]) +sp_zero = sparse_tensor.SparseTensor([[0]], [0], [7]) +sp_one = sparse_tensor.SparseTensor([[1]], [1], [7]) res = tf.sparse_minimum(sp_zero, sp_one).eval() # "res" should be equal to SparseTensor([[0], [1]], [0, 0], [7]). ``` diff --git a/tensorflow/g3doc/api_docs/python/state_ops.md b/tensorflow/g3doc/api_docs/python/state_ops.md index 0b5e396aa2d..29765e7c2f6 100644 --- a/tensorflow/g3doc/api_docs/python/state_ops.md +++ b/tensorflow/g3doc/api_docs/python/state_ops.md @@ -66,16 +66,16 @@ with tf.Session() as sess: ``` The most common initialization pattern is to use the convenience function -`initialize_all_variables()` to add an Op to the graph that initializes +`global_variables_initializer()` to add an Op to the graph that initializes all the variables. You then run that Op after launching the graph. ```python -# Add an Op to initialize all variables. -init_op = tf.initialize_all_variables() +# Add an Op to initialize global variables. +init_op = tf.global_variables_initializer() # Launch the graph in a session. with tf.Session() as sess: - # Run the Op that initializes all variables. + # Run the Op that initializes global variables. sess.run(init_op) # ...you can now run any Op that uses variable values... ``` @@ -86,8 +86,8 @@ variables are initialized in the right order. All variables are automatically collected in the graph where they are created. By default, the constructor adds the new variable to the graph -collection `GraphKeys.VARIABLES`. The convenience function -`all_variables()` returns the contents of that collection. +collection `GraphKeys.GLOBAL_VARIABLES`. The convenience function +`global_variables()` returns the contents of that collection. When building a machine learning model it is often convenient to distinguish between variables holding the trainable model parameters and other variables @@ -109,7 +109,7 @@ Creating a variable. Creates a new variable with value `initial_value`. The new variable is added to the graph collections listed in `collections`, -which defaults to `[GraphKeys.VARIABLES]`.
+which defaults to `[GraphKeys.GLOBAL_VARIABLES]`. If `trainable` is `True` the variable is also added to the graph collection `GraphKeys.TRAINABLE_VARIABLES`. @@ -130,7 +130,7 @@ variable to its initial value. collection `GraphKeys.TRAINABLE_VARIABLES`. This collection is used as the default list of variables to use by the `Optimizer` classes. * `collections`: List of graph collections keys. The new variable is added to - these collections. Defaults to `[GraphKeys.VARIABLES]`. + these collections. Defaults to `[GraphKeys.GLOBAL_VARIABLES]`. * `validate_shape`: If `False`, allows the variable to be initialized with a value of unknown shape. If `True`, the default, the shape of `initial_value` must be known. @@ -316,7 +316,7 @@ more information on launching a graph and on sessions. ```python v = tf.Variable([1, 2]) -init = tf.initialize_all_variables() +init = tf.global_variables_initializer() with tf.Session() as sess: sess.run(init) @@ -1178,19 +1178,57 @@ collected in the graph. - - - -### `tf.all_variables()` {#all_variables} +### `tf.global_variables()` {#global_variables} -Returns all variables that must be saved/restored. +Returns global variables. -The `Variable()` constructor automatically adds new variables to the graph -collection `GraphKeys.VARIABLES`. This convenience function returns the -contents of that collection. +Global variables are variables that are shared across machines in a +distributed environment. The `Variable()` constructor or `get_variable()` +automatically adds new variables to the graph collection +`GraphKeys.GLOBAL_VARIABLES`. +This convenience function returns the contents of that collection. + +An alternative to global variables is local variables. See +[`tf.local_variables()`](../../api_docs/python/state_ops.md#local_variables) ##### Returns: A list of `Variable` objects. +- - - + +### `tf.local_variables()` {#local_variables} + +Returns local variables. + +Local variables are per-process variables, usually not saved or restored to +checkpoint, and used for temporary or intermediate values. +For example, they can be used as counters for metrics computation or +the number of epochs this machine has read data. +The `local_variable()` function automatically adds a new variable to +`GraphKeys.LOCAL_VARIABLES`. +This convenience function returns the contents of that collection. + +An alternative to local variables is global variables. See +[`tf.global_variables()`](../../api_docs/python/state_ops.md#global_variables) + +##### Returns: + + A list of local `Variable` objects. + + +- - - + +### `tf.model_variables()` {#model_variables} + +Returns all variables in the MODEL_VARIABLES collection. + +##### Returns: + + A list of `Variable` objects. + + - - - ### `tf.trainable_variables()` {#trainable_variables} @@ -1207,28 +1245,6 @@ contents of that collection. A list of Variable objects. -- - - - -### `tf.local_variables()` {#local_variables} - -Returns all variables created with collection=[LOCAL_VARIABLES]. - -##### Returns: - - A list of local Variable objects. - - -- - - - -### `tf.model_variables()` {#model_variables} - -Returns all variables in the MODEL_VARIABLES collection. - -##### Returns: - - A list of local Variable objects. - - - - - ### `tf.moving_average_variables()` {#moving_average_variables} @@ -1248,20 +1264,33 @@ This convenience function returns the contents of that collection.
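To make the split between the two collections concrete, here is a minimal sketch (the variable names are illustrative) of where variables land by default and how the initializer shortcuts documented below are applied:

```python
import tensorflow as tf

# By default, a new variable joins the GLOBAL_VARIABLES collection.
global_var = tf.Variable(0, name="global_counter")

# Passing an explicit collections list keeps a variable out of the
# global collection; here it only joins LOCAL_VARIABLES.
local_var = tf.Variable(0, name="local_counter",
                        collections=[tf.GraphKeys.LOCAL_VARIABLES])

print([v.op.name for v in tf.global_variables()])  # ==> ['global_counter']
print([v.op.name for v in tf.local_variables()])   # ==> ['local_counter']

with tf.Session() as sess:
    # Each collection has its own convenience initializer.
    sess.run(tf.global_variables_initializer())
    sess.run(tf.local_variables_initializer())
```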
- - - -### `tf.initialize_all_variables()` {#initialize_all_variables} +### `tf.global_variables_initializer()` {#global_variables_initializer} -Returns an Op that initializes all variables. +Returns an Op that initializes global variables. -This is just a shortcut for `initialize_variables(all_variables())` +This is just a shortcut for `variables_initializer(global_variables())` ##### Returns: - An Op that initializes all variables in the graph. + An Op that initializes global variables in the graph. - - - -### `tf.initialize_variables(var_list, name='init')` {#initialize_variables} +### `tf.local_variables_initializer()` {#local_variables_initializer} + +Returns an Op that initializes all local variables. + +This is just a shortcut for `variables_initializer(local_variables())` + +##### Returns: + + An Op that initializes all local variables in the graph. + + +- - - + +### `tf.variables_initializer(var_list, name='init')` {#variables_initializer} Returns an Op that initializes a list of variables. @@ -1286,19 +1315,6 @@ be run. That Op just has no effect. An Op that runs the initializers of all the specified variables. -- - - - -### `tf.initialize_local_variables()` {#initialize_local_variables} - -Returns an Op that initializes all local variables. - -This is just a shortcut for `initialize_variables(local_variables())` - -##### Returns: - - An Op that initializes all local variables in the graph. - - - - - ### `tf.is_variable_initialized(variable)` {#is_variable_initialized} @@ -1329,7 +1345,7 @@ variables if there are any, or an empty array if there are none. * `var_list`: List of `Variable` objects to check. Defaults to the - value of `all_variables() + local_variables()` + value of `global_variables() + local_variables()` * `name`: Optional name of the `Operation`. ##### Returns: @@ -1358,7 +1374,7 @@ logged by the C++ runtime. This is expected. * `var_list`: List of `Variable` objects to check. Defaults to the - value of `all_variables().` + value of `global_variables().` ##### Returns: @@ -1765,7 +1781,7 @@ Builds saver_def. - - - -#### `tf.train.Saver.export_meta_graph(filename=None, collection_list=None, as_text=False, export_scope=None)` {#Saver.export_meta_graph} +#### `tf.train.Saver.export_meta_graph(filename=None, collection_list=None, as_text=False, export_scope=None, clear_devices=False)` {#Saver.export_meta_graph} Writes `MetaGraphDef` to save_path/filename. @@ -1776,6 +1792,8 @@ Writes `MetaGraphDef` to save_path/filename. * `collection_list`: List of string keys to collect. * `as_text`: If `True`, writes the meta_graph as an ASCII proto. * `export_scope`: Optional `string`. Name scope to remove. +* `clear_devices`: Whether or not to clear the device field for an `Operation` + or `Tensor` during export. ##### Returns: @@ -2940,6 +2958,280 @@ Requires `updates.shape = indices.shape + ref.shape[1:]`. to use the updated values after the update is done. +- - - + +### `tf.scatter_nd_update(ref, indices, updates, use_locking=None, name=None)` {#scatter_nd_update} + +Applies sparse `updates` to individual values or slices within a given variable according to `indices`. + +`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`. + +`indices` must be an integer tensor, containing indices into `ref`. +It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`. + +The innermost dimension of `indices` (with length `K`) corresponds to +indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th +dimension of `ref`.
+ +`updates` is a `Tensor` of rank `Q-1+P-K` with shape: + +``` +[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]]. +``` + +For example, say we want to update 4 scattered elements of a rank-1 tensor with 8 elements. In Python, that update would look like this: + + ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8]) + indices = tf.constant([[4], [3], [1], [7]]) + updates = tf.constant([9, 10, 11, 12]) + update = tf.scatter_nd_update(ref, indices, updates) + with tf.Session() as sess: + print sess.run(update) + +The resulting update to ref would look like this: + + [1, 11, 3, 10, 9, 6, 7, 12] + +See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices. + +##### Args: + + +* `ref`: A mutable `Tensor`. Should be from a Variable node. +* `indices`: A `Tensor`. Must be one of the following types: `int32`, `int64`. + A tensor of indices into `ref`. +* `updates`: A `Tensor`. Must have the same type as `ref`. + A tensor of updated values to store in `ref`. +* `use_locking`: An optional `bool`. Defaults to `True`. + If `True`, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention. +* `name`: A name for the operation (optional). + +##### Returns: + + A mutable `Tensor`. Has the same type as `ref`. + Returned as a convenience for operations that want to use the updated values after the update is done. + + +- - - + +### `tf.scatter_nd_add(ref, indices, updates, use_locking=None, name=None)` {#scatter_nd_add} + +Applies sparse addition between `updates` and individual values or slices within a given variable according to `indices`. + +`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`. + +`indices` must be an integer tensor, containing indices into `ref`. +It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`. + +The innermost dimension of `indices` (with length `K`) corresponds to +indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th +dimension of `ref`. + +`updates` is a `Tensor` of rank `Q-1+P-K` with shape: + +``` +[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]]. +``` + +For example, say we want to add 4 scattered elements to a rank-1 tensor with 8 elements. In Python, that addition would look like this: + + ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8]) + indices = tf.constant([[4], [3], [1], [7]]) + updates = tf.constant([9, 10, 11, 12]) + add = tf.scatter_nd_add(ref, indices, updates) + with tf.Session() as sess: + print sess.run(add) + +The resulting update to ref would look like this: + + [1, 13, 3, 14, 14, 6, 7, 20] + +See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices. + +##### Args: + + +* `ref`: A mutable `Tensor`. Must be one of the following types: `float32`, `float64`, `int64`, `int32`, `uint8`, `uint16`, `int16`, `int8`, `complex64`, `complex128`, `qint8`, `quint8`, `qint32`, `half`. + Should be from a Variable node. +* `indices`: A `Tensor`. Must be one of the following types: `int32`, `int64`. + A tensor of indices into `ref`. +* `updates`: A `Tensor`. Must have the same type as `ref`. + A tensor of updated values to add to `ref`. +* `use_locking`: An optional `bool`. Defaults to `False`.
If `True`, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention. +* `name`: A name for the operation (optional). + +##### Returns: + + A mutable `Tensor`. Has the same type as `ref`. + Returned as a convenience for operations that want to use the updated values after the update is done. + + +- - - + +### `tf.scatter_nd_sub(ref, indices, updates, use_locking=None, name=None)` {#scatter_nd_sub} + +Applies sparse subtraction between `updates` and individual values or slices within a given variable according to `indices`. + +`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`. + +`indices` must be an integer tensor, containing indices into `ref`. +It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`. + +The innermost dimension of `indices` (with length `K`) corresponds to +indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th +dimension of `ref`. + +`updates` is a `Tensor` of rank `Q-1+P-K` with shape: + +``` +[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]]. +``` + +For example, say we want to subtract 4 scattered elements from a rank-1 tensor with 8 elements. In Python, that subtraction would look like this: + + ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8]) + indices = tf.constant([[4], [3], [1], [7]]) + updates = tf.constant([9, 10, 11, 12]) + sub = tf.scatter_nd_sub(ref, indices, updates) + with tf.Session() as sess: + print sess.run(sub) + +The resulting update to ref would look like this: + + [1, -9, 3, -6, -4, 6, 7, -4] + +See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices. + +##### Args: + + +* `ref`: A mutable `Tensor`. Must be one of the following types: `float32`, `float64`, `int64`, `int32`, `uint8`, `uint16`, `int16`, `int8`, `complex64`, `complex128`, `qint8`, `quint8`, `qint32`, `half`. + Should be from a Variable node. +* `indices`: A `Tensor`. Must be one of the following types: `int32`, `int64`. + A tensor of indices into `ref`. +* `updates`: A `Tensor`. Must have the same type as `ref`. + A tensor of updated values to subtract from `ref`. +* `use_locking`: An optional `bool`. Defaults to `False`. + If `True`, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention. +* `name`: A name for the operation (optional). + +##### Returns: + + A mutable `Tensor`. Has the same type as `ref`. + Returned as a convenience for operations that want to use the updated values after the update is done. + + +- - - + +### `tf.scatter_nd_mul(ref, indices, updates, use_locking=None, name=None)` {#scatter_nd_mul} + +Applies sparse multiplication between `updates` and individual values or slices within a given variable according to `indices`. + +`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`. + +`indices` must be an integer tensor, containing indices into `ref`. +It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`. + +The innermost dimension of `indices` (with length `K`) corresponds to +indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th +dimension of `ref`. + +`updates` is a `Tensor` of rank `Q-1+P-K` with shape: + +``` +[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]]. +``` + +For example, say we want to multiply 4 scattered elements of a rank-1 tensor with 8 elements.
In Python, that multiplication would look like this: + + ref = tf.Variable([1, 2, 3, 4, 5, 6, 7, 8]) + indices = tf.constant([[4], [3], [1], [7]]) + updates = tf.constant([9, 10, 11, 12]) + mul = tf.scatter_nd_mul(ref, indices, updates) + with tf.Session() as sess: + print sess.run(mul) + +The resulting update to ref would look like this: + + [1, 22, 3, 40, 45, 6, 7, 96] + +See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices. + +##### Args: + + +* `ref`: A mutable `Tensor`. Must be one of the following types: `float32`, `float64`, `int64`, `int32`, `uint8`, `uint16`, `int16`, `int8`, `complex64`, `complex128`, `qint8`, `quint8`, `qint32`, `half`. + Should be from a Variable node. +* `indices`: A `Tensor`. Must be one of the following types: `int32`, `int64`. + A tensor of indices into `ref`. +* `updates`: A `Tensor`. Must have the same type as `ref`. + A tensor of updated values to multiply with `ref`. +* `use_locking`: An optional `bool`. Defaults to `False`. + If `True`, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention. +* `name`: A name for the operation (optional). + +##### Returns: + + A mutable `Tensor`. Has the same type as `ref`. + Returned as a convenience for operations that want to use the updated values after the update is done. + + +- - - + +### `tf.scatter_nd_div(ref, indices, updates, use_locking=None, name=None)` {#scatter_nd_div} + +Applies sparse division between `updates` and individual values or slices within a given variable according to `indices`. + +`ref` is a `Tensor` with rank `P` and `indices` is a `Tensor` of rank `Q`. + +`indices` must be an integer tensor, containing indices into `ref`. +It must have shape `[d_0, ..., d_{Q-2}, K]` where `0 < K <= P`. + +The innermost dimension of `indices` (with length `K`) corresponds to +indices into elements (if `K = P`) or slices (if `K < P`) along the `K`th +dimension of `ref`. + +`updates` is a `Tensor` of rank `Q-1+P-K` with shape: + +``` +[d_0, ..., d_{Q-2}, ref.shape[K], ..., ref.shape[P-1]]. +``` + +For example, say we want to divide a rank-1 tensor with 8 elements by 4 scattered elements. In Python, that division would look like this: + + ref = tf.Variable([10, 20, 30, 40, 50, 60, 70, 80]) + indices = tf.constant([[4], [3], [1], [7]]) + updates = tf.constant([2, 3, 4, 5]) + div = tf.scatter_nd_div(ref, indices, updates) + with tf.Session() as sess: + print sess.run(div) + +The resulting update to ref would look like this: + + [10, 5, 30, 13, 25, 60, 70, 16] + +See [tf.scatter_nd](#scatter_nd) for more details about how to make updates to slices. + +##### Args: + + +* `ref`: A mutable `Tensor`. Must be one of the following types: `float32`, `float64`, `int64`, `int32`, `uint8`, `uint16`, `int16`, `int8`, `complex64`, `complex128`, `qint8`, `quint8`, `qint32`, `half`. + Should be from a Variable node. +* `indices`: A `Tensor`. Must be one of the following types: `int32`, `int64`. + A tensor of indices into `ref`. +* `updates`: A `Tensor`. Must have the same type as `ref`. + A tensor of updated values to divide `ref` by. +* `use_locking`: An optional `bool`. Defaults to `False`.
If `True`, the assignment will be protected by a lock; otherwise the behavior is undefined, but may exhibit less contention. +* `name`: A name for the operation (optional). + +##### Returns: + + A mutable `Tensor`. Has the same type as `ref`. + Returned as a convenience for operations that want to use the updated values after the update is done. + + - - - ### `tf.sparse_mask(a, mask_indices, name=None)` {#sparse_mask} @@ -3120,7 +3412,7 @@ Returns an Op that initializes all tables of the default graph. - - - -### `tf.train.export_meta_graph(filename=None, meta_info_def=None, graph_def=None, saver_def=None, collection_list=None, as_text=False, graph=None, export_scope=None, **kwargs)` {#export_meta_graph} +### `tf.train.export_meta_graph(filename=None, meta_info_def=None, graph_def=None, saver_def=None, collection_list=None, as_text=False, graph=None, export_scope=None, clear_devices=False, **kwargs)` {#export_meta_graph} Returns `MetaGraphDef` proto. Optionally writes it to filename. @@ -3144,6 +3436,8 @@ a subgraph. the subgraph. The scope name will be stripped from the node definitions for easy import later into new name scopes. If `None`, the whole graph is exported. graph_def and export_scope cannot both be specified. +* `clear_devices`: Whether or not to clear the device field for an `Operation` + or `Tensor` during export. * `**kwargs`: Optional keyed arguments. ##### Returns: @@ -3229,3 +3523,50 @@ device assignments have not changed. (i.e., there are no variables to restore). + +# Deprecated functions (removed after 2017-03-02). Please don't use them. + +- - - + +### `tf.all_variables(*args, **kwargs)` {#all_variables} + +See `tf.global_variables`. (deprecated) + +THIS FUNCTION IS DEPRECATED. It will be removed after 2017-03-02. +Instructions for updating: +Please use tf.global_variables instead. + + +- - - + +### `tf.initialize_all_variables(*args, **kwargs)` {#initialize_all_variables} + +See `tf.global_variables_initializer`. (deprecated) + +THIS FUNCTION IS DEPRECATED. It will be removed after 2017-03-02. +Instructions for updating: +Use `tf.global_variables_initializer` instead. + + +- - - + +### `tf.initialize_local_variables(*args, **kwargs)` {#initialize_local_variables} + +See `tf.local_variables_initializer`. (deprecated) + +THIS FUNCTION IS DEPRECATED. It will be removed after 2017-03-02. +Instructions for updating: +Use `tf.local_variables_initializer` instead. + + +- - - + +### `tf.initialize_variables(*args, **kwargs)` {#initialize_variables} + +See `tf.variables_initializer`. (deprecated) + +THIS FUNCTION IS DEPRECATED. It will be removed after 2017-03-02. +Instructions for updating: +Use `tf.variables_initializer` instead. + + diff --git a/tensorflow/g3doc/get_started/basic_usage.md b/tensorflow/g3doc/get_started/basic_usage.md index 1603df9335f..b6d0222ab54 100644 --- a/tensorflow/g3doc/get_started/basic_usage.md +++ b/tensorflow/g3doc/get_started/basic_usage.md @@ -99,7 +99,7 @@ sess = tf.Session() # The call 'run(product)' thus causes the execution of three ops in the # graph: the two constants and matmul. # -# The output of the op is returned in 'result' as a numpy `ndarray` object. +# The output of the matmul is returned in 'result' as a numpy `ndarray` object.
result = sess.run(product) print(result) # ==> [[ 12.]] diff --git a/tensorflow/g3doc/get_started/os_setup.md b/tensorflow/g3doc/get_started/os_setup.md index 04861edcf74..1535f094c5d 100644 --- a/tensorflow/g3doc/get_started/os_setup.md +++ b/tensorflow/g3doc/get_started/os_setup.md @@ -7,7 +7,7 @@ github source. The TensorFlow Python API supports Python 2.7 and Python 3.3+. -The GPU version works best with Cuda Toolkit 7.5 and +The GPU version works best with Cuda Toolkit 8.0 and cuDNN v5. Other versions are supported (Cuda toolkit >= 7.0 and cuDNN >= v3) only when installing from sources. Please see [Cuda installation](#optional-install-cuda-gpus-on-linux) for @@ -63,37 +63,37 @@ Then, select the correct binary to install: ```bash # Ubuntu/Linux 64-bit, CPU only, Python 2.7 -$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc1-cp27-none-linux_x86_64.whl +$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc2-cp27-none-linux_x86_64.whl # Ubuntu/Linux 64-bit, GPU enabled, Python 2.7 -# Requires CUDA toolkit 7.5 and CuDNN v5. For other versions, see "Installing from sources" below. -$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc1-cp27-none-linux_x86_64.whl +# Requires CUDA toolkit 8.0 and CuDNN v5. For other versions, see "Installing from sources" below. +$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc2-cp27-none-linux_x86_64.whl # Mac OS X, CPU only, Python 2.7: -$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/cpu/tensorflow-0.11.0rc1-py2-none-any.whl +$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/cpu/tensorflow-0.11.0rc2-py2-none-any.whl # Mac OS X, GPU enabled, Python 2.7: -$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/gpu/tensorflow-0.11.0rc1-py2-none-any.whl +$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/gpu/tensorflow-0.11.0rc2-py2-none-any.whl # Ubuntu/Linux 64-bit, CPU only, Python 3.4 -$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc1-cp34-cp34m-linux_x86_64.whl +$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc2-cp34-cp34m-linux_x86_64.whl # Ubuntu/Linux 64-bit, GPU enabled, Python 3.4 -# Requires CUDA toolkit 7.5 and CuDNN v5. For other versions, see "Installing from sources" below. -$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc1-cp34-cp34m-linux_x86_64.whl +# Requires CUDA toolkit 8.0 and CuDNN v5. For other versions, see "Installing from sources" below. +$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc2-cp34-cp34m-linux_x86_64.whl # Ubuntu/Linux 64-bit, CPU only, Python 3.5 -$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc1-cp35-cp35m-linux_x86_64.whl +$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc2-cp35-cp35m-linux_x86_64.whl # Ubuntu/Linux 64-bit, GPU enabled, Python 3.5 -# Requires CUDA toolkit 7.5 and CuDNN v5. For other versions, see "Installing from sources" below. -$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc1-cp35-cp35m-linux_x86_64.whl +# Requires CUDA toolkit 8.0 and CuDNN v5. For other versions, see "Installing from sources" below. 
+$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc2-cp35-cp35m-linux_x86_64.whl # Mac OS X, CPU only, Python 3.4 or 3.5: -$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/cpu/tensorflow-0.11.0rc1-py3-none-any.whl +$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/cpu/tensorflow-0.11.0rc2-py3-none-any.whl # Mac OS X, GPU enabled, Python 3.4 or 3.5: -$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/gpu/tensorflow-0.11.0rc1-py3-none-any.whl +$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/gpu/tensorflow-0.11.0rc2-py3-none-any.whl ``` Install TensorFlow: @@ -159,37 +159,37 @@ Now, install TensorFlow just as you would for a regular Pip installation. First ```bash # Ubuntu/Linux 64-bit, CPU only, Python 2.7 -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc1-cp27-none-linux_x86_64.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc2-cp27-none-linux_x86_64.whl # Ubuntu/Linux 64-bit, GPU enabled, Python 2.7 -# Requires CUDA toolkit 7.5 and CuDNN v5. For other versions, see "Installing from sources" below. -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc1-cp27-none-linux_x86_64.whl +# Requires CUDA toolkit 8.0 and CuDNN v5. For other versions, see "Installing from sources" below. +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc2-cp27-none-linux_x86_64.whl # Mac OS X, CPU only, Python 2.7: -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/cpu/tensorflow-0.11.0rc1-py2-none-any.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/cpu/tensorflow-0.11.0rc2-py2-none-any.whl # Mac OS X, GPU enabled, Python 2.7: -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/gpu/tensorflow-0.11.0rc1-py2-none-any.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/gpu/tensorflow-0.11.0rc2-py2-none-any.whl # Ubuntu/Linux 64-bit, CPU only, Python 3.4 -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc1-cp34-cp34m-linux_x86_64.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc2-cp34-cp34m-linux_x86_64.whl # Ubuntu/Linux 64-bit, GPU enabled, Python 3.4 -# Requires CUDA toolkit 7.5 and CuDNN v5. For other versions, see "Installing from sources" below. -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc1-cp34-cp34m-linux_x86_64.whl +# Requires CUDA toolkit 8.0 and CuDNN v5. For other versions, see "Installing from sources" below. +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc2-cp34-cp34m-linux_x86_64.whl # Ubuntu/Linux 64-bit, CPU only, Python 3.5 -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc1-cp35-cp35m-linux_x86_64.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc2-cp35-cp35m-linux_x86_64.whl # Ubuntu/Linux 64-bit, GPU enabled, Python 3.5 -# Requires CUDA toolkit 7.5 and CuDNN v5. For other versions, see "Installing from sources" below. 
-(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc1-cp35-cp35m-linux_x86_64.whl +# Requires CUDA toolkit 8.0 and CuDNN v5. For other versions, see "Installing from sources" below. +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc2-cp35-cp35m-linux_x86_64.whl # Mac OS X, CPU only, Python 3.4 or 3.5: -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/cpu/tensorflow-0.11.0rc1-py3-none-any.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/cpu/tensorflow-0.11.0rc2-py3-none-any.whl # Mac OS X, GPU enabled, Python 3.4 or 3.5: -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/gpu/tensorflow-0.11.0rc1-py3-none-any.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/gpu/tensorflow-0.11.0rc2-py3-none-any.whl ``` Finally install TensorFlow: @@ -298,37 +298,37 @@ select the correct binary to install: ```bash # Ubuntu/Linux 64-bit, CPU only, Python 2.7 -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc1-cp27-none-linux_x86_64.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc2-cp27-none-linux_x86_64.whl # Ubuntu/Linux 64-bit, GPU enabled, Python 2.7 -# Requires CUDA toolkit 7.5 and CuDNN v5. For other versions, see "Installing from sources" below. -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc1-cp27-none-linux_x86_64.whl +# Requires CUDA toolkit 8.0 and CuDNN v5. For other versions, see "Installing from sources" below. +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc2-cp27-none-linux_x86_64.whl # Mac OS X, CPU only, Python 2.7: -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/cpu/tensorflow-0.11.0rc1-py2-none-any.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/cpu/tensorflow-0.11.0rc2-py2-none-any.whl # Mac OS X, GPU enabled, Python 2.7: -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/gpu/tensorflow-0.11.0rc1-py2-none-any.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/gpu/tensorflow-0.11.0rc2-py2-none-any.whl # Ubuntu/Linux 64-bit, CPU only, Python 3.4 -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc1-cp34-cp34m-linux_x86_64.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc2-cp34-cp34m-linux_x86_64.whl # Ubuntu/Linux 64-bit, GPU enabled, Python 3.4 -# Requires CUDA toolkit 7.5 and CuDNN v5. For other versions, see "Installing from sources" below. -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc1-cp34-cp34m-linux_x86_64.whl +# Requires CUDA toolkit 8.0 and CuDNN v5. For other versions, see "Installing from sources" below. 
+(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc2-cp34-cp34m-linux_x86_64.whl # Ubuntu/Linux 64-bit, CPU only, Python 3.5 -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc1-cp35-cp35m-linux_x86_64.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/cpu/tensorflow-0.11.0rc2-cp35-cp35m-linux_x86_64.whl # Ubuntu/Linux 64-bit, GPU enabled, Python 3.5 -# Requires CUDA toolkit 7.5 and CuDNN v5. For other versions, see "Installing from sources" below. -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc1-cp35-cp35m-linux_x86_64.whl +# Requires CUDA toolkit 8.0 and CuDNN v5. For other versions, see "Installing from sources" below. +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/linux/gpu/tensorflow-0.11.0rc2-cp35-cp35m-linux_x86_64.whl # Mac OS X, CPU only, Python 3.4 or 3.5: -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/cpu/tensorflow-0.11.0rc1-py3-none-any.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/cpu/tensorflow-0.11.0rc2-py3-none-any.whl # Mac OS X, GPU enabled, Python 3.4 or 3.5: -(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/gpu/tensorflow-0.11.0rc1-py3-none-any.whl +(tensorflow)$ export TF_BINARY_URL=https://storage.googleapis.com/tensorflow/mac/gpu/tensorflow-0.11.0rc2-py3-none-any.whl ``` Finally install TensorFlow: @@ -396,7 +396,7 @@ code. code. We also have tags with `latest` replaced by a released version (e.g., -`0.11.0rc1-gpu`). +`0.11.0rc2-gpu`). With Docker the installation is as follows: @@ -454,7 +454,7 @@ the Docker container. ### (Optional, Linux) Enable GPU Support If you installed the GPU version of TensorFlow, you must also install the Cuda -Toolkit 7.5 and cuDNN v5. Please see [Cuda +Toolkit 8.0 and cuDNN v5. Please see [Cuda installation](#optional-install-cuda-gpus-on-linux). You also need to set the `LD_LIBRARY_PATH` and `CUDA_HOME` environment @@ -548,7 +548,7 @@ r0.8 and earlier to fetch the protobuf library that TensorFlow depends on. #### Install Bazel -Follow instructions [here](http://bazel.io/docs/install.html) to install the +Follow instructions [here](http://bazel.build/docs/install.html) to install the dependencies for bazel. Then download the latest stable bazel version using the [installer for your system](https://github.com/bazelbuild/bazel/releases) and run the installer as mentioned there: @@ -594,7 +594,7 @@ https://developer.nvidia.com/cuda-gpus https://developer.nvidia.com/cuda-downloads -Install version 7.5 if using our binary releases. +Install version 8.0 if using our binary releases. Install the toolkit into e.g. `/usr/local/cuda` @@ -609,9 +609,9 @@ toolkit is installed in `/usr/local/cuda`, run the following commands (edited to reflect the cuDNN version you downloaded): ``` bash -tar xvzf cudnn-7.5-linux-x64-v5.1-ga.tgz -sudo cp cuda/include/cudnn.h /usr/local/cuda/include -sudo cp cuda/lib64/libcudnn* /usr/local/cuda/lib64 +tar xvzf cudnn-8.0-linux-x64-v5.1-ga.tgz +sudo cp -P cuda/include/cudnn.h /usr/local/cuda/include +sudo cp -P cuda/lib64/libcudnn* /usr/local/cuda/lib64 sudo chmod a+r /usr/local/cuda/include/cudnn.h /usr/local/cuda/lib64/libcudnn* ``` @@ -622,7 +622,7 @@ and installing python dependencies using easy_install or pip. 
#### Dependencies -Follow instructions [here](http://bazel.io/docs/install.html) to install the +Follow instructions [here](http://bazel.build/docs/install.html) to install the dependencies for bazel. You can then use homebrew to install bazel: ```bash @@ -682,9 +682,9 @@ Once you have it downloaded locally, you can unzip and move the header and libraries to your local CUDA Toolkit folder: ```bash -$ sudo mv include/cudnn.h /Developer/NVIDIA/CUDA-7.5/include/ -$ sudo mv lib/libcudnn* /Developer/NVIDIA/CUDA-7.5/lib -$ sudo ln -s /Developer/NVIDIA/CUDA-7.5/lib/libcudnn* /usr/local/cuda/lib/ +$ sudo mv include/cudnn.h /Developer/NVIDIA/CUDA-8.0/include/ +$ sudo mv lib/libcudnn* /Developer/NVIDIA/CUDA-8.0/lib +$ sudo ln -s /Developer/NVIDIA/CUDA-8.0/lib/libcudnn* /usr/local/cuda/lib/ ``` To verify the CUDA installation, you can build and run deviceQuery to make sure @@ -698,8 +698,9 @@ $ popd $ ~/cuda-samples/bin/x86_64/darwin/release/deviceQuery ``` -If you want to compile tensorflow and have the XCode 7.3 installed, note that -Xcode 7.3 is not yet compatible with CUDA 7.5. You will need to download Xcode +If you want to compile TensorFlow and have Xcode 7.3 and CUDA 7.5 installed, note that +Xcode 7.3 is not yet compatible with CUDA 7.5. You can either upgrade to CUDA +8.0, or you will need to download Xcode 7.2 and select it as your default: ```bash @@ -730,8 +731,8 @@ No Google Cloud Platform support will be enabled for TensorFlow Do you wish to build TensorFlow with GPU support? [y/N] y GPU support will be enabled for TensorFlow Please specify which gcc nvcc should use as the host compiler. [Default is /usr/bin/gcc]: -Please specify the Cuda SDK version you want to use, e.g. 7.0. [Leave empty to use system default]: 7.5 -Please specify the location where CUDA 7.5 toolkit is installed. Refer to README.md for more details. [Default is /usr/local/cuda]: +Please specify the Cuda SDK version you want to use, e.g. 7.0. [Leave empty to use system default]: 8.0 +Please specify the location where CUDA 8.0 toolkit is installed. Refer to README.md for more details. [Default is /usr/local/cuda]: Please specify the cuDNN version you want to use. [Leave empty to use system default]: 5 Please specify the location where cuDNN 5 library is installed. Refer to README.md for more details. [Default is /usr/local/cuda]: Please specify a list of comma-separated Cuda compute capabilities you want to build with. @@ -780,7 +781,7 @@ $ bazel build -c opt --config=cuda //tensorflow/tools/pip_package:build_pip_pack $ bazel-bin/tensorflow/tools/pip_package/build_pip_package /tmp/tensorflow_pkg # The name of the .whl file will depend on your platform. -$ sudo pip install /tmp/tensorflow_pkg/tensorflow-0.11.0rc1-py2-none-any.whl +$ sudo pip install /tmp/tensorflow_pkg/tensorflow-0.11.0rc2-py2-none-any.whl ``` ## Setting up TensorFlow for Development diff --git a/tensorflow/g3doc/how_tos/documentation/index.md b/tensorflow/g3doc/how_tos/documentation/index.md index cebd4115d01..1ccaba32f51 100755 --- a/tensorflow/g3doc/how_tos/documentation/index.md +++ b/tensorflow/g3doc/how_tos/documentation/index.md @@ -233,7 +233,7 @@ def foo(x, y, name="bar"): Given two 1-D tensors `x` and `y`, this operation computes the foo.
- For example: + Example: ``` # x is [1, 1] diff --git a/tensorflow/g3doc/tutorials/wide_and_deep/index.md b/tensorflow/g3doc/tutorials/wide_and_deep/index.md index 760e4bacfdb..c92cdc18edf 100644 --- a/tensorflow/g3doc/tutorials/wide_and_deep/index.md +++ b/tensorflow/g3doc/tutorials/wide_and_deep/index.md @@ -111,7 +111,7 @@ columns: ```python wide_columns = [ - gender, native_country, education, occupation, workclass, marital_status, relationship, age_buckets, + gender, native_country, education, occupation, workclass, relationship, age_buckets, tf.contrib.layers.crossed_column([education, occupation], hash_bucket_size=int(1e4)), tf.contrib.layers.crossed_column([native_country, occupation], hash_bucket_size=int(1e4)), tf.contrib.layers.crossed_column([age_buckets, education, occupation], hash_bucket_size=int(1e6))] diff --git a/tensorflow/models/image/cifar10/cifar10.py b/tensorflow/models/image/cifar10/cifar10.py index fb3a42cbb13..7df2149d40d 100644 --- a/tensorflow/models/image/cifar10/cifar10.py +++ b/tensorflow/models/image/cifar10/cifar10.py @@ -256,7 +256,10 @@ def inference(images): local4 = tf.nn.relu(tf.matmul(local3, weights) + biases, name=scope.name) _activation_summary(local4) - # softmax, i.e. softmax(WX + b) + # linear layer (WX + b). + # We don't apply softmax here because + # tf.nn.sparse_softmax_cross_entropy_with_logits accepts the unscaled logits + # and performs the softmax internally for efficiency. with tf.variable_scope('softmax_linear') as scope: weights = _variable_with_weight_decay('weights', [192, NUM_CLASSES], stddev=1/192.0, wd=0.0) diff --git a/tensorflow/python/BUILD b/tensorflow/python/BUILD index da875c081a7..4dc1bcec172 100644 --- a/tensorflow/python/BUILD +++ b/tensorflow/python/BUILD @@ -41,6 +41,7 @@ py_library( ":summary", ":training", ":ops", + ":test_ops", "//tensorflow/python/debug:debug_py", ] + if_not_windows([ "//tensorflow/contrib:contrib_py", @@ -205,6 +206,24 @@ py_test( ], ) +py_test( + name = "decorator_utils_test", + srcs = ["util/decorator_utils_test.py"], + srcs_version = "PY2AND3", + deps = [ + "//tensorflow:tensorflow_py", + ], +) + +py_test( + name = "deprecation_test", + srcs = ["util/deprecation_test.py"], + srcs_version = "PY2AND3", + deps = [ + "//tensorflow:tensorflow_py", + ], +) + cc_library( name = "python_op_gen", srcs = ["framework/python_op_gen.cc"], @@ -263,6 +282,8 @@ py_library( "framework/load_library.py", "framework/meta_graph.py", "framework/random_seed.py", + "framework/sparse_tensor.py", + "framework/subscribe.py", "framework/tensor_util.py", ], srcs_version = "PY2AND3", @@ -332,6 +353,19 @@ py_test( ], ) +py_test( + name = "framework_subscribe_test", + size = "small", + srcs = ["framework/subscribe_test.py"], + main = "framework/subscribe_test.py", + srcs_version = "PY2AND3", + deps = [ + ":framework_test_lib", + ":platform_test", + "//tensorflow:tensorflow_py", + ], +) + py_test( name = "contrib_test", size = "small", @@ -483,6 +517,19 @@ py_test( ], ) +py_test( + name = "framework_sparse_tensor_test", + size = "small", + srcs = ["framework/sparse_tensor_test.py"], + main = "framework/sparse_tensor_test.py", + srcs_version = "PY2AND3", + deps = [ + ":framework_test_lib", + ":platform_test", + "//tensorflow/core:protos_all_py", + ], +) + py_test( name = "framework_device_test", size = "small", @@ -823,7 +870,10 @@ py_library( py_library( name = "gradients", - srcs = ["ops/gradients.py"], + srcs = [ + "ops/gradients.py", + "ops/gradients_impl.py", + ], srcs_version = "PY2AND3", deps = [ ":array_grad", @@ -2035,7
+2085,6 @@ cuda_py_tests( "training/proximal_gradient_descent_test.py", "training/queue_runner_test.py", "training/rmsprop_test.py", - "training/saver_test.py", "training/slot_creator_test.py", "training/tensorboard_logging_test.py", "training/training_ops_test.py", @@ -2046,6 +2095,17 @@ cuda_py_tests( ], ) +cuda_py_test( + name = "saver_test", + size = "small", + srcs = ["training/saver_test.py"], + additional_deps = [ + ":training", + "//tensorflow:tensorflow_py", + ], + tags = ["manual"], +) + py_test( name = "saver_large_variable_test", size = "small", diff --git a/tensorflow/python/client/session.py b/tensorflow/python/client/session.py index c139f87c323..7518f27c35d 100644 --- a/tensorflow/python/client/session.py +++ b/tensorflow/python/client/session.py @@ -28,6 +28,7 @@ from tensorflow.core.protobuf import config_pb2 from tensorflow.python import pywrap_tensorflow as tf_session from tensorflow.python.framework import errors from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import session_ops from tensorflow.python.platform import tf_logging as logging from tensorflow.python.util import compat @@ -97,10 +98,10 @@ def _get_feeds_for_indexed_slices(feed, feed_val): _REGISTERED_EXPANSIONS = [ # SparseTensors are fetched as SparseTensorValues. They can be fed # SparseTensorValues or normal tuples. - (ops.SparseTensor, + (sparse_tensor.SparseTensor, lambda fetch: ( [fetch.indices, fetch.values, fetch.shape], - lambda fetched_vals: ops.SparseTensorValue(*fetched_vals)), + lambda fetched_vals: sparse_tensor.SparseTensorValue(*fetched_vals)), lambda feed, feed_val: list(zip( [feed.indices, feed.values, feed.shape], feed_val)), lambda feed: [feed.indices, feed.values, feed.shape]), @@ -113,7 +114,7 @@ _REGISTERED_EXPANSIONS = [ _get_indexed_slices_value_from_fetches), _get_feeds_for_indexed_slices, lambda feed: [feed.values, feed.indices] if feed.dense_shape is None - else [feed.values, feed.indices, feed.dense_shape]), + else [feed.values, feed.indices, feed.dense_shape]), # The default catches all other types and performs no expansions. 
(object, lambda fetch: ([fetch], lambda fetched_vals: fetched_vals[0]), diff --git a/tensorflow/python/client/session_test.py b/tensorflow/python/client/session_test.py index e3acbf4c54d..5e9c0256283 100644 --- a/tensorflow/python/client/session_test.py +++ b/tensorflow/python/client/session_test.py @@ -33,6 +33,7 @@ from tensorflow.python.framework import constant_op from tensorflow.python.framework import dtypes from tensorflow.python.framework import errors from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.framework import tensor_util from tensorflow.python.framework import test_util from tensorflow.python.framework import versions @@ -464,7 +465,7 @@ class SessionTest(test_util.TensorFlowTestCase): indices = np.array([[3, 2, 0], [4, 5, 1]]).astype(np.int64) values = np.array([1.0, 2.0]).astype(np.float32) shape = np.array([7, 9, 2]).astype(np.int64) - sp = ops.SparseTensor( + sp = sparse_tensor.SparseTensor( constant_op.constant(indices), constant_op.constant(values), constant_op.constant(shape)) @@ -533,14 +534,14 @@ class SessionTest(test_util.TensorFlowTestCase): indices = np.array([[3, 2, 0], [4, 5, 1]]).astype(np.int64) values = np.array([1.0, 2.0]).astype(np.float32) shape = np.array([7, 9, 2]).astype(np.int64) - sp = ops.SparseTensor( + sp = sparse_tensor.SparseTensor( array_ops.placeholder(dtype=np.int64, shape=(2, 3)), array_ops.placeholder(dtype=np.float32, shape=(2,)), array_ops.placeholder(dtype=np.int64, shape=(3,)),) sp_indices = array_ops.identity(sp.indices) sp_values = array_ops.identity(sp.values) sp_shape = array_ops.identity(sp.shape) - sp2 = ops.SparseTensor(sp_indices, sp_values, sp_shape) + sp2 = sparse_tensor.SparseTensor(sp_indices, sp_values, sp_shape) # Feed with tuple indices_out, values_out, shape_out = s.run( [sp_indices, sp_values, sp_shape], {sp: (indices, values, shape)}) @@ -555,17 +556,19 @@ class SessionTest(test_util.TensorFlowTestCase): # Feed with SparseTensorValue indices_out, values_out, shape_out = s.run( [sp_indices, sp_values, sp_shape], - {sp: ops.SparseTensorValue(indices, values, shape)}) + {sp: sparse_tensor.SparseTensorValue(indices, values, shape)}) self.assertAllEqual(indices_out, indices) self.assertAllEqual(values_out, values) self.assertAllEqual(shape_out, shape) # Feed with SparseTensorValue, fetch SparseTensorValue - sp2_out = s.run(sp2, {sp: ops.SparseTensorValue(indices, values, shape)}) + sp2_out = s.run( + sp2, {sp: sparse_tensor.SparseTensorValue(indices, values, shape)}) self.assertAllEqual(sp2_out.indices, indices) self.assertAllEqual(sp2_out.values, values) self.assertAllEqual(sp2_out.shape, shape) # Feed SparseTensorValue and fetch sp directly. 
- sp_out = s.run(sp, {sp: ops.SparseTensorValue(indices, values, shape)}) + sp_out = s.run( + sp, {sp: sparse_tensor.SparseTensorValue(indices, values, shape)}) self.assertAllEqual(sp_out.indices, indices) self.assertAllEqual(sp_out.values, values) self.assertAllEqual(sp_out.shape, shape) @@ -579,7 +582,7 @@ class SessionTest(test_util.TensorFlowTestCase): sp_indices = array_ops.identity(sp.indices) sp_values = array_ops.identity(sp.values) sp_shape = array_ops.identity(sp.shape) - sp2 = ops.SparseTensor(sp_indices, sp_values, sp_shape) + sp2 = sparse_tensor.SparseTensor(sp_indices, sp_values, sp_shape) # Feed with tuple indices_out, values_out, shape_out = s.run( [sp_indices, sp_values, sp_shape], {sp: (indices, values, shape)}) @@ -589,17 +592,49 @@ class SessionTest(test_util.TensorFlowTestCase): # Feed with SparseTensorValue indices_out, values_out, shape_out = s.run( [sp_indices, sp_values, sp_shape], - {sp: ops.SparseTensorValue(indices, values, shape)}) + {sp: sparse_tensor.SparseTensorValue(indices, values, shape)}) self.assertAllEqual(indices_out, indices) self.assertAllEqual(values_out, values) self.assertAllEqual(shape_out, shape) # Feed with SparseTensorValue, fetch SparseTensorValue - sp2_out = s.run(sp2, {sp: ops.SparseTensorValue(indices, values, shape)}) + sp2_out = s.run( + sp2, {sp: sparse_tensor.SparseTensorValue(indices, values, shape)}) self.assertAllEqual(sp2_out.indices, indices) self.assertAllEqual(sp2_out.values, values) self.assertAllEqual(sp2_out.shape, shape) - def testFeedSparePlaceholderConstantShape(self): + def testFeedSparsePlaceholderPartialShape(self): + with session.Session() as s: + indices = np.array([[3, 2, 0], [4, 5, 1]]).astype(np.int64) + values = np.array([1.0, 2.0]).astype(np.float32) + shape = np.array([7, 9, 2]).astype(np.int64) + sp = array_ops.sparse_placeholder( + shape=[None, 9, 2], dtype=np.float32, name='placeholder1') + sp_indices = array_ops.identity(sp.indices) + sp_values = array_ops.identity(sp.values) + sp_shape = array_ops.identity(sp.shape) + sp2 = sparse_tensor.SparseTensor(sp_indices, sp_values, sp_shape) + # Feed with tuple + indices_out, values_out, shape_out = s.run( + [sp_indices, sp_values, sp_shape], {sp: (indices, values, shape)}) + self.assertAllEqual(indices_out, indices) + self.assertAllEqual(values_out, values) + self.assertAllEqual(shape_out, shape) + # Feed with SparseTensorValue + indices_out, values_out, shape_out = s.run( + [sp_indices, sp_values, sp_shape], + {sp: sparse_tensor.SparseTensorValue(indices, values, shape)}) + self.assertAllEqual(indices_out, indices) + self.assertAllEqual(values_out, values) + self.assertAllEqual(shape_out, shape) + # Feed with SparseTensorValue, fetch SparseTensorValue + sp2_out = s.run( + sp2, {sp: sparse_tensor.SparseTensorValue(indices, values, shape)}) + self.assertAllEqual(sp2_out.indices, indices) + self.assertAllEqual(sp2_out.values, values) + self.assertAllEqual(sp2_out.shape, shape) + + def testFeedSparsePlaceholderConstantShape(self): with session.Session() as s: indices = np.array([[3, 2, 0], [4, 5, 1]]).astype(np.int64) values = np.array([1.0, 2.0]).astype(np.float32) diff --git a/tensorflow/python/debug/BUILD b/tensorflow/python/debug/BUILD index 580bd0e79bf..b948e43501d 100644 --- a/tensorflow/python/debug/BUILD +++ b/tensorflow/python/debug/BUILD @@ -41,6 +41,15 @@ py_library( ], ) +py_library( + name = "stepper", + srcs = ["stepper.py"], + srcs_version = "PY2AND3", + deps = [ + ":debug_data", + ], +) + py_library( name = "framework", srcs = 
["wrappers/framework.py"], @@ -155,6 +164,20 @@ py_test( ], ) +cuda_py_test( + name = "stepper_test", + size = "small", + srcs = [ + "stepper_test.py", + ], + additional_deps = [ + ":stepper", + "//tensorflow:tensorflow_py", + "//tensorflow/python:framework", + "//tensorflow/python:framework_test_lib", + ], +) + py_test( name = "framework_test", size = "small", diff --git a/tensorflow/python/debug/stepper.py b/tensorflow/python/debug/stepper.py new file mode 100644 index 00000000000..d785f47e1e8 --- /dev/null +++ b/tensorflow/python/debug/stepper.py @@ -0,0 +1,617 @@ +# Copyright 2016 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== +"""TensorFlow Debugger (tfdbg) Stepper Module.""" +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +from tensorflow.core.protobuf import config_pb2 +from tensorflow.python.debug import debug_data +from tensorflow.python.framework import ops +from tensorflow.python.ops import session_ops + + +class NodeStepper(object): + """TensorFlow Debugger (tfdbg) stepper. + + The stepper provides ability to perform "continue to" actions on a graph, + given fetch and feeds. The stepper calculates the transitive closure of the + fetch. cont() (continue to) calls can only be performed on members of the + transitive closure. + + On a cont() call, the stepper performs depth-first tracing of the input + tree of the target. When it reaches an input where one of the following is + available, it will supply the available value to the feed_dict of the cont() + call: + (1) TensorHandles from previous cont() calls. + (2) Overriding (injected) values from the client. + (3) Feeds supplied during the construction of the stepper instance. + + Once the tracing is complete, it will issue a run() call on the + underlying session, using the aforementioned feed_dict prepared by the input + tracing, to achieve the "continue-to" action. The above process takes into + account whether the transitive closure of an input contains Variables that + are updated during previous cont() calls on this stepper instance. If such + updates exist, we say the transitive closure is "dirty" and the stepper + can restore the "clean" state of the Variable and avoid using the + TensorHandle. + + Example of basic usage: + a = tf.Variable(1.0, name="a") + b = tf.Variable(2.0, anme="b") + c = tf.add(a, b, name="c") + d = tf.mul(a, c, name="d") + + sess = tf.Session() + sess.run(tf.initialize_all_varialbes()) + stepper = NodeStepper(sess, d) + + stepper.cont(c) # Caches the handle to Tensor c:0. + stepper.cont(d) # Uses handle to Tensor c:0, avoiding recomputing c. + """ + + # Possible types of feed used during cont() calls. + FEED_TYPE_CLIENT = "client" + FEED_TYPE_HANDLE = "handle" + FEED_TYPE_OVERRIDE = "override" + + # TODO(cais): The following member constant is currently unused. 
Use it when + # the stepper is capable of using dumped intermediate tensors. + FEED_TYPE_INTERMEDIATE = "intermediate" + + def __init__(self, sess, fetch, feed_dict=None): + """Constructor for NodeStepper. + + Args: + sess: (Session) the TensorFlow Session to step in. + fetch: (str or TensorFlow graph element) A single fetched Tensor or Op, + or a name (str) representing the Tensor or Op. In the case of a name + str, the graph will be searched to find the corresponding Tensor or Op. + feed_dict: (dict or None) feed dict to be used in this stepper instance. + + TODO(cais): Currently the stepper supports a single fetch. Support list, + tuple or dict of fetches, as in the Session run() interface. + """ + + self._sess = sess + + if isinstance(fetch, str): + # Fetch target is a string. Assume it is the name of the Tensor or Op and + # attempt to find it in the Session's graph. + self._fetch_name = fetch + elif isinstance(fetch, list) or isinstance(fetch, tuple) or isinstance( + fetch, dict): + raise NotImplementedError( + "list, tuple or dict fetches are not supported yet.") + else: + self._fetch_name = fetch.name + self._fetch = self._sess.graph.as_graph_element(self._fetch_name) + + # A map from Variable name to initializer op. + self._variable_initializers = {} + + # A map from Variable name to initial value, used when overriding or + # restoring Variable values. + self._variable_initial_values = {} + + # Initialize the map for output recipients (targets). + self._non_control_output_targets = {} + + # Sorted transitive closure of the fetched node. + self._sorted_transitive_closure = self._dfs_visit(self._sess.graph, + self._fetch) + self._transitive_closure_set = set(self._sorted_transitive_closure) + + # A map from Variable name to the old values (before any cont() calls). + self._cached_variable_values = {} + + # A cache map from tensor name to the variables that may invalidate it. + self._cached_invalidation_path = {} + + # Keep track of which variables are in a dirty state. + self._dirty_variables = set() + + # Cached tensor handles: a dict with keys as tensor names and values as + # tensor handles. + self._tensor_handles = {} + + # Feed dict from the client. + self._client_feed_dict = feed_dict + if not self._client_feed_dict: + self._client_feed_dict = {} + + # Overriding tensor values. + self._override_tensors = {} + + # The feed types used by the last cont() call. + self._last_feed_types = {} + + def _dfs_visit(self, graph, elem): + """Trace back the inputs of a graph element, using depth-first search. + + Uses a non-recursive implementation to prevent stack overflow for deep + graphs. + + Also performs the following action(s): + 1) When encountering a Variable, obtain its initializer op, to + facilitate possible subsequent restoration / overriding of variable + value. + + Args: + graph: A TF graph instance. + elem: A graph element: a Tensor or an Operation. + + Returns: + (list of str) A topologically-sorted list of all graph element names + in the transitive closure of elem. Obviously, the topological sort is + not unique in general. The return value here is just an arbitrary one + of potentially many possible topological sorts. + """ + + # This set should hold only strings, i.e., names of the nodes. + done = set() # Keep track of visited nodes. + + # A list of str: Names of the topologically-sorted graph elements.
+ sorted_node_list = [elem.name] + + elem_stack = [elem] + + while elem_stack: + curr_elem = elem_stack.pop() + curr_node = self._get_node(curr_elem) + + done.add(curr_node.name) + + non_control_inputs = [inp for inp in curr_node.inputs] + control_inputs = [inp for inp in curr_node.control_inputs] + all_inputs = set(non_control_inputs + control_inputs) + + # Iterate through all inputs, control and non-control. + for inp in all_inputs: + is_non_control_input = inp in non_control_inputs + + # Set up the non-control output map. + if is_non_control_input: + if inp.name not in self._non_control_output_targets: + self._non_control_output_targets[inp.name] = set([curr_elem.name]) + else: + self._non_control_output_targets[inp.name].add(curr_elem.name) + + if (inp.op.type == "Variable" and + inp.name not in self._variable_initializers): + # Obtain the initializer op of the variable, in case the Variable's + # value needs to be restored later. + initializer = graph.as_graph_element(inp.op.name + "/Assign") + self._variable_initializers[inp.name] = initializer + self._variable_initial_values[inp.name] = initializer.inputs[1] + + inp_node = self._get_node(inp) + if inp_node.name in done: + # Already visited. + continue + + elem_stack.append(inp) + sorted_node_list.append(inp.name) + + sorted_node_list.reverse() + return sorted_node_list + + def sorted_transitive_closure(self): + """Get a sorted list of transitive inputs to the fetch of the stepper. + + Returns: + (list of str): Sorted transitive inputs to the fetch of the stepper + instance. The fetch itself is included in the list. + """ + + return self._sorted_transitive_closure + + def is_feedable(self, name): + """Determine if a graph element is feedable. + + Args: + name: (str) name of the graph element (Tensor or Operation) + + Returns: + (bool) whether the graph element is feedable. + """ + + if not isinstance(name, str): + raise TypeError("Expected type str; got type %s" % type(name)) + + elem = self._sess.graph.as_graph_element(name) + return self._sess.graph.is_feedable(elem) + + def override_tensor(self, tensor_name, overriding_val): + """Override the value of a tensor. + + Args: + tensor_name: (str) Name of the tensor to override. + overriding_val: (numpy.ndarray) Overriding tensor value. + + Raises: + TypeError: If tensor_name is not a str. + ValueError: If tensor_name does not correspond to a tensor in the input + tree to the fetched graph element of this stepper instance. + """ + + if not isinstance(tensor_name, str): + raise TypeError("Expected type str; got type %s" % type(tensor_name)) + + if tensor_name not in self._transitive_closure_set: + raise ValueError( + "Cannot override tensor \"%s\" because it does not exist in the " + "input tree to the fetch \"%s\"" % (tensor_name, self._fetch_name)) + + self._override_tensors[tensor_name] = overriding_val + + # Invalidate cache by tracing outputs. + self._invalidate_transitively_outgoing_cache(tensor_name) + + def remove_override(self, tensor_name): + """Remove the overriding value on a tensor. + + Args: + tensor_name: (str) name of the tensor to remove the overriding value + from. + + Raises: + ValueError: If no overriding value exists for tensor_name. + """ + + if tensor_name not in self._override_tensors: + raise ValueError("No overriding value exists for tensor \"%s\"." % + tensor_name) + + del self._override_tensors[tensor_name] + + # Invalidate cache by tracing outputs. + self._invalidate_transitively_outgoing_cache(tensor_name) + + def last_feed_types(self): + """Obtain information about the feed in the last cont() call.
+ + Returns: + (dict) A dict mapping tensor names to feed types. + """ + + return self._last_feed_types + + def cont(self, + target, + use_tensor_handles=True, + use_overrides=True, + restore_variable_values=False): + """Continue until the completion of the specified target tensor. + + Args: + target: A single fetched Tensor or Op, or a name (str) representing the + Tensor or Op. In the case of a name str, the graph will be searched + to find the corresponding Tensor or Op. + # TODO(cais): Support multiple fetches as in Session.run() interface. + use_tensor_handles: (bool) Whether this cont() run will use cached tensor + handles to avoid recomputation. Default: True. + use_overrides: (bool) Whether the overriding tensor values supplied by + the client are to be used in this cont() call. Default: True. + restore_variable_values: (bool) Whether the old values of the variables + (before any cont() calls in this object) are to be restored. + + Returns: + Value from Session.run() of the target. + + Raises: + ValueError: If the target is specified as a string and the string does + not correspond to any tensors in the Session graph. + Or if the target of this cont() call is not in the transitive closure + of the stepper's fetch. + Or if target is a Placeholder. + """ + + self._last_feed_types = {} + + if isinstance(target, str): + # Fetch target is a string. Assume it is the name of the Tensor or Op and + # attempt to find it in the Session's graph. + target_name = target + else: + target_name = target.name + + graph_element = self._sess.graph.as_graph_element(target_name) + if (isinstance(graph_element, ops.Tensor) and + graph_element.op.type == "Placeholder"): + raise ValueError("Should not call cont() on a Placeholder") + + # Verify that the target is in the transitive closure of the stepper's + # fetch. + if target_name not in self._transitive_closure_set: + raise ValueError( + "Target \"%s\" is not in the transitive closure for the fetch of the " + "stepper: \"%s\"." % (target_name, self._fetch_name)) + + # Check if a cached tensor handle can be used on the fetch directly. + if use_tensor_handles and target_name in self._tensor_handles: + self._last_feed_types[target_name] = self.FEED_TYPE_HANDLE + return self._tensor_handles[target_name].eval() + + # Check if an overriding tensor value can be used directly. + if use_overrides and target_name in self._override_tensors: + # Override is available. Return the value right away. + self._last_feed_types[target_name] = self.FEED_TYPE_OVERRIDE + return self._override_tensors[target_name] + + # The feeds to be used in the Session.run() call. + feeds = {} + + # Keep track of which variables are restored in this cont() call. + restored_variables = set() + + # Keep track of which variables are "touched" (i.e., possibly updated) in + # this cont() call. + touched_variables = set() + + # ========================================================================= + # Use a non-recursive method to trace the inputs from the node and set up + # the feeds. + fetched = self._sess.graph.as_graph_element(target_name) + elem_stack = [fetched] + done = set() + + while elem_stack: + curr_elem = elem_stack.pop() + curr_node = self._get_node(curr_elem) + + done.add(curr_node.name) + + non_control_inputs = [inp for inp in curr_node.inputs] + control_inputs = [inp for inp in curr_node.control_inputs] + all_inputs = set(non_control_inputs + control_inputs) + + # Iterate through all inputs, control and non-control. + for inp in all_inputs: + # Determine whether the input is feedable.
Reference-type tensors, + # e.g., Variables, should not be fed, because they can change. + if isinstance(inp, ops.Tensor): + is_inp_ref = inp.dtype.is_ref_dtype + can_feed = self._sess.graph.is_feedable(inp) and not is_inp_ref + else: + is_inp_ref = False + can_feed = False + + if (restore_variable_values and inp.name in self._dirty_variables and + inp.name not in restored_variables and + inp.name not in touched_variables): + # Do not restore Variables touched or restored previously in this + # cont() call. + initializer_op = self._variable_initializers[inp.name] + initial_value_tensor = self._variable_initial_values[inp.name] + self._sess.run(initializer_op, + feed_dict={ + initial_value_tensor: + self._cached_variable_values[inp.name] + }) + + # Mark the variable as restored. + restored_variables.add(inp.name) + + # Determine if this is a reference-type input from a variable, and + # the recipient node is not Identity. In that case, the Variable + # needs to be marked as dirty and its current value recorded, because + # the receiving op may mutate the value of the Variable. + if (is_inp_ref and inp.op.type == "Variable" and + curr_node.type != "Identity"): + # Mark the variable as dirty. + touched_variables.add(inp.name) + + # Obtain the old value of the variable and cache it. + if inp.name not in self._cached_variable_values: + old_value = self._sess.run(inp) + self._cached_variable_values[inp.name] = old_value + + # N.B.: The order of the logical branches matters. For example, + # _client_feed_dict comes after _tensor_handles, so that tensor + # handles stored in cont() calls can override the original client + # feeds. Similarly, _override_tensors comes first, so a manual + # override, if one exists, always takes effect. + if use_overrides and can_feed and inp.name in self._override_tensors: + # Use client-supplied overriding tensor value. + feeds[inp] = self._override_tensors[inp.name] + self._last_feed_types[inp.name] = self.FEED_TYPE_OVERRIDE + elif (use_tensor_handles and can_feed and + inp.name in self._tensor_handles and inp not in feeds): + # Tensor handle found in cache. + feeds[inp] = self._tensor_handles[inp.name].eval() + self._last_feed_types[inp.name] = self.FEED_TYPE_HANDLE + elif inp in self._client_feed_dict: + # This input is available in the client feed_dict. + feeds[inp] = self._client_feed_dict[inp] + self._last_feed_types[inp.name] = self.FEED_TYPE_CLIENT + else: + # There is no feed available for this input. So keep tracing its + # input(s). + inp_node = self._get_node(inp) + if inp_node.name in done: + # Already visited. + continue + + elem_stack.append(inp) + done.add(inp_node.name) + + # ========================================================================= + + if touched_variables: + self._dirty_variables.update(touched_variables) + + for variable in restored_variables: + self._dirty_variables.remove(variable) + + # Prepare RunOptions for DebugTensorWatches + run_options = config_pb2.RunOptions() + # TODO(cais): Add fields for watching intermediate tensors. + + if isinstance(fetched, ops.Operation): + # The fetched is an Operation: Will not get tensor handle. + self._sess.run(fetched, feed_dict=feeds, options=run_options) + # A run of an Operation yields no return value. + return_value = None + else: + # This is a Tensor: Will get tensor handle and cache it.
+ target_handle = self._sess.run(session_ops.get_session_handle(fetched), + feed_dict=feeds, + options=run_options) + self._tensor_handles[target_name] = target_handle + return_value = target_handle.eval() + + # Invalidate caches at the end, for Operation and Tensor fetches alike. + for touched_variable in touched_variables: + self._invalidate_transitively_outgoing_cache(touched_variable) + + return return_value + + def _invalidate_transitively_outgoing_cache(self, source_element): + """Invalidate the cached tensor handles by tracing output. + + This method is used to invalidate caches such as cached TensorHandles + and intermediate tensor values when Variable mutation happens or when + client overrides tensor values. + + Uses a non-recursive implementation to avoid stack overflow on deep + networks. + + TODO(cais): Currently, only TensorHandle caches are invalidated. Invalidate + cached intermediate tensor values from dumps when dumps are added. + + Args: + source_element: The source graph element (e.g., a Variable output slot) + to trace the output from. + """ + + if not self._tensor_handles: + return + + # First, use cached invalidation paths to eliminate some cached tensor + # handles. Iterate over a copy of the keys, because entries may be deleted + # inside the loop. + for handle_name in list(self._tensor_handles): + if (handle_name in self._cached_invalidation_path and + source_element in self._cached_invalidation_path[handle_name]): + del self._tensor_handles[handle_name] + + if not self._tensor_handles: + return + + stack = [source_element] + done = set() + + while stack: + curr_element = stack.pop() + + done.add(curr_element) + + if curr_element in self._tensor_handles: + # Cache the invalidation path for potential future use. + if curr_element not in self._cached_invalidation_path: + self._cached_invalidation_path[curr_element] = set([source_element]) + else: + self._cached_invalidation_path[curr_element].add(source_element) + + del self._tensor_handles[curr_element] + + targets = self._non_control_output_targets.get(curr_element, []) + for target in targets: + if target in done: + continue + else: + stack.append(target) + + def finalize(self): + """Run the final fetch(es). + + Restore the dirty variables; ignore the client-supplied overriding tensor + values. + + Returns: + The same return value as self.cont() called on the final fetch. + """ + + return self.cont( + self._fetch, + use_tensor_handles=False, + use_overrides=False, + restore_variable_values=True) + + def handle_names(self): + """Return names of the TensorHandles that the debugger is holding. + + Returns: + (list of str) Names of the tensors for which a TensorHandle is + available. + """ + return list(self._tensor_handles) + + def dirty_variables(self): + """Get the set of variables that are currently "dirty". + + "dirty" means: + previous cont() calls have updated the value of the Variable, + and the Variable's old value (the value before any cont() calls + happened) was not restored. + + Returns: + (set) A set of dirty variables. + """ + + return self._dirty_variables + + def get_tensor_value(self, tensor_name): + """Get the value of a tensor that the stepper has access to. + + Args: + tensor_name: (str) Name of the tensor. + + Returns: + Value of the tensor, from overriding values or cached tensor handles. + + Raises: + ValueError: If the value is not available as an overriding value + or through a TensorHandle.
+ """ + + if tensor_name in self._override_tensors: + return self._override_tensors[tensor_name] + elif tensor_name in self._tensor_handles: + return self._tensor_handles[tensor_name].eval() + else: + raise ValueError( + "This stepper instance does not have access to the value of " + "tensor \"%s\"" % tensor_name) + + def get_fetch_result(self): + return self.get_tensor_value(self._fetch_name) + + def override_names(self): + """Return names of the TensorHandles that the debugger is holding. + + Returns: + (list of str) Name of the tensor for which overriding tensor values are + available. + """ + return [name for name in self._override_tensors] + + def _get_node(self, element): + """Get the node of a graph element. + + Args: + element: A graph element (Op, Tensor or Node) + + Returns: + The node associated with element in the graph. + """ + + node_name, _ = debug_data.parse_node_or_tensor_name(element.name) + return self._sess.graph.as_graph_element(node_name) diff --git a/tensorflow/python/debug/stepper_test.py b/tensorflow/python/debug/stepper_test.py new file mode 100644 index 00000000000..670ae5b3a13 --- /dev/null +++ b/tensorflow/python/debug/stepper_test.py @@ -0,0 +1,609 @@ +# Copyright 2016 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== +"""Unit tests of the tfdbg Stepper.""" +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import tensorflow as tf + +from tensorflow.python.debug.stepper import NodeStepper +from tensorflow.python.framework import test_util +from tensorflow.python.platform import googletest + + +class StepperTest(test_util.TensorFlowTestCase): + + def setUp(self): + self.a = tf.Variable(2.0, name="a") + self.b = tf.Variable(3.0, name="b") + + self.c = tf.mul(self.a, self.b, name="c") # Should be 6.0. + self.d = tf.mul(self.a, self.a, name="d") # Should be 4.0. + + self.e = tf.mul(self.d, self.c, name="e") # Should be 24.0. + + self.f = tf.div(self.b, 0.30, name="f") # Should be 20.0. + + self.sess = tf.Session() + self.sess.run(tf.initialize_all_variables()) + + def tearDown(self): + tf.reset_default_graph() + + def testAttemptToContToFetchNotInTransitiveClosure(self): + stepper = NodeStepper(self.sess, "e:0") + + self.assertEqual( + ["a:0", "b:0", "b/read:0", "a/read:0", "c:0", "d:0", "e:0"], + stepper.sorted_transitive_closure()) + + with self.assertRaisesRegexp( + ValueError, + "Target \"f:0\" is not in the transitive closure for the fetch of the " + "stepper: \"e:0\""): + stepper.cont("f:0") + + def testUsingNamesNotUsingIntermediateTensors(self): + stepper = NodeStepper(self.sess, "e:0") + + # The first cont() call should have used no feeds. + result = stepper.cont("c:0") + self.assertAllClose(6.0, result) + self.assertEqual({}, stepper.last_feed_types()) + + # The second cont() call should have used the tensor handle from the + # previous cont() call. 
+ result = stepper.cont("e:0") + self.assertAllClose(24.0, result) + self.assertEqual({ + "c:0": NodeStepper.FEED_TYPE_HANDLE + }, stepper.last_feed_types()) + + def testUsingNodesNotUsingIntermediateTensors(self): + stepper = NodeStepper(self.sess, self.e) + + # There should be no handles before any cont() calls. + self.assertEqual([], stepper.handle_names()) + + # Before the cont() call, the stepper should not have access to the value + # of c:0. + with self.assertRaisesRegexp( + ValueError, + "This stepper instance does not have access to the value of tensor " + "\"c:0\""): + stepper.get_tensor_value("c:0") + + # Using the node/tensor itself, instead of the name str, should work on + # cont(). + result = stepper.cont(self.c) + self.assertAllClose(6.0, result) + self.assertEqual({}, stepper.last_feed_types()) + + self.assertEqual(["c:0"], stepper.handle_names()) + + # After the cont() call, the stepper should have access to the value of c:0 + # via a tensor handle. + self.assertAllClose(6.0, stepper.get_tensor_value("c:0")) + + result = stepper.cont(self.e) + self.assertAllClose(24.0, result) + self.assertEqual({ + "c:0": NodeStepper.FEED_TYPE_HANDLE + }, stepper.last_feed_types()) + + def testIsFeedable(self): + stepper = NodeStepper(self.sess, self.e) + + self.assertTrue(stepper.is_feedable("a/read:0")) + self.assertTrue(stepper.is_feedable("b/read:0")) + self.assertTrue(stepper.is_feedable("c:0")) + self.assertTrue(stepper.is_feedable("d:0")) + + def testOverrideValue(self): + stepper = NodeStepper(self.sess, self.e) + + result = stepper.cont(self.c) + self.assertAllClose(6.0, result) + self.assertEqual({}, stepper.last_feed_types()) + + # There should be no overrides before any cont() calls. + self.assertEqual([], stepper.override_names()) + + # Calling cont() on c again should lead to use of the handle. + result = stepper.cont(self.c) + self.assertAllClose(6.0, result) + self.assertEqual({ + "c:0": NodeStepper.FEED_TYPE_HANDLE + }, stepper.last_feed_types()) + + # Override c:0. + stepper.override_tensor("c:0", 7.0) + + # After the overriding, calling get_tensor_value() on c:0 should yield the + # overriding value. + self.assertEqual(7.0, stepper.get_tensor_value("c:0")) + + # Now c:0 should have only an override value, but no cached handle, because + # the handle should have been invalidated. + self.assertEqual([], stepper.handle_names()) + self.assertEqual(["c:0"], stepper.override_names()) + + # Run a downstream tensor after the value override. + result = stepper.cont(self.e) + self.assertAllClose(28.0, result) # Should reflect the overriding value. + + # Should use override, instead of the handle. + self.assertEqual({ + "c:0": NodeStepper.FEED_TYPE_OVERRIDE + }, stepper.last_feed_types()) + + def testOverrideValueTwice(self): + stepper = NodeStepper(self.sess, self.e) + + # Override once. + stepper.override_tensor("c:0", 7.0) + self.assertAllClose(28.0, stepper.cont(self.e)) + self.assertEqual({ + "c:0": NodeStepper.FEED_TYPE_OVERRIDE + }, stepper.last_feed_types()) + + self.assertEqual(["e:0"], stepper.handle_names()) + self.assertEqual(["c:0"], stepper.override_names()) + + # Calling cont(self.e) again. This time the cached tensor handle of e + # should be used. + self.assertEqual(28.0, stepper.cont(self.e)) + self.assertEqual({ + "e:0": NodeStepper.FEED_TYPE_HANDLE + }, stepper.last_feed_types()) + + # Override c again. This should have invalidated the cache for e. 
+ stepper.override_tensor("c:0", 8.0) + + self.assertEqual([], stepper.handle_names()) + self.assertEqual(["c:0"], stepper.override_names()) + + self.assertAllClose(32.0, stepper.cont(self.e)) + self.assertEqual({ + "c:0": NodeStepper.FEED_TYPE_OVERRIDE + }, stepper.last_feed_types()) + + def testRemoveOverrideValue(self): + stepper = NodeStepper(self.sess, self.e) + + result = stepper.cont(self.c) + self.assertAllClose(6.0, result) + self.assertEqual({}, stepper.last_feed_types()) + + # The previous cont() step should have generated a cached tensor handle. + self.assertEqual(["c:0"], stepper.handle_names()) + + # Override c:0. + stepper.override_tensor("c:0", 7.0) + + # The overriding should have invalidated the tensor handle. + self.assertEqual([], stepper.handle_names()) + self.assertEqual(["c:0"], stepper.override_names()) + + result = stepper.cont(self.e) + self.assertAllClose(28.0, result) # Should reflect the overriding value. + self.assertEqual({ + "c:0": NodeStepper.FEED_TYPE_OVERRIDE + }, stepper.last_feed_types()) + + # The handle to tensor e:0 should have been cached, even though its + # transitive closure contains an override. + self.assertIn("e:0", stepper.handle_names()) + + # Remove the override. + stepper.remove_override("c:0") + # c:0 should not be in the overrides anymore. + self.assertEqual([], stepper.override_names()) + + # Removing the override should have invalidated the tensor handle for e. + self.assertNotIn("e:0", stepper.handle_names()) + + # Should reflect the non-overriding value. + self.assertAllClose(24.0, stepper.cont(self.e)) + + # This time, the handle to tensor e:0 should have been cached again, now + # that its transitive closure no longer contains an override. + self.assertIn("e:0", stepper.handle_names()) + + # Calling cont(self.e) again should have used the tensor handle to e:0. + self.assertAllClose(24.0, stepper.cont(self.e)) + self.assertEqual({ + "e:0": NodeStepper.FEED_TYPE_HANDLE + }, stepper.last_feed_types()) + + def testOverrideAndContToSameTensor(self): + stepper = NodeStepper(self.sess, self.e) + + result = stepper.cont(self.c) + self.assertAllClose(6.0, result) + self.assertEqual({}, stepper.last_feed_types()) + self.assertEqual(["c:0"], stepper.handle_names()) + + self.assertAllClose(6.0, stepper.cont(self.c)) + + # The last cont() call should use the tensor handle directly. + self.assertEqual({ + "c:0": NodeStepper.FEED_TYPE_HANDLE + }, stepper.last_feed_types()) + + # Override c:0. + stepper.override_tensor("c:0", 7.0) + + # As a result of the override, the tensor handle should have been + # invalidated. + self.assertEqual([], stepper.handle_names()) + + result = stepper.cont(self.c) + self.assertAllClose(7.0, result) + + self.assertEqual({ + "c:0": NodeStepper.FEED_TYPE_OVERRIDE + }, stepper.last_feed_types()) + + def testFinalizeWithPreviousOverrides(self): + stepper = NodeStepper(self.sess, self.e) + + stepper.override_tensor("a/read:0", 20.0) + self.assertEqual(["a/read:0"], stepper.override_names()) + + # Should reflect the overriding value. + self.assertAllClose(24000.0, stepper.cont("e:0")) + self.assertEqual({ + "a/read:0": NodeStepper.FEED_TYPE_OVERRIDE + }, stepper.last_feed_types()) + + # Finalize call should have ignored the overriding value.
self.assertAllClose(24.0, stepper.finalize()) + + def testRemoveNonexistentOverrideValue(self): + stepper = NodeStepper(self.sess, self.e) + self.assertEqual([], stepper.override_names()) + + with self.assertRaisesRegexp( + ValueError, "No overriding value exists for tensor \"c:0\""): + stepper.remove_override("c:0") + + def testAttemptToOverrideInvalidTensor(self): + stepper = NodeStepper(self.sess, self.e) + + with self.assertRaisesRegexp(ValueError, "Cannot override tensor \"f:0\""): + stepper.override_tensor("f:0", 42.0) + + def testInvalidOverrideArgumentType(self): + stepper = NodeStepper(self.sess, self.e) + + with self.assertRaisesRegexp(TypeError, "Expected type str; got type"): + stepper.override_tensor(self.a, 42.0) + + +class StepperTestWithPlaceHolders(test_util.TensorFlowTestCase): + + def setUp(self): + self.ph0 = tf.placeholder(tf.float32, shape=(2, 2), name="ph0") + self.ph1 = tf.placeholder(tf.float32, shape=(2, 1), name="ph1") + + self.x = tf.matmul(self.ph0, self.ph1, name="x") + self.y = tf.add(self.x, self.ph1, name="y") + + self.sess = tf.Session() + + def tearDown(self): + tf.reset_default_graph() + + def testContWithPlaceholders(self): + stepper = NodeStepper( + self.sess, + self.y, + feed_dict={ + self.ph0: [[1.0, 2.0], [-3.0, 5.0]], + self.ph1: [[-1.0], [0.5]] + }) + + self.assertEqual(["ph0:0", "ph1:0", "x:0", "y:0"], + stepper.sorted_transitive_closure()) + + result = stepper.cont(self.x) + self.assertAllClose([[0.0], [5.5]], result) + self.assertEqual({ + "ph0:0": NodeStepper.FEED_TYPE_CLIENT, + "ph1:0": NodeStepper.FEED_TYPE_CLIENT, + }, stepper.last_feed_types()) + + self.assertEqual(["x:0"], stepper.handle_names()) + + result = stepper.cont(self.y) + self.assertAllClose([[-1.0], [6.0]], result) + self.assertEqual({ + "x:0": NodeStepper.FEED_TYPE_HANDLE, + "ph1:0": NodeStepper.FEED_TYPE_CLIENT, + }, stepper.last_feed_types()) + + def testAttemptToContToPlaceholder(self): + stepper = NodeStepper( + self.sess, + self.y, + feed_dict={ + self.ph0: [[1.0, 2.0], [-3.0, 5.0]], + self.ph1: [[-1.0], [0.5]] + }) + + with self.assertRaisesRegexp(ValueError, + r"Should not call cont\(\) on a Placeholder"): + stepper.cont(self.ph0) + + +class StepperBackwardRunTest(test_util.TensorFlowTestCase): + + def setUp(self): + """Test setup. + + Structure of the forward graph: + f + | | + ----- ----- + | | + d e + | | | | + --- --------- --- + | | | + a b c + + Construct a backward graph using the GradientDescentOptimizer. + """ + + self.a = tf.Variable(1.0, name="a") + self.b = tf.Variable(2.0, name="b") + self.c = tf.Variable(4.0, name="c") + self.d = tf.mul(self.a, self.b, name="d") + self.e = tf.mul(self.b, self.c, name="e") + self.f = tf.mul(self.d, self.e, name="f") + + # Gradient descent optimizer that minimizes f. + tf.train.GradientDescentOptimizer(0.01).minimize(self.f, name="optim") + + self.sess = tf.Session() + self.sess.run(tf.initialize_all_variables()) + + def tearDown(self): + tf.reset_default_graph() + + def testContToUpdateA(self): + stepper = NodeStepper(self.sess, "optim") + + result = stepper.cont("a:0") + self.assertAllClose(1.0, result) + self.assertEqual({}, stepper.last_feed_types()) + + result = stepper.cont("optim/learning_rate:0") + self.assertAllClose(0.01, result) + self.assertEqual({}, stepper.last_feed_types()) + + # Before any cont calls on ApplyGradientDescent, there should be no "dirty" + # variables. + self.assertEqual(set(), stepper.dirty_variables()) + + # First, cont() to one of the two control inputs to optim.
+ result = stepper.cont("optim/update_a/ApplyGradientDescent") + + # Now variable a should have been marked as dirty due to the update + # by optim/update_a/ApplyGradientDescent. + self.assertEqual({"a:0"}, stepper.dirty_variables()) + self.assertIsNone(result) + self.assertEqual({ + "optim/learning_rate:0": NodeStepper.FEED_TYPE_HANDLE + }, stepper.last_feed_types()) + + # Check that Variable "a" has been updated properly, but "b" and "c" + # remain the same. + # For backprop on Variable a: + # Because f = a * b * b * c, df / da = b * b * c. + # 1.0 - learning_rate * b * b * c + # = 1.0 - 0.01 * 2.0 * 2.0 * 4.0 = 0.84. + self.assertAllClose(0.84, self.sess.run(self.a)) + self.assertAllClose(2.0, self.sess.run(self.b)) + self.assertAllClose(4.0, self.sess.run(self.c)) + + def testContToUpdateB(self): + stepper = NodeStepper(self.sess, "optim") + + result = stepper.cont("optim/update_b/ApplyGradientDescent") + self.assertIsNone(result) + self.assertEqual(set(["b:0"]), stepper.dirty_variables()) + + # For backprop on Variable b: + # Because f = a * b * b * c, df / db = 2 * a * b * c. + # 2.0 - learning_rate * 2 * a * b * c + # = 2.0 - 0.01 * 2 * 1.0 * 2.0 * 4.0 = 1.84 + self.assertAllClose(1.0, self.sess.run(self.a)) + self.assertAllClose(1.84, self.sess.run(self.b)) + self.assertAllClose(4.0, self.sess.run(self.c)) + + def testContAfterUpdateWithoutRestoringVariableValue(self): + stepper = NodeStepper(self.sess, "optim") + + # First, update Variable a from 1.0 to 0.84. + result = stepper.cont("optim/update_a/ApplyGradientDescent", + restore_variable_values=True) + self.assertIsNone(result) + self.assertEqual(set(["a:0"]), stepper.dirty_variables()) + self.assertAllClose(0.84, self.sess.run(self.a)) + self.assertAllClose(2.0, self.sess.run(self.b)) + self.assertAllClose(4.0, self.sess.run(self.c)) + + # Second, update Variable b with restore_variable_values=False. + result = stepper.cont( + "optim/update_b/ApplyGradientDescent", restore_variable_values=False) + self.assertIsNone(result) + # For the backprop on Variable b under the updated value of a: + # 2.0 - learning_rate * 2 * a' * b * c + # = 2.0 - 0.01 * 2 * 0.84 * 2.0 * 4.0 = 1.8656 + self.assertAllClose(0.84, self.sess.run(self.a)) + self.assertAllClose(1.8656, self.sess.run(self.b)) + self.assertAllClose(4.0, self.sess.run(self.c)) + + def testUpdateTwiceRestoreVariable(self): + stepper = NodeStepper(self.sess, "optim") + + result = stepper.cont("optim/update_a/ApplyGradientDescent", + restore_variable_values=True) + self.assertIsNone(result) + self.assertEqual({"a:0"}, stepper.dirty_variables()) + + result = stepper.cont("optim/update_b/ApplyGradientDescent", + restore_variable_values=True) + self.assertIsNone(result) + # Variable a should have been restored and hence is no longer dirty. + # Variable b should have been marked as dirty. + self.assertEqual({"b:0"}, stepper.dirty_variables()) + + # The result of the update should be identical to what it would be if only + # update_b had run. + self.assertAllClose(1.0, self.sess.run(self.a)) + self.assertAllClose(1.84, self.sess.run(self.b)) + self.assertAllClose(4.0, self.sess.run(self.c)) + + def testSelectiveHandleUsageDependingOnTransitiveCleanliness(self): + """Test that tensor handles are used only when the closure is clean. + + "clean" means no Variables have been updated by preceding cont() calls. + """ + + stepper = NodeStepper(self.sess, "optim") + + # First, call cont() on the two tensors on the intermediate level: d and e.
+ result = stepper.cont("d:0") + self.assertAllClose(2.0, result) + self.assertEqual({}, stepper.last_feed_types()) + self.assertEqual(set(), stepper.dirty_variables()) + + # The cont call above should have restored Variable "b". + result = stepper.cont("e:0") + self.assertAllClose(8.0, result) + self.assertEqual({}, stepper.last_feed_types()) + self.assertEqual(set(), stepper.dirty_variables()) + + # Now run update_a, so as to let Variable a be diry. + result = stepper.cont("optim/update_a/ApplyGradientDescent", + restore_variable_values=True) + self.assertIsNone(result) + self.assertEqual({"a:0"}, stepper.dirty_variables()) + + # Now, run update_b. + result = stepper.cont("optim/update_b/ApplyGradientDescent", + restore_variable_values=True) + self.assertIsNone(result) + + # The last cont() run should have use the handle of tensor e, but not the + # handle of tensor d, because the transitive closure of e is clean, whereas + # that of d is dirty due to the update to a in the previous cont() call. + self.assertEqual({ + "e:0": NodeStepper.FEED_TYPE_HANDLE + }, stepper.last_feed_types()) + + # The result of the update_b should be identical to as if no other + # update_* cont() calls have occurred before. + self.assertAllClose(1.0, self.sess.run(self.a)) + self.assertAllClose(1.84, self.sess.run(self.b)) + self.assertAllClose(4.0, self.sess.run(self.c)) + + def testFinalize(self): + """Test finalize() to restore variables and run the original fetch.""" + + stepper = NodeStepper(self.sess, "optim") + + # Invoke update_b before calling finalize. + stepper.cont("optim/update_b/ApplyGradientDescent", + restore_variable_values=True) + + result = stepper.finalize() + self.assertIsNone(result) + + # The results of the Variable updates should be the same as if no cont() + # call has occurred on update_b. + self.assertAllClose(0.84, self.sess.run(self.a)) + self.assertAllClose(1.84, self.sess.run(self.b)) + self.assertAllClose(3.96, self.sess.run(self.c)) + + def testOverrideThenContToUpdate(self): + """Test cont() to update nodes after overriding tensor values.""" + + stepper = NodeStepper(self.sess, "optim") + + result = stepper.cont("d:0") + self.assertAllClose(2.0, result) + self.assertEqual({}, stepper.last_feed_types()) + self.assertEqual(set(), stepper.dirty_variables()) + self.assertEqual(["d:0"], stepper.handle_names()) + + # Override the value from 1.0 to 10.0. + stepper.override_tensor("a/read:0", 10.0) + + self.assertEqual(["a/read:0"], stepper.override_names()) + + result = stepper.cont("optim/update_c/ApplyGradientDescent", + restore_variable_values=True) + self.assertIsNone(result) + + # The last cont() call should have not used the tensor handle to d:0, + # because the transitive closure of d:0 contains an override tensor. + self.assertEqual({ + "a/read:0": NodeStepper.FEED_TYPE_OVERRIDE + }, stepper.last_feed_types()) + + # The tensor handle to d:0 should have been removed due to the dirty + # transitive closure. + self.assertEqual([], stepper.handle_names()) + + # For this backprop on c, the overriding value of a/read:0 should have been + # used: + # 4.0 - learning_rate * a * b * b + # = 4.0 - 0.01 * 10.0 * 2.0 * 2.0 = 3.6. + self.assertAllClose(3.6, self.sess.run(self.c)) + + # Now remove the overriding value of a/read:0. + stepper.remove_override("a/read:0") + self.assertEqual([], stepper.override_names()) + + # Obtain the tensor handle to d:0 again. 
+ result = stepper.cont("d:0") + self.assertAllClose(2.0, result) + self.assertEqual(["d:0"], stepper.handle_names()) + + # Then call update_c again, without restoring c. + result = stepper.cont( + "optim/update_c/ApplyGradientDescent", restore_variable_values=False) + self.assertIsNone(result) + + # This time, the d:0 tensor handle should have been used, because its + # transitive closure is clean. + self.assertEqual({ + "d:0": NodeStepper.FEED_TYPE_HANDLE + }, stepper.last_feed_types()) + + # For this backprop on c, the original value of a/read:0 (1.0) should have + # been used, because the override has been removed: + # 3.6 - learning_rate * a * b * b + # = 3.6 - 0.01 * 1.0 * 2.0 * 2.0 = 3.56. + self.assertAllClose(3.56, self.sess.run(self.c)) + + +if __name__ == "__main__": + googletest.main() diff --git a/tensorflow/python/framework/common_shapes.py b/tensorflow/python/framework/common_shapes.py index 09afe56b191..c8867b4b1b0 100644 --- a/tensorflow/python/framework/common_shapes.py +++ b/tensorflow/python/framework/common_shapes.py @@ -552,7 +552,9 @@ def broadcast_shape(shape_x, shape_y): return tensor_shape.TensorShape(return_dims) -def call_cpp_shape_fn(op, input_tensors_needed=None, +def call_cpp_shape_fn(op, + input_tensors_needed=None, + input_tensors_as_shapes_needed=None, debug_python_shape_fn=None): """A shape function that delegates to the registered C++ shape function. @@ -560,6 +562,8 @@ def call_cpp_shape_fn(op, input_tensors_needed=None, op: the node in the graph for which to compute output shapes. input_tensors_needed: a list of input tensor indices for which to compute the input tensor's value and pass to the C++ shape function. + input_tensors_as_shapes_needed: a list of input tensor indices for which to + compute the constant_value_as_shape and pass to the C++ shape function. debug_python_shape_fn: For testing only during migration to using call_cpp_shape_fn. Do not submit calls that set this, as the comparison is slow.
If non-None, the python shape function; @@ -594,16 +598,25 @@ def call_cpp_shape_fn(op, input_tensors_needed=None, input_tensors = [None for i in input_shapes] if input_tensors_needed: for idx in input_tensors_needed: - input_tensors[idx] = tensor_util.constant_value(op.inputs[idx]) - if input_tensors[idx] is not None: - input_tensors[idx] = np.asarray(input_tensors[idx]) + v = tensor_util.constant_value(op.inputs[idx]) + if v is not None: + input_tensors[idx] = np.asarray(v) + + serialized_unknown_shape = ( + tensor_shape.TensorShape(None).as_proto().SerializeToString()) + arr = [serialized_unknown_shape for i in input_shapes] + if input_tensors_as_shapes_needed: + for idx in input_tensors_as_shapes_needed: + s = tensor_util.constant_value_as_shape(op.inputs[idx]) + if s is not None: + arr[idx] = s.as_proto().SerializeToString() + input_tensors_as_shapes = arr try: with errors.raise_exception_on_not_ok_status() as status: - output_shapes = pywrap_tensorflow.RunCppShapeInference(node_def_str, - input_shapes, - input_tensors, - status) + output_shapes = pywrap_tensorflow.RunCppShapeInference( + node_def_str, input_shapes, input_tensors, input_tensors_as_shapes, + status) except errors.InvalidArgumentError as err: raise ValueError(err.message) diff --git a/tensorflow/python/framework/cpp_shape_inference.cc b/tensorflow/python/framework/cpp_shape_inference.cc index 57b85e81187..7620b52f9fc 100644 --- a/tensorflow/python/framework/cpp_shape_inference.cc +++ b/tensorflow/python/framework/cpp_shape_inference.cc @@ -50,6 +50,7 @@ Status RunCppShapeInferenceImpl( const string& serialized_node_def, const std::vector& input_serialized_shapes, const std::vector& input_constant_tensor_values, + const std::vector& input_constant_tensor_as_shape_values, std::vector* output_tensor_shape_protos) { tensorflow::NodeDef node; if (!node.ParseFromString(serialized_node_def)) { @@ -87,10 +88,9 @@ Status RunCppShapeInferenceImpl( } // Convert input tensor values; - const int num_input_tensors = input_constant_tensor_values.size(); - std::vector input_tensor_values(num_input_tensors); + std::vector input_tensor_values(input_constant_tensor_values.size()); std::vector input_tensors; - for (int i = 0; i < num_input_tensors; ++i) { + for (int i = 0; i < input_constant_tensor_values.size(); ++i) { auto* py_val = input_constant_tensor_values[i]; if (py_val == Py_None) { input_tensors.push_back(nullptr); @@ -101,11 +101,21 @@ Status RunCppShapeInferenceImpl( } } + // Convert input tensor-as-shape values; + std::vector input_tensor_as_shapes_protos( + input_constant_tensor_as_shape_values.size()); + for (int i = 0; i < input_constant_tensor_as_shape_values.size(); ++i) { + if (!input_tensor_as_shapes_protos[i].ParseFromString( + input_constant_tensor_as_shape_values[i])) { + return errors::InvalidArgument( + "Error parsing shape proto during cpp shape inference"); + } + } + // Run shape inference. 
tensorflow::shape_inference::InferenceContext c( &node, op_reg_data->op_def, input_shapes, input_tensors, - {} /* input_tensors_as_shapes */, input_handle_shapes, - input_handle_dtypes); + input_tensor_as_shapes_protos, input_handle_shapes, input_handle_dtypes); TF_RETURN_IF_ERROR(c.construction_status()); TF_RETURN_IF_ERROR(c.Run(op_reg_data->shape_inference_fn)); @@ -130,16 +140,17 @@ Status RunCppShapeInferenceImpl( std::vector RunCppShapeInference( const string& serialized_node_def, const std::vector& input_serialized_shapes, - PyObject* input_constant_tensor_values, TF_Status* out_status) { + PyObject* input_constant_tensor_values, + const std::vector& input_constant_tensor_as_shape_values, + TF_Status* out_status) { if (!PyList_Check(input_constant_tensor_values)) { TF_SetStatus(out_status, TF_INVALID_ARGUMENT, "Invalid python value"); return std::vector(); } std::vector input_constant_tensor_values_v; - int num_input_constant_tensor_values = - PyList_Size(input_constant_tensor_values); - for (int i = 0; i < num_input_constant_tensor_values; ++i) { + int cnt = PyList_Size(input_constant_tensor_values); + for (int i = 0; i < cnt; ++i) { input_constant_tensor_values_v.push_back( PyList_GetItem(input_constant_tensor_values, i)); } @@ -147,7 +158,8 @@ std::vector RunCppShapeInference( std::vector output_tensor_shape_protos; tensorflow::Status status = RunCppShapeInferenceImpl( serialized_node_def, input_serialized_shapes, - input_constant_tensor_values_v, &output_tensor_shape_protos); + input_constant_tensor_values_v, input_constant_tensor_as_shape_values, + &output_tensor_shape_protos); Set_TF_Status_from_Status(out_status, status); return status.ok() ? output_tensor_shape_protos : std::vector(); diff --git a/tensorflow/python/framework/cpp_shape_inference.h b/tensorflow/python/framework/cpp_shape_inference.h index f91af8e1a84..b4893829939 100644 --- a/tensorflow/python/framework/cpp_shape_inference.h +++ b/tensorflow/python/framework/cpp_shape_inference.h @@ -44,7 +44,9 @@ namespace swig { std::vector RunCppShapeInference( const string& serialized_node_def, const std::vector& input_serialized_shapes, - PyObject* input_constant_tensor_values, TF_Status* out_status); + PyObject* input_constant_tensor_values, + const std::vector& input_constant_tensor_as_shape_values, + TF_Status* out_status); } // namespace swig } // namespace tensorflow diff --git a/tensorflow/python/framework/docs.py b/tensorflow/python/framework/docs.py index 6cc8ab34143..442b8033b42 100644 --- a/tensorflow/python/framework/docs.py +++ b/tensorflow/python/framework/docs.py @@ -85,7 +85,7 @@ class Index(Document): print("# TensorFlow Python reference documentation", file=f) print("", file=f) fullname_f = lambda name: self._members[name][0] - anchor_f = lambda name: _get_anchor(self._module_to_name, fullname_f(name)) + anchor_f = lambda name: get_anchor(self._module_to_name, fullname_f(name)) for filename, library in self._filename_to_library_map: sorted_names = sorted(library.mentioned, key=lambda x: (str.lower(x), x)) @@ -142,7 +142,7 @@ def collect_members(module_to_name, exclude=()): return members -def _get_anchor(module_to_name, fullname): +def get_anchor(module_to_name, fullname): """Turn a full member name into an anchor. 
Args: @@ -416,7 +416,7 @@ class Library(Document): heading = prefix + " `" + fullname if not isinstance(func, property): heading += self._generate_signature_for_function(func) - heading += "` {#%s}" % _get_anchor(self._module_to_name, fullname) + heading += "` {#%s}" % get_anchor(self._module_to_name, fullname) print(heading, file=f) print("", file=f) self._print_formatted_docstring(inspect.getdoc(func), f) @@ -444,7 +444,7 @@ class Library(Document): print("- - -", file=f) print("", file=f) print("%s `class %s` {#%s}" % (prefix, name, - _get_anchor(self._module_to_name, name)), + get_anchor(self._module_to_name, name)), file=f) print("", file=f) self._write_class_markdown_to_file(f, name, member) diff --git a/tensorflow/python/framework/framework_lib.py b/tensorflow/python/framework/framework_lib.py index 69d66ea17c3..4f44041df73 100644 --- a/tensorflow/python/framework/framework_lib.py +++ b/tensorflow/python/framework/framework_lib.py @@ -74,10 +74,11 @@ from tensorflow.python.framework.ops import Graph from tensorflow.python.framework.ops import Operation from tensorflow.python.framework.ops import Tensor from tensorflow.python.framework.ops import Output -from tensorflow.python.framework.ops import SparseTensor -from tensorflow.python.framework.ops import SparseTensorValue from tensorflow.python.framework.ops import IndexedSlices +from tensorflow.python.framework.sparse_tensor import SparseTensor +from tensorflow.python.framework.sparse_tensor import SparseTensorValue + # Utilities used when building a Graph. from tensorflow.python.framework.ops import device from tensorflow.python.framework.ops import container @@ -94,6 +95,7 @@ from tensorflow.python.framework.ops import convert_to_tensor from tensorflow.python.framework.ops import convert_to_tensor_or_indexed_slices from tensorflow.python.framework.random_seed import get_seed from tensorflow.python.framework.random_seed import set_random_seed +from tensorflow.python.framework.subscribe import subscribe from tensorflow.python.framework.importer import import_graph_def # Needed when you defined a new Op in C++. 
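The framework_lib.py hunk above re-exports `SparseTensor` and `SparseTensorValue` from the new sparse_tensor module, so existing `tf.SparseTensor` code keeps working. A minimal sketch of the new import path (assuming the 0.11-era session API used elsewhere in this diff):

    # Sketch only: SparseTensor now lives in framework/sparse_tensor.py, while
    # framework_lib keeps re-exporting it at the top level.
    import tensorflow as tf
    from tensorflow.python.framework import sparse_tensor

    st = sparse_tensor.SparseTensor(
        indices=[[0, 0], [1, 2]], values=[1.0, 2.0], shape=[3, 4])

    with tf.Session() as sess:
      # Fetching a SparseTensor yields a SparseTensorValue namedtuple.
      value = sess.run(st)
      print(value.indices, value.values, value.shape)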
diff --git a/tensorflow/python/framework/gen_docs_combined.py b/tensorflow/python/framework/gen_docs_combined.py index 83d2751f214..ceaf81517ae 100644 --- a/tensorflow/python/framework/gen_docs_combined.py +++ b/tensorflow/python/framework/gen_docs_combined.py @@ -67,6 +67,7 @@ def module_names(): "tf.contrib.ffmpeg", "tf.contrib.framework", "tf.contrib.graph_editor", + "tf.contrib.integrate", "tf.contrib.layers", "tf.contrib.learn", "tf.contrib.learn.monitors", @@ -220,6 +221,7 @@ def all_libraries(module_to_name, members, documented): library("contrib.framework", "Framework (contrib)", tf.contrib.framework), library("contrib.graph_editor", "Graph Editor (contrib)", tf.contrib.graph_editor), + library("contrib.integrate", "Integrate (contrib)", tf.contrib.integrate), library("contrib.layers", "Layers (contrib)", tf.contrib.layers), library("contrib.learn", "Learn (contrib)", tf.contrib.learn), library("contrib.learn.monitors", "Monitors (contrib)", diff --git a/tensorflow/python/framework/ops.py b/tensorflow/python/framework/ops.py index be9de08ba36..56018f735a4 100644 --- a/tensorflow/python/framework/ops.py +++ b/tensorflow/python/framework/ops.py @@ -43,6 +43,7 @@ from tensorflow.python.framework import tensor_shape from tensorflow.python.framework import versions from tensorflow.python.platform import tf_logging as logging from tensorflow.python.util import compat +from tensorflow.python.util import decorator_utils def _override_helper(clazz_object, operator, func): @@ -186,7 +187,13 @@ def register_dense_tensor_like_type(tensor_type): _TENSOR_LIKE_TYPES = tuple(list(_TENSOR_LIKE_TYPES) + [tensor_type]) -class Tensor(object): +# NOTE(ebrevdo): Do not subclass this. If you do, I will break you on purpose. +class _TensorLike(object): + """Internal cls for grouping Tensor, SparseTensor, ..., for is_instance.""" + pass + + +class Tensor(_TensorLike): """Represents one of the outputs of an `Operation`. *Note:* the `Tensor` class will be replaced by `Output` in the future. @@ -752,7 +759,7 @@ def convert_to_tensor_or_indexed_slices(value, dtype=None, name=None, Raises: ValueError: If `dtype` does not match the element type of `value`. """ - if isinstance(value, (IndexedSlices, SparseTensor)): + if isinstance(value, _TensorLike): if dtype and not dtypes.as_dtype(dtype).is_compatible_with(value.dtype): raise ValueError( "Tensor conversion requested dtype %s for Tensor with dtype %s: %r" @@ -858,7 +865,7 @@ def register_tensor_conversion_function(base_type, conversion_func, funcs_at_priority.append((base_type, conversion_func)) -class IndexedSlices(object): +class IndexedSlices(_TensorLike): """A sparse representation of a set of tensor slices at given indices. This class is a simple wrapper for a pair of `Tensor` objects: @@ -958,190 +965,6 @@ IndexedSlicesValue = collections.namedtuple( "IndexedSlicesValue", ["values", "indices", "dense_shape"]) -class SparseTensor(object): - """Represents a sparse tensor. - - TensorFlow represents a sparse tensor as three separate dense tensors: - `indices`, `values`, and `shape`. In Python, the three tensors are - collected into a `SparseTensor` class for ease of use. If you have separate - `indices`, `values`, and `shape` tensors, wrap them in a `SparseTensor` - object before passing to the ops below. 
- - Concretely, the sparse tensor `SparseTensor(indices, values, shape)` - comprises the following components, where `N` and `ndims` are the number - of values and number of dimensions in the `SparseTensor`, respectively: - - * `indices`: A 2-D int64 tensor of shape `[N, ndims]`, which specifies - the indices of the elements in the sparse tensor that contain nonzero - values (elements are zero-indexed). For example, `indices=[[1,3], [2,4]]` - specifies that the elements with indexes of [1,3] and [2,4] have - nonzero values. - - * `values`: A 1-D tensor of any type and shape `[N]`, which supplies the - values for each element in `indices`. For example, given - `indices=[[1,3], [2,4]]`, the parameter `values=[18, 3.6]` specifies - that element [1,3] of the sparse tensor has a value of 18, and element - [2,4] of the tensor has a value of 3.6. - - * `shape`: A 1-D int64 tensor of shape `[ndims]`, which specifies the shape - of the sparse tensor. Takes a list indicating the number of elements in - each dimension. For example, `shape=[3,6]` specifies a two-dimensional 3x6 - tensor, `shape=[2,3,4]` specifies a three-dimensional 2x3x4 tensor, and - `shape=[9]` specifies a one-dimensional tensor with 9 elements. - - The corresponding dense tensor satisfies: - - ```python - dense.shape = shape - dense[tuple(indices[i])] = values[i] - ``` - - By convention, `indices` should be sorted in row-major order (or equivalently - lexicographic order on the tuples `indices[i]`). This is not enforced when - `SparseTensor` objects are constructed, but most ops assume correct ordering. - If the ordering of sparse tensor `st` is wrong, a fixed version can be - obtained by calling `tf.sparse_reorder(st)`. - - Example: The sparse tensor - - ```python - SparseTensor(indices=[[0, 0], [1, 2]], values=[1, 2], shape=[3, 4]) - ``` - - represents the dense tensor - - ```python - [[1, 0, 0, 0] - [0, 0, 2, 0] - [0, 0, 0, 0]] - ``` - - @@__init__ - @@indices - @@values - @@shape - @@dtype - @@op - @@graph - """ - - @classmethod - def from_value(cls, sparse_tensor_value): - return SparseTensor( - indices=sparse_tensor_value.indices, - values=sparse_tensor_value.values, - shape=sparse_tensor_value.shape) - - def __init__(self, indices, values, shape): - """Creates a `SparseTensor`. - - Args: - indices: A 2-D int64 tensor of shape `[N, ndims]`. - values: A 1-D tensor of any type and shape `[N]`. - shape: A 1-D int64 tensor of shape `[ndims]`. - - Returns: - A `SparseTensor` - """ - with name_scope(None, "SparseTensor", [indices, values, shape]): - indices = convert_to_tensor(indices, name="indices", dtype=dtypes.int64) - # Always pass as_ref=True because we want to be able to update - # values later if it is a VariableOp. - # TODO(touts): Consider adding mutable_values() when 'values' - # is a VariableOp and updating users of SparseTensor. - values = convert_to_tensor(values, name="values", as_ref=True) - shape = convert_to_tensor(shape, name="shape", dtype=dtypes.int64) - self._indices = indices - self._values = values - self._shape = shape - - indices_shape = indices.get_shape().with_rank(2) - values_shape = values.get_shape().with_rank(1) - shape_shape = shape.get_shape().with_rank(1) - - # Assert number of rows in indices match the number of elements in values. - indices_shape[0].merge_with(values_shape[0]) - # Assert number of columns in indices matches the number of elements in - # shape. 
- indices_shape[1].merge_with(shape_shape[0]) - - @property - def indices(self): - """The indices of non-zero values in the represented dense tensor. - - Returns: - A 2-D Tensor of int64 with shape `[N, ndims]`, where `N` is the - number of non-zero values in the tensor, and `ndims` is the rank. - """ - return self._indices - - @property - def values(self): - """The non-zero values in the represented dense tensor. - - Returns: - A 1-D Tensor of any data type. - """ - return self._values - - @property - def op(self): - """The `Operation` that produces `values` as an output.""" - return self.values.op - - @property - def dtype(self): - """The `DType` of elements in this tensor.""" - return self._values.dtype - - @property - def shape(self): - """A 1-D Tensor of int64 representing the shape of the dense tensor.""" - return self._shape - - @property - def graph(self): - """The `Graph` that contains the index, value, and shape tensors.""" - return self._indices.graph - - def __str__(self): - return "SparseTensor(indices=%s, values=%s, shape=%s)" % ( - self._indices, self._values, self._shape) - - def eval(self, feed_dict=None, session=None): - """Evaluates this sparse tensor in a `Session`. - - Calling this method will execute all preceding operations that - produce the inputs needed for the operation that produces this - tensor. - - *N.B.* Before invoking `SparseTensor.eval()`, its graph must have been - launched in a session, and either a default session must be - available, or `session` must be specified explicitly. - - Args: - feed_dict: A dictionary that maps `Tensor` objects to feed values. - See [`Session.run()`](../../api_docs/python/client.md#Session.run) for a - description of the valid feed values. - session: (Optional.) The `Session` to be used to evaluate this sparse - tensor. If none, the default session will be used. - - Returns: - A `SparseTensorValue` object. - """ - indices, values, shape = _eval_using_default_session( - [self.indices, self.values, self.shape], feed_dict, self.graph, session) - return SparseTensorValue(indices, values, shape) - - @staticmethod - def _override_operator(operator, func): - _override_helper(SparseTensor, operator, func) - - -SparseTensorValue = collections.namedtuple("SparseTensorValue", - ["indices", "values", "shape"]) - - def _device_string(dev_spec): if isinstance(dev_spec, pydev.DeviceSpec): return dev_spec.to_string() @@ -1875,23 +1698,21 @@ class RegisterStatistics(object): Well-known types of statistics include these so far: - - weight_parameters: For operations like MatMul, Conv, and BiasAdd that take - learned weights as inputs, this statistic captures how many numerical values - are used. This is good to know because the weights take up most of the size - of a typical serialized graph on disk. - - flops: When running a graph, the bulk of the computation happens doing numerical calculations like matrix multiplications. This type allows a node to return how many floating-point operations it takes to complete. The total number of FLOPs for a graph is a good guide to its expected latency. You can add your own statistics just by picking a new type string, registering - functions for the ops you care about, and then calling something like - python/tools/graph_metrics.py with the new type as an argument. + functions for the ops you care about, and then calling get_stats_for_node_def. If a statistic for an op is registered multiple times, a KeyError will be raised. + Since the statistics is counted on a per-op basis. 
@@ -3972,7 +3793,7 @@ def _get_graph_from_inputs(op_input_list, graph=None): for op_input in op_input_list: # Determine if this is a valid graph_element. graph_element = None - if isinstance(op_input, (Operation, Tensor, SparseTensor, IndexedSlices)): + if isinstance(op_input, (Operation, _TensorLike)): graph_element = op_input else: graph_element = _as_graph_element(op_input) @@ -4003,10 +3824,18 @@ class GraphKeys(object): The following standard keys are defined: - * `VARIABLES`: the `Variable` objects that comprise a model, and - must be saved and restored together. See - [`tf.all_variables()`](../../api_docs/python/state_ops.md#all_variables) + * `GLOBAL_VARIABLES`: the default collection of `Variable` objects, shared + across a distributed environment (model variables are a subset of these). See + [`tf.global_variables()`](../../api_docs/python/state_ops.md#global_variables) for more details. + Commonly, all `TRAINABLE_VARIABLES` variables will be in `MODEL_VARIABLES`, + and all `MODEL_VARIABLES` variables will be in `GLOBAL_VARIABLES`. + * `LOCAL_VARIABLES`: the subset of `Variable` objects that are local to each + machine. Usually used for temporary variables, like counters. + Note: use `tf.contrib.framework.local_variable` to add to this collection. + * `MODEL_VARIABLES`: the subset of `Variable` objects that are used in the + model for inference (feed forward). Note: use + `tf.contrib.framework.model_variable` to add to this collection. * `TRAINABLE_VARIABLES`: the subset of `Variable` objects that will be trained by an optimizer. See [`tf.trainable_variables()`](../../api_docs/python/state_ops.md#trainable_variables) @@ -4030,16 +3859,17 @@ class GraphKeys(object): * `ACTIVATIONS`: activations of neural network layers """ - # Key to collect Variable objects that must be saved and restored - # by the model. - VARIABLES = "variables" - # Key to collect Variable objects that will be trained by the - # optimizers. - TRAINABLE_VARIABLES = "trainable_variables" - # Key to collect local variables that are not saved/restored. + # Key to collect Variable objects that are global (shared across machines). + # Default collection for all variables, except local ones. + GLOBAL_VARIABLES = "variables" + # Key to collect Variable objects that are local to each machine and are not + # saved/restored. LOCAL_VARIABLES = "local_variables" # Key to collect model variables defined by layers. MODEL_VARIABLES = "model_variables" + # Key to collect Variable objects that will be trained by the + # optimizers. + TRAINABLE_VARIABLES = "trainable_variables" # Key to collect summaries. SUMMARIES = "summaries" # Key to collect QueueRunners. @@ -4089,6 +3919,13 @@ class GraphKeys(object): COND_CONTEXT = "cond_context" WHILE_CONTEXT = "while_context" + @decorator_utils.classproperty + def VARIABLES(cls): # pylint: disable=no-self-argument + logging.warning("VARIABLES collection name is deprecated, " + "please use GLOBAL_VARIABLES instead.\n" + "VARIABLES will be removed after 2017-03-02.") + return cls.GLOBAL_VARIABLES + def add_to_collection(name, value): """Wrapper for `Graph.add_to_collection()` using the default graph.
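Since the collection-key reshuffle above is easy to misread, here is a small behavioral sketch, assuming this patch is applied (note in particular that the underlying key string for global variables is unchanged, which is what keeps existing checkpoints and collection lookups working):

```python
import tensorflow as tf

# New variables land in the GLOBAL_VARIABLES collection by default.
v = tf.Variable(1.0, name="v")
assert tf.GraphKeys.GLOBAL_VARIABLES == "variables"
assert v in tf.get_collection(tf.GraphKeys.GLOBAL_VARIABLES)

# Reading the old name goes through the classproperty shim added above: it
# logs the deprecation warning and resolves to GLOBAL_VARIABLES.
assert tf.GraphKeys.VARIABLES == tf.GraphKeys.GLOBAL_VARIABLES
```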
diff --git a/tensorflow/python/framework/ops_test.py b/tensorflow/python/framework/ops_test.py index 78416c6fb39..f9687405b4d 100644 --- a/tensorflow/python/framework/ops_test.py +++ b/tensorflow/python/framework/ops_test.py @@ -25,6 +25,7 @@ from tensorflow.python.framework import device as pydev from tensorflow.python.framework import dtypes from tensorflow.python.framework import errors from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.framework import tensor_shape from tensorflow.python.framework import test_ops from tensorflow.python.framework import test_util @@ -86,32 +87,6 @@ class TensorTest(test_util.TensorFlowTestCase): pass -class SparseTensorTest(test_util.TensorFlowTestCase): - - def testPythonConstruction(self): - indices = [[1, 2], [2, 0], [3, 4]] - values = [b"a", b"b", b"c"] - shape = [4, 5] - sp_value = ops.SparseTensorValue(indices, values, shape) - for sp in [ - ops.SparseTensor(indices, values, shape), - ops.SparseTensor.from_value(sp_value), - ops.SparseTensor.from_value(ops.SparseTensor(indices, values, shape))]: - self.assertEqual(sp.indices.dtype, dtypes.int64) - self.assertEqual(sp.values.dtype, dtypes.string) - self.assertEqual(sp.shape.dtype, dtypes.int64) - - with self.test_session() as sess: - value = sp.eval() - self.assertAllEqual(indices, value.indices) - self.assertAllEqual(values, value.values) - self.assertAllEqual(shape, value.shape) - sess_run_value = sess.run(sp) - self.assertAllEqual(sess_run_value.indices, value.indices) - self.assertAllEqual(sess_run_value.values, value.values) - self.assertAllEqual(sess_run_value.shape, value.shape) - - class IndexedSlicesTest(test_util.TensorFlowTestCase): def testToTensor(self): @@ -1246,7 +1221,7 @@ class OpScopeTest(test_util.TensorFlowTestCase): g0 = ops.Graph() a = g0.create_op("a", [], [dtypes.float32]) b = g0.create_op("b", [], [dtypes.float32]) - sparse = ops.SparseTensor( + sparse = sparse_tensor.SparseTensor( _apply_op(g0, "const", [], [dtypes.int64]), _apply_op(g0, "const", [], [dtypes.float32]), _apply_op(g0, "const", [], [dtypes.int64])) @@ -1421,12 +1396,6 @@ class AsGraphDefTest(test_util.TensorFlowTestCase): """, gd) -# NOTE(petewarden): Dummy stats registrations for ops used in the tests. 
-@ops.RegisterStatistics("a", "weight_parameters") -def _calc_a_weight_params(unused_graph, unused_node): - return ops.OpStats("weight_parameters", 10) - - @ops.RegisterStatistics("a", "flops") def _calc_a_forward_flops(unused_graph, unused_node): return ops.OpStats("flops", 20) @@ -1437,8 +1406,6 @@ class StatisticsTest(test_util.TensorFlowTestCase): def testRegisteredNode(self): graph = ops.Graph() node = ops._NodeDef("a", "an_a") - weight_params = ops.get_stats_for_node_def(graph, node, "weight_parameters") - self.assertEqual(10, weight_params.value) flops = ops.get_stats_for_node_def(graph, node, "flops") self.assertEqual(20, flops.value) missing_stat = ops.get_stats_for_node_def(graph, node, "missing_stat") @@ -1451,19 +1418,11 @@ class StatisticsTest(test_util.TensorFlowTestCase): self.assertEqual(None, weight_params.value) def testAccumulateStatistics(self): - weight_params_total = ops.OpStats("weight_parameters") - self.assertEqual(None, weight_params_total.value) flops_total = ops.OpStats("flops") self.assertEqual(None, flops_total.value) - first_weight_params = ops.OpStats("weight_parameters", 100) - weight_params_total += first_weight_params - self.assertEqual(100, weight_params_total.value) second_flops = ops.OpStats("flops", 3) flops_total += second_flops self.assertEqual(3, flops_total.value) - second_weight_params = ops.OpStats("weight_parameters", 200) - weight_params_total += second_weight_params - self.assertEqual(300, weight_params_total.value) class ColocationGroupTest(test_util.TensorFlowTestCase): diff --git a/tensorflow/python/framework/sparse_tensor.py b/tensorflow/python/framework/sparse_tensor.py new file mode 100644 index 00000000000..4ce92c4225a --- /dev/null +++ b/tensorflow/python/framework/sparse_tensor.py @@ -0,0 +1,232 @@ +# Copyright 2015 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== + +"""Classes and functions used to construct graphs.""" +# pylint: disable=g-bad-name +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import collections + +from tensorflow.python.framework import dtypes +from tensorflow.python.framework import ops +from tensorflow.python.framework import tensor_util + + +# pylint: disable=protected-access +_TensorLike = ops._TensorLike +_eval_using_default_session = ops._eval_using_default_session +_override_helper = ops._override_helper +# pylint: enable=protected-access + + +class SparseTensor(_TensorLike): + """Represents a sparse tensor. + + TensorFlow represents a sparse tensor as three separate dense tensors: + `indices`, `values`, and `shape`. In Python, the three tensors are + collected into a `SparseTensor` class for ease of use. If you have separate + `indices`, `values`, and `shape` tensors, wrap them in a `SparseTensor` + object before passing to the ops below. 
+ + Concretely, the sparse tensor `SparseTensor(indices, values, shape)` + comprises the following components, where `N` and `ndims` are the number + of values and number of dimensions in the `SparseTensor`, respectively: + + * `indices`: A 2-D int64 tensor of shape `[N, ndims]`, which specifies + the indices of the elements in the sparse tensor that contain nonzero + values (elements are zero-indexed). For example, `indices=[[1,3], [2,4]]` + specifies that the elements with indexes of [1,3] and [2,4] have + nonzero values. + + * `values`: A 1-D tensor of any type and shape `[N]`, which supplies the + values for each element in `indices`. For example, given + `indices=[[1,3], [2,4]]`, the parameter `values=[18, 3.6]` specifies + that element [1,3] of the sparse tensor has a value of 18, and element + [2,4] of the tensor has a value of 3.6. + + * `shape`: A 1-D int64 tensor of shape `[ndims]`, which specifies the shape + of the sparse tensor. Takes a list indicating the number of elements in + each dimension. For example, `shape=[3,6]` specifies a two-dimensional 3x6 + tensor, `shape=[2,3,4]` specifies a three-dimensional 2x3x4 tensor, and + `shape=[9]` specifies a one-dimensional tensor with 9 elements. + + The corresponding dense tensor satisfies: + + ```python + dense.shape = shape + dense[tuple(indices[i])] = values[i] + ``` + + By convention, `indices` should be sorted in row-major order (or equivalently + lexicographic order on the tuples `indices[i]`). This is not enforced when + `SparseTensor` objects are constructed, but most ops assume correct ordering. + If the ordering of sparse tensor `st` is wrong, a fixed version can be + obtained by calling `tf.sparse_reorder(st)`. + + Example: The sparse tensor + + ```python + SparseTensor(indices=[[0, 0], [1, 2]], values=[1, 2], shape=[3, 4]) + ``` + + represents the dense tensor + + ```python + [[1, 0, 0, 0] + [0, 0, 2, 0] + [0, 0, 0, 0]] + ``` + + @@__init__ + @@get_shape + @@indices + @@values + @@shape + @@dtype + @@op + @@graph + """ + + @classmethod + def from_value(cls, sparse_tensor_value): + if not (isinstance(sparse_tensor_value, SparseTensor) or + isinstance(sparse_tensor_value, SparseTensorValue)): + raise TypeError( + "Neither a SparseTensor nor SparseTensorValue: %s." + % sparse_tensor_value) + return SparseTensor( + indices=sparse_tensor_value.indices, + values=sparse_tensor_value.values, + shape=sparse_tensor_value.shape) + + def __init__(self, indices, values, shape): + """Creates a `SparseTensor`. + + Args: + indices: A 2-D int64 tensor of shape `[N, ndims]`. + values: A 1-D tensor of any type and shape `[N]`. + shape: A 1-D int64 tensor of shape `[ndims]`. + + Returns: + A `SparseTensor` + """ + with ops.name_scope(None, "SparseTensor", [indices, values, shape]): + indices = ops.convert_to_tensor( + indices, name="indices", dtype=dtypes.int64) + # Always pass as_ref=True because we want to be able to update + # values later if it is a VariableOp. + # TODO(touts): Consider adding mutable_values() when 'values' + # is a VariableOp and updating users of SparseTensor. + values = ops.convert_to_tensor(values, name="values", as_ref=True) + shape = ops.convert_to_tensor(shape, name="shape", dtype=dtypes.int64) + self._indices = indices + self._values = values + self._shape = shape + + indices_shape = indices.get_shape().with_rank(2) + values_shape = values.get_shape().with_rank(1) + shape_shape = shape.get_shape().with_rank(1) + + # Assert number of rows in indices match the number of elements in values. 
+ indices_shape[0].merge_with(values_shape[0]) + # Assert number of columns in indices matches the number of elements in + # shape. + indices_shape[1].merge_with(shape_shape[0]) + + def get_shape(self): + """Get the `TensorShape` that represents the shape of the dense tensor. + + Returns: + A `TensorShape` object. + """ + return tensor_util.constant_value_as_shape(self._shape) + + @property + def indices(self): + """The indices of non-zero values in the represented dense tensor. + + Returns: + A 2-D Tensor of int64 with shape `[N, ndims]`, where `N` is the + number of non-zero values in the tensor, and `ndims` is the rank. + """ + return self._indices + + @property + def values(self): + """The non-zero values in the represented dense tensor. + + Returns: + A 1-D Tensor of any data type. + """ + return self._values + + @property + def op(self): + """The `Operation` that produces `values` as an output.""" + return self.values.op + + @property + def dtype(self): + """The `DType` of elements in this tensor.""" + return self._values.dtype + + @property + def shape(self): + """A 1-D Tensor of int64 representing the shape of the dense tensor.""" + return self._shape + + @property + def graph(self): + """The `Graph` that contains the index, value, and shape tensors.""" + return self._indices.graph + + def __str__(self): + return "SparseTensor(indices=%s, values=%s, shape=%s)" % ( + self._indices, self._values, self._shape) + + def eval(self, feed_dict=None, session=None): + """Evaluates this sparse tensor in a `Session`. + + Calling this method will execute all preceding operations that + produce the inputs needed for the operation that produces this + tensor. + + *N.B.* Before invoking `SparseTensor.eval()`, its graph must have been + launched in a session, and either a default session must be + available, or `session` must be specified explicitly. + + Args: + feed_dict: A dictionary that maps `Tensor` objects to feed values. + See [`Session.run()`](../../api_docs/python/client.md#Session.run) for a + description of the valid feed values. + session: (Optional.) The `Session` to be used to evaluate this sparse + tensor. If none, the default session will be used. + + Returns: + A `SparseTensorValue` object. + """ + indices, values, shape = _eval_using_default_session( + [self.indices, self.values, self.shape], feed_dict, self.graph, session) + return SparseTensorValue(indices, values, shape) + + @staticmethod + def _override_operator(operator, func): + _override_helper(SparseTensor, operator, func) + + +SparseTensorValue = collections.namedtuple("SparseTensorValue", + ["indices", "values", "shape"]) diff --git a/tensorflow/python/framework/sparse_tensor_test.py b/tensorflow/python/framework/sparse_tensor_test.py new file mode 100644 index 00000000000..b5f8142afc6 --- /dev/null +++ b/tensorflow/python/framework/sparse_tensor_test.py @@ -0,0 +1,56 @@ +# Copyright 2015 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+# ============================================================================== + +"""Tests for tensorflow.python.framework.sparse_tensor.""" +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +from tensorflow.python.framework import dtypes +from tensorflow.python.framework import sparse_tensor +from tensorflow.python.framework import test_util +from tensorflow.python.platform import googletest + + +class SparseTensorTest(test_util.TensorFlowTestCase): + + def testPythonConstruction(self): + indices = [[1, 2], [2, 0], [3, 4]] + values = [b"a", b"b", b"c"] + shape = [4, 5] + sp_value = sparse_tensor.SparseTensorValue(indices, values, shape) + for sp in [ + sparse_tensor.SparseTensor(indices, values, shape), + sparse_tensor.SparseTensor.from_value(sp_value), + sparse_tensor.SparseTensor.from_value( + sparse_tensor.SparseTensor(indices, values, shape))]: + self.assertEqual(sp.indices.dtype, dtypes.int64) + self.assertEqual(sp.values.dtype, dtypes.string) + self.assertEqual(sp.shape.dtype, dtypes.int64) + self.assertEqual(sp.get_shape(), (4, 5)) + + with self.test_session() as sess: + value = sp.eval() + self.assertAllEqual(indices, value.indices) + self.assertAllEqual(values, value.values) + self.assertAllEqual(shape, value.shape) + sess_run_value = sess.run(sp) + self.assertAllEqual(sess_run_value.indices, value.indices) + self.assertAllEqual(sess_run_value.values, value.values) + self.assertAllEqual(sess_run_value.shape, value.shape) + + +if __name__ == "__main__": + googletest.main()
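The `get_shape()` assertion in the test above works because the new method statically folds the constant `shape` tensor into a `TensorShape`, so no session is required; a small sketch, using the module path from this patch:

```python
from tensorflow.python.framework import sparse_tensor

sp = sparse_tensor.SparseTensor(
    indices=[[1, 2], [2, 0], [3, 4]], values=[b"a", b"b", b"c"], shape=[4, 5])
# The constant `shape` tensor is folded into a static TensorShape.
print(sp.get_shape())  # (4, 5)
```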
+ """ + tensors_type = type(tensors) + if tensors_type is ops.Tensor: + return apply_fn(tensors) + elif isinstance(tensors, (list, tuple)): + tensors = [_recursive_apply(t, apply_fn) for t in tensors] + if tensors_type is list: + return list(tensors) + elif tensors_type is tuple: + return tuple(tensors) + return tensors_type(*tensors) # collections.namedtuple + elif tensors_type is dict: + return dict([(k, _recursive_apply(v, apply_fn)) + for k, v in tensors.iteritems()]) + else: + raise TypeError('_recursive_apply argument %r has invalid type %r' % + (tensors, tensors_type)) + + +def _control_outputs(op): + """Returns the control_input consumers for the supplied `Operation`. + + Args: + op: The `Operation` to find consumers of. + Yields: + A list of ops that have op as a control dependency. + """ + for o in op.graph.get_operations(): + if op in o.control_inputs: + yield o + + +def _subscribe(tensor, side_effects): + """Helper method that subscribes a single tensor to a list of side_effects. + + Args: + tensor: `tf.Tensor` + side_effects: List of side_effect functions see subscribe for details. + Returns: + The modified replacement to the passed in tensor which triggers the side + effects. + """ + update_input = [] + for consumer_op in list(tensor.consumers()): # explicit copy + update_input.append((consumer_op, list(consumer_op.inputs).index(tensor))) + + update_control_input = list(_control_outputs(tensor.op)) + + # Trailing slash on name scope to replace the scope. + name_scope = tensor.op.name + '/subscription/' + with ops.name_scope(name_scope): + outs = [] + for s in side_effects: + outs += s(tensor) + + with ops.control_dependencies(outs): + out = array_ops.identity(tensor) + + for consumer_op, index in update_input: + consumer_op._update_input(index, out) # pylint: disable=protected-access + + for consumer_op in update_control_input: + consumer_op._control_inputs.remove(tensor.op) # pylint: disable=protected-access + consumer_op._control_inputs.append(out.op) # pylint: disable=protected-access + consumer_op._recompute_node_def() # pylint: disable=protected-access + + return out + + +def subscribe(tensors, side_effects): + """Subscribe to a tensor. + + This method will attach side effect graphs to a given set + of tensors. Set of tensors follows from session.run and supports + single `Tensor`, `list`, nested `list`, `tuple`, `namedtuple`, or `dict`. It + returns the tensors in the same passed in structure, but as clones with + side effects applied. The supplied side effect graphs are specified + as a constructor function which takes the target tensor and + constructs a side effect graph and returns a list of ops that should + be control dependencies on fetching the tensor. It will append + 'subscription' to the name scope of the tensor for every node in + the side effect graph. These control dependencies are what trigger + the side effects. Subscribe will construct the additions to your + graph and return the created identity tensor downstream of the control + dependencies. Use these tensors as you would normally in the rest of + your tensorflow code. + + Args: + tensors: `Tensor` or set of tensors to subscribe to. Set of tensors format + follows from `Session.run` and supports single `Tensor`, `list`, nested + `list`, `tuple`, `namedtuple`, or `dict`. + side_effects: Function(s) that takes a `Tensor`, construct a subgraph, and + return a nonempty list of control dependencies. This can be a single + function or list of functions. 
diff --git a/tensorflow/python/framework/subscribe_test.py b/tensorflow/python/framework/subscribe_test.py new file mode 100644 index 00000000000..8371c2cfc43 --- /dev/null +++ b/tensorflow/python/framework/subscribe_test.py @@ -0,0 +1,59 @@ +# Copyright 2015 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== + +"""Tests for tf.subscribe.""" + +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import tensorflow as tf + +from tensorflow.python.framework import subscribe +from tensorflow.python.framework import test_util +from tensorflow.python.platform import googletest + + +class SubscribeTest(test_util.TensorFlowTestCase): + + def testSideEffect(self): + a = tf.constant(1) + b = tf.constant(1) + c = tf.add(a, b) + with tf.control_dependencies([c]): + d = tf.constant(42) + n = tf.neg(c) + + shared = [] + + def sub(t): + shared.append(t) + return t + + c = subscribe.subscribe(c, lambda t: tf.py_func(sub, [t], [t.dtype])) + + with self.test_session() as sess: + c_out = sess.run([c]) + n_out = sess.run([n]) + d_out = sess.run([d]) + + self.assertEquals(n_out, [-2]) + self.assertEquals(c_out, [2]) + self.assertEquals(d_out, [42]) + self.assertEquals(shared, [2, 2, 2]) + + +if __name__ == '__main__': + googletest.main() diff --git a/tensorflow/python/kernel_tests/BUILD b/tensorflow/python/kernel_tests/BUILD index fe74b3426c5..0100e6b3268 100644 --- a/tensorflow/python/kernel_tests/BUILD +++ b/tensorflow/python/kernel_tests/BUILD @@ -220,7 +220,7 @@ cuda_py_test( additional_deps = ["//tensorflow:tensorflow_py"], ) -tf_py_test( +cuda_py_test( name = "parameterized_truncated_normal_op_test", size = "small", srcs = ["parameterized_truncated_normal_op_test.py"], @@ -272,6 +272,13 @@ tf_py_test( additional_deps = ["//tensorflow:tensorflow_py"], ) +tf_py_test( + name = "scatter_nd_ops_test", + size = "medium", + srcs = ["scatter_nd_ops_test.py"], + additional_deps = ["//tensorflow:tensorflow_py"], +) + tf_py_test( name = "segment_reduction_ops_test", size = "small", diff --git a/tensorflow/python/kernel_tests/cwise_ops_test.py b/tensorflow/python/kernel_tests/cwise_ops_test.py index 60eb7c26d91..f71dcbeae1e 100644 --- a/tensorflow/python/kernel_tests/cwise_ops_test.py +++ b/tensorflow/python/kernel_tests/cwise_ops_test.py @@ -194,6 +194,7 @@ class UnaryOpTest(tf.test.TestCase): self._compareBoth(z, self._rsqrt,
tf.rsqrt) self._compareBoth(x, np.exp, tf.exp) self._compareBoth(z, np.log, tf.log) + self._compareBoth(z, np.log1p, tf.log1p) self._compareBoth(x, np.tanh, tf.tanh) self._compareBoth(x, self._sigmoid, tf.sigmoid) self._compareBoth(y, np.sign, tf.sign) @@ -236,6 +237,7 @@ class UnaryOpTest(tf.test.TestCase): self._compareBoth(x, self._rsqrt, tf.rsqrt) self._compareBoth(x, np.exp, tf.exp) self._compareBoth(x, np.log, tf.log) + self._compareBoth(x, np.log1p, tf.log1p) self._compareBoth(x, np.tanh, tf.tanh) self._compareBoth(x, self._sigmoid, tf.sigmoid) self._compareBoth(x, np.sign, tf.sign) @@ -273,6 +275,7 @@ class UnaryOpTest(tf.test.TestCase): self._compareBoth(z, self._rsqrt, tf.rsqrt) self._compareBoth(x, np.exp, tf.exp) self._compareBoth(z, np.log, tf.log) + self._compareBoth(z, np.log1p, tf.log1p) self._compareBoth(x, np.tanh, tf.tanh) self._compareBoth(x, self._sigmoid, tf.sigmoid) self._compareBoth(y, np.sign, tf.sign) @@ -311,6 +314,7 @@ class UnaryOpTest(tf.test.TestCase): self._compareBoth(z, self._rsqrt, tf.rsqrt) self._compareBoth(x, np.exp, tf.exp) self._compareBoth(z, np.log, tf.log) + self._compareBoth(z, np.log1p, tf.log1p) self._compareBoth(x, np.tanh, tf.tanh) self._compareBoth(x, self._sigmoid, tf.sigmoid) self._compareBoth(y, np.sign, tf.sign) @@ -374,6 +378,7 @@ class UnaryOpTest(tf.test.TestCase): self._compareCpu(y, self._rsqrt, tf.rsqrt) self._compareCpu(x, np.exp, tf.exp) self._compareCpu(y, np.log, tf.log) + self._compareCpu(y, np.log1p, tf.log1p) self._compareCpu(x, np.tanh, tf.tanh) self._compareCpu(x, self._sigmoid, tf.sigmoid) self._compareCpu(x, np.sin, tf.sin) @@ -405,6 +410,7 @@ class UnaryOpTest(tf.test.TestCase): self._compareCpu(y, self._rsqrt, tf.rsqrt) self._compareCpu(x, np.exp, tf.exp) self._compareCpu(y, np.log, tf.log) + self._compareCpu(y, np.log1p, tf.log1p) self._compareCpu(x, np.tanh, tf.tanh) self._compareCpu(x, self._sigmoid, tf.sigmoid) self._compareCpu(x, np.sin, tf.sin) diff --git a/tensorflow/python/kernel_tests/gather_nd_op_test.py b/tensorflow/python/kernel_tests/gather_nd_op_test.py index f3fd47381a9..13b3bec3c0f 100644 --- a/tensorflow/python/kernel_tests/gather_nd_op_test.py +++ b/tensorflow/python/kernel_tests/gather_nd_op_test.py @@ -53,20 +53,20 @@ class GatherNdTest(tf.test.TestCase): gather_nd_ok_t = tf.gather_nd(params, indices_empty) gather_nd_ok_val = gather_nd_ok_t.eval() self.assertEqual([0], gather_nd_ok_t.get_shape()) - self.assertAllEqual(np.empty((0,), dtype=np.float32), gather_nd_ok_val) + self.assertAllClose(np.empty((0,), dtype=np.float32), gather_nd_ok_val) indices_empty = np.empty((0, 1), dtype=np.int32) gather_nd_ok_t = tf.gather_nd(params, indices_empty) gather_nd_ok_val = gather_nd_ok_t.eval() self.assertEqual([0, 3], gather_nd_ok_t.get_shape()) - self.assertAllEqual(np.empty((0, 3), dtype=np.float32), gather_nd_ok_val) + self.assertAllClose(np.empty((0, 3), dtype=np.float32), gather_nd_ok_val) params_empty = np.empty((0, 3), dtype=np.float32) indices_empty = np.empty((0, 2), dtype=np.int32) gather_nd_ok_t = tf.gather_nd(params_empty, indices_empty) gather_nd_ok_val = gather_nd_ok_t.eval() self.assertEqual([0], gather_nd_ok_t.get_shape()) - self.assertAllEqual(np.empty((0,), dtype=np.float32), gather_nd_ok_val) + self.assertAllClose(np.empty((0,), dtype=np.float32), gather_nd_ok_val) params_empty = np.empty((0, 3), dtype=np.float32) indices_nonempty = np.zeros((1, 2), dtype=np.int32) @@ -74,7 +74,7 @@ class GatherNdTest(tf.test.TestCase): with self.assertRaisesOpError( r"Requested more than 0 entries, but 
params is empty."): gather_nd_break_t.eval() - self.assertAllEqual(np.empty((0,), dtype=np.float32), gather_nd_ok_val) + self.assertAllClose(np.empty((0,), dtype=np.float32), gather_nd_ok_val) def testIndexScalar(self): with self.test_session(use_gpu=self.use_gpu): @@ -184,11 +184,11 @@ class GatherNdTest(tf.test.TestCase): indices = tf.placeholder(tf.int32) gather_nd_t = tf.gather_nd(params, indices) shape = gather_nd_t.get_shape() - self.assertEqual(shape.ndims, None) - self.assertEqual(shape[0].value, None) + self.assertEqual(None, shape.ndims) + self.assertEqual(None, shape[0].value) def testBadIndices(self): - with self.test_session(use_gpu=False): + with self.test_session(): params = [0, 1, 2] indices = [[[0], [7]]] # Make this one higher rank gather_nd = tf.gather_nd(params, indices) @@ -198,7 +198,7 @@ class GatherNdTest(tf.test.TestCase): gather_nd.eval() def testBadIndicesWithSlices(self): - with self.test_session(use_gpu=False): + with self.test_session(): params = [[0, 1, 2]] indices = [[[0], [0], [1]]] # Make this one higher rank gather_nd = tf.gather_nd(params, indices) @@ -207,6 +207,62 @@ class GatherNdTest(tf.test.TestCase): r"\(shape: \[1,3\]\)"): gather_nd.eval() + def testGradientsRank2Elements(self): + indices = tf.constant([[0, 0], [1, 1]], dtype=tf.int32) + inputs = tf.constant([[1, 2], [3, 4]], dtype=tf.float64) + outputs = tf.gather_nd(inputs, indices) + + grad_vals = tf.constant([1, 2], dtype=tf.float64) + grads = tf.gradients([outputs], [inputs], [grad_vals])[0] + expected_grads = np.array([[1, 0], [0, 2]], dtype=np.float64) + with self.test_session(): + assert np.array_equal(expected_grads, grads.eval()) + + def testGradientsRank2Slices(self): + indices = tf.constant([[1], [0]], dtype=tf.int32) + inputs = tf.constant([[1, 2], [3, 4]], dtype=tf.float64) + outputs = tf.gather_nd(inputs, indices) + + grad_vals = tf.constant([[1, 2], [3, 4]], dtype=tf.float64) + grads = tf.gradients([outputs], [inputs], [grad_vals])[0] + expected_grads = np.array([[3, 4], [1, 2]], dtype=np.float64) + with self.test_session(): + self.assertAllEqual(expected_grads, grads.eval()) + + def testGradientsRank3Elements(self): + indices = tf.constant([[[0, 1], [1, 0]], [[0, 0], [1, 1]]], dtype=tf.int32) + inputs = tf.constant([[[1, 3], [5, 7]], [[2, 4], [6, 8]]], dtype=tf.float64) + outputs = tf.gather_nd(inputs, indices) + + grad_vals = tf.constant( + [[[1, 2], [3, 4]], [[5, 6], [7, 8]]], dtype=tf.float64) + grads = tf.gradients([outputs], [inputs], [grad_vals])[0] + expected_grads = np.array( + [[[5, 6], [1, 2]], [[3, 4], [7, 8]]], dtype=np.float64) + with self.test_session(): + self.assertAllEqual(expected_grads, grads.eval()) + + def testGradientsRank2SlicesWithEmptySpace(self): + indices = tf.constant([[2], [0], [5]], dtype=tf.int32) + inputs = tf.constant( + [[1, 2, 3, 4, 5, 6, 7, 8, 9], [1, 2, 3, 4, 5, 6, 7, 8, 9], + [1, 2, 3, 4, 5, 6, 7, 8, 9], [1, 2, 3, 4, 5, 6, 7, 8, 9], + [1, 2, 3, 4, 5, 6, 7, 8, 9], [1, 2, 3, 4, 5, 6, 7, 8, 9]], + dtype=tf.float64) + outputs = tf.gather_nd(inputs, indices) + grad_vals = tf.constant( + [[1, 1, 1, 1, 1, 1, 1, 1, 1], [2, 2, 2, 2, 2, 2, 2, 2, 2], + [3, 3, 3, 3, 3, 3, 3, 3, 3]], + dtype=tf.float64) + grads = tf.gradients([outputs], [inputs], [grad_vals])[0] + expected_grads = np.array( + [[2, 2, 2, 2, 2, 2, 2, 2, 2], [0, 0, 0, 0, 0, 0, 0, 0, 0], + [1, 1, 1, 1, 1, 1, 1, 1, 1], [0, 0, 0, 0, 0, 0, 0, 0, 0], + [0, 0, 0, 0, 0, 0, 0, 0, 0], [3, 3, 3, 3, 3, 3, 3, 3, 3]], + dtype=np.float64) + with self.test_session(): + self.assertAllEqual(expected_grads, 
grads.eval()) + class GatherNdGpuTest(GatherNdTest): use_gpu = True diff --git a/tensorflow/python/kernel_tests/io_ops_test.py b/tensorflow/python/kernel_tests/io_ops_test.py index 9e85fe2b97a..d484a609fce 100644 --- a/tensorflow/python/kernel_tests/io_ops_test.py +++ b/tensorflow/python/kernel_tests/io_ops_test.py @@ -39,6 +39,18 @@ class IoOpsTest(tf.test.TestCase): self.assertEqual([], read.get_shape()) self.assertEqual(read.eval(), contents) + def testWriteFile(self): + cases = ['', 'Some contents'] + for contents in cases: + contents = tf.compat.as_bytes(contents) + temp = tempfile.NamedTemporaryFile( + prefix='WriteFileTest', dir=self.get_temp_dir()) + with self.test_session() as sess: + w = tf.write_file(temp.name, contents) + sess.run(w) + file_contents = open(temp.name, 'rb').read() + self.assertEqual(file_contents, contents) + def _subset(self, files, indices): return set(tf.compat.as_bytes(files[i].name) for i in range(len(files)) if i in indices) diff --git a/tensorflow/python/kernel_tests/linalg_grad_test.py b/tensorflow/python/kernel_tests/linalg_grad_test.py index 062b714a103..a61e8ed8c2f 100644 --- a/tensorflow/python/kernel_tests/linalg_grad_test.py +++ b/tensorflow/python/kernel_tests/linalg_grad_test.py @@ -163,8 +163,19 @@ if __name__ == '__main__': _GetMatrixUnaryFunctorGradientTest(tf.matrix_inverse, dtype, shape)) setattr(MatrixUnaryFunctorGradientTest, - 'testMatrixUnaryFunctorGradient_' + name, - _GetMatrixUnaryFunctorGradientTest(tf.matrix_determinant, - dtype, shape)) + 'testMatrixDeterminantGradient_' + name, + _GetMatrixUnaryFunctorGradientTest(tf.matrix_determinant, dtype, + shape)) + + # Tests for gradients of matrix_solve_ls + for dtype in np.float32, np.float64: + for rows in 2, 5, 10: + for cols in 2, 5, 10: + for l2_regularization in 0.0, 0.001, 1.0: + shape = (rows, cols) + # Derive a distinct name per case; reusing the stale `name` left + # over from the loop above would register every case under the + # same attribute, so only the last one would actually run. + name = '%s_%d_%d_reg_%s' % (dtype.__name__, rows, cols, + l2_regularization) + setattr(MatrixBinaryFunctorGradientTest, + 'testMatrixSolveLsGradient_' + name, + _GetMatrixBinaryFunctorGradientTest(tf.matrix_solve_ls, dtype, + shape)) tf.test.main() diff --git a/tensorflow/python/kernel_tests/parameterized_truncated_normal_op_test.py b/tensorflow/python/kernel_tests/parameterized_truncated_normal_op_test.py index 8d41029c0b5..1c09949598a 100644 --- a/tensorflow/python/kernel_tests/parameterized_truncated_normal_op_test.py +++ b/tensorflow/python/kernel_tests/parameterized_truncated_normal_op_test.py @@ -97,10 +97,10 @@ def z_test(real, expected, i, num_samples): class ParameterizedTruncatedNormalTest(tf.test.TestCase): - use_gpu = False + _use_gpu = False z_limit = 6.0 - # Stop at moment 20 to avoid numerical errors in the theoretical moments. + # Stop at moment 10 to avoid numerical errors in the theoretical moments. max_moment = 10 def validateMoments(self, shape, mean, stddev, minval, maxval, seed=1618): @@ -109,9 +109,11 @@ class ParameterizedTruncatedNormalTest(tf.test.TestCase): # Give up early if we are unable to import it.
import scipy.stats # pylint: disable=g-import-not-at-top,unused-variable tf.set_random_seed(seed) - with self.test_session(use_gpu=self.use_gpu): - samples = random_ops.parameterized_truncated_normal( - shape, mean, stddev, minval, maxval).eval() + with self.test_session(use_gpu=self._use_gpu): + samples = random_ops.parameterized_truncated_normal(shape, mean, stddev, + minval, + maxval).eval() + assert (~np.isnan(samples)).all() moments = calculate_moments(samples, self.max_moment) expected_moments = TruncatedNormalMoments(mean, stddev, minval, maxval) num_samples = functools.reduce(lambda x, y: x * y, shape, 1) @@ -131,9 +133,11 @@ class ParameterizedTruncatedNormalTest(tf.test.TestCase): try: import scipy.stats # pylint: disable=g-import-not-at-top tf.set_random_seed(seed) - with self.test_session(use_gpu=self.use_gpu): - samples = random_ops.parameterized_truncated_normal( - shape, mean, stddev, minval, maxval).eval() + with self.test_session(use_gpu=self._use_gpu): + samples = random_ops.parameterized_truncated_normal(shape, mean, stddev, + minval, + maxval).eval() + assert (~np.isnan(samples)).all() minval = max(mean - stddev * 10, minval) maxval = min(mean + stddev * 10, maxval) dist = scipy.stats.norm(loc=mean, scale=stddev) @@ -173,8 +177,12 @@ class ParameterizedTruncatedNormalTest(tf.test.TestCase): self.validateKolmogorovSmirnov([10**5], 0.0, 0.1, 0.05, 0.10) +class ParameterizedTruncatedNormalGpuTest(ParameterizedTruncatedNormalTest): + _use_gpu = True + + # Benchmarking code -def parameterized_vs_naive(shape, num_iters): +def parameterized_vs_naive(shape, num_iters, use_gpu=False): np.random.seed(1618) # Make it reproducible. # No CSE/CF. @@ -183,17 +191,29 @@ def parameterized_vs_naive(shape, num_iters): graph_options=tf.GraphOptions(optimizer_options=optimizer_options)) with tf.Session(config=config) as sess: - param_op = tf.group(random_ops.parameterized_truncated_normal(shape)) - naive_op = tf.group(random_ops.truncated_normal(shape)) + with tf.device("/cpu:0" if not use_gpu else None): + param_op = tf.group(random_ops.parameterized_truncated_normal(shape)) + naive_op = tf.group(random_ops.truncated_normal(shape)) + # Burn-in to avoid session setup costs in the timing. + sess.run(param_op) + sess.run(param_op) param_dt = timeit.timeit(lambda: sess.run(param_op), number=num_iters) + sess.run(naive_op) + sess.run(naive_op) naive_dt = timeit.timeit(lambda: sess.run(naive_op), number=num_iters) return param_dt, naive_dt class TruncatedNormalBenchmark(tf.test.Benchmark): - def benchmarkParameterizedOpVsNaiveOp(self): + def benchmarkParameterizedOpVsNaiveOpCpu(self): + self._benchmarkParameterizedOpVsNaiveOp(False) + + def benchmarkParameterizedOpVsNaiveOpGpu(self): + self._benchmarkParameterizedOpVsNaiveOp(True) + + def _benchmarkParameterizedOpVsNaiveOp(self, use_gpu): num_iters = 50 print(("Composition of new ParameterizedTruncatedNormalOp vs. 
" "naive TruncatedNormalOp [%d iters]") % num_iters) @@ -201,16 +221,16 @@ class TruncatedNormalBenchmark(tf.test.Benchmark): for shape in [[10000, 100], [1000, 1000], [1000000], [100, 100, 100], [20, 20, 20, 20]]: - p_dt, n_dt = parameterized_vs_naive(shape, num_iters) + p_dt, n_dt = parameterized_vs_naive(shape, num_iters, use_gpu) print("%s\t%.3f\t%.3f\t%.2f" % (shape, p_dt, n_dt, p_dt / n_dt)) shape_str = "-".join(map(str, shape)) - self.report_benchmark(name="parameterized_shape" + shape_str, - iters=num_iters, - wall_time=p_dt) - self.report_benchmark(name="naive_shape" + shape_str, - iters=num_iters, - wall_time=n_dt) + self.report_benchmark( + name="parameterized_shape" + shape_str, + iters=num_iters, + wall_time=p_dt) + self.report_benchmark( + name="naive_shape" + shape_str, iters=num_iters, wall_time=n_dt) if __name__ == "__main__": diff --git a/tensorflow/python/kernel_tests/reshape_op_test.py b/tensorflow/python/kernel_tests/reshape_op_test.py index a68f722244e..8e62be107be 100644 --- a/tensorflow/python/kernel_tests/reshape_op_test.py +++ b/tensorflow/python/kernel_tests/reshape_op_test.py @@ -100,7 +100,7 @@ class ReshapeTest(tf.test.TestCase): def testErrors(self): y = tf.constant(0.0, shape=[23, 29, 31]) - with self.assertRaisesRegexp(ValueError, "isn't divisible by 17"): + with self.assertRaisesRegexp(ValueError, "must be evenly divisible by 17"): tf.reshape(y, [17, -1]) z = tf.constant(0.0, shape=[32, 128]) diff --git a/tensorflow/python/kernel_tests/resource_variable_ops_test.py b/tensorflow/python/kernel_tests/resource_variable_ops_test.py index cb4375ce913..116939dc2d8 100644 --- a/tensorflow/python/kernel_tests/resource_variable_ops_test.py +++ b/tensorflow/python/kernel_tests/resource_variable_ops_test.py @@ -19,6 +19,7 @@ from __future__ import print_function from tensorflow.python.framework import constant_op from tensorflow.python.framework import dtypes +from tensorflow.python.framework import ops from tensorflow.python.framework import test_util from tensorflow.python.ops import array_ops from tensorflow.python.ops import resource_variable_ops @@ -46,6 +47,42 @@ class ResourceVariableOpsTest(test_util.TensorFlowTestCase): resource_variable_ops.create_variable_op( id_handle, constant_op.constant(0, dtype=dtypes.int32)).run() + def testCreateRead(self): + with self.test_session(): + handle = resource_variable_ops.var_handle_op(dtype=dtypes.int32, shape=[]) + resource_variable_ops.create_variable_op( + handle, constant_op.constant(1, dtype=dtypes.int32)).run() + value = resource_variable_ops.read_variable_op( + handle, dtype=dtypes.int32).eval() + self.assertAllEqual(1, value) + + def testManyAssigns(self): + with self.test_session() as session: + handle = resource_variable_ops.var_handle_op(dtype=dtypes.int32, shape=[]) + create = resource_variable_ops.create_variable_op( + handle, constant_op.constant(1, dtype=dtypes.int32)) + with ops.control_dependencies([create]): + first_read = resource_variable_ops.read_variable_op( + handle, dtype=dtypes.int32) + with ops.control_dependencies([first_read]): + write = resource_variable_ops.assign_variable_op( + handle, constant_op.constant(2, dtype=dtypes.int32)) + with ops.control_dependencies([write]): + second_read = resource_variable_ops.read_variable_op( + handle, dtype=dtypes.int32) + f, s = session.run([first_read, second_read]) + self.assertEqual(f, 1) + self.assertEqual(s, 2) + + def testAssignAdd(self): + with self.test_session(): + handle = resource_variable_ops.var_handle_op(dtype=dtypes.int32, shape=[]) + 
resource_variable_ops.create_variable_op( + handle, constant_op.constant(1, dtype=dtypes.int32)).run() + assign_add = resource_variable_ops.assign_add_variable_op( + handle, constant_op.constant(1, dtype=dtypes.int32)) + self.assertEqual(assign_add.eval(), 2) + if __name__ == "__main__": test.main() diff --git a/tensorflow/python/kernel_tests/scatter_nd_ops_test.py b/tensorflow/python/kernel_tests/scatter_nd_ops_test.py new file mode 100644 index 00000000000..7ff5a286c69 --- /dev/null +++ b/tensorflow/python/kernel_tests/scatter_nd_ops_test.py @@ -0,0 +1,380 @@ +# Copyright 2015 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== +"""Tests for tensorflow.ops.tf.scatter_nd.""" +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import functools + +import numpy as np +import tensorflow as tf + + +def _AsType(v, vtype): + return v.astype(vtype) if isinstance(v, np.ndarray) else vtype(v) + + +def _FlatInnerDims(tensor, ndims=2): + shape = list(tensor.shape) + return tensor.reshape([functools.reduce(lambda x, y: x * y, + shape[:-ndims + 1], 1)] + + shape[-ndims + 1:]) + + +def _FlatOuterDims(tensor, ndims=2): + shape = list(tensor.shape) + return tensor.reshape(shape[:ndims - 1] + + [functools.reduce(lambda x, y: x * y, + shape[ndims - 1:], 1)]) + + +def _NumpyScatterNd(ref, indices, updates, op): + ixdim = indices.shape[-1] + num_updates = indices.size / ixdim + total_nd = len(ref.shape) + slice_size = 1 + for i in range(ixdim, total_nd): + slice_size *= ref.shape[i] + flat_indices = _FlatInnerDims(indices) + flat_updates = updates.reshape((num_updates, slice_size)) + output_flat = _FlatOuterDims(ref, ixdim + 1) + for ix_updates, ix_output in enumerate(flat_indices): + ix_output = tuple(ix_output) + output_flat[ix_output] = op(output_flat[ix_output], + flat_updates[ix_updates]) + return output_flat.reshape(ref.shape) + + +def _NumpyUpdate(ref, indices, updates): + return _NumpyScatterNd(ref, indices, updates, lambda p, u: u) + + +def _NumpyAdd(ref, indices, updates): + return _NumpyScatterNd(ref, indices, updates, lambda p, u: p + u) + + +def _NumpySub(ref, indices, updates): + return _NumpyScatterNd(ref, indices, updates, lambda p, u: p - u) + + +def _NumpyMul(ref, indices, updates): + return _NumpyScatterNd(ref, indices, updates, lambda p, u: p * u) + + +def _NumpyDiv(ref, indices, updates): + return _NumpyScatterNd(ref, indices, updates, lambda p, u: p / u) + + +class ScatterTest(tf.test.TestCase): + + def _VariableRankTest(self, + np_scatter, + tf_scatter, + vtype, + itype, + use_gpu, + repeat_indices=False): + np.random.seed(8) + ref_shapes = [(3, 6), (3, 6), (3, 6, 9), (3, 6, 9), (3, 6, 9), (3, 6, 9)] + indices_shapes = [(2,), (2, 2), (2,), (2, 2), (2, 3), (2, 3, 3)] + with self.test_session(use_gpu=use_gpu): + for ref_shape, indices_shape in zip(ref_shapes, indices_shapes): + num_updates = indices_shape[0] + 
ixdim = indices_shape[-1] + + indexable_area_shape = () + for i in range(ixdim): + indexable_area_shape += (ref_shape[i],) + all_indices = [ + list(coord) + for coord, _ in np.ndenumerate( + np.empty(indexable_area_shape, vtype)) + ] + np.random.shuffle(all_indices) + indices = np.array(all_indices[:num_updates]) + + if num_updates > 1 and repeat_indices: + indices = indices[:num_updates // 2] + for _ in range(num_updates - num_updates // 2): + indices = np.append( + indices, [indices[np.random.randint(num_updates // 2)]], axis=0) + np.random.shuffle(indices) + indices = _AsType(indices[:num_updates], itype) + + updates_shape = (num_updates,) + for i in range(ixdim, len(ref_shape)): + updates_shape += (ref_shape[i],) + updates = _AsType(np.random.randn(*(updates_shape)), vtype) + ref = _AsType(np.random.randn(*(ref_shape)), vtype) + + # Scatter via numpy + new = ref.copy() + np_scatter(new, indices, updates) + # Scatter via tensorflow + ref_var = tf.Variable(ref) + ref_var.initializer.run() + tf_scatter(ref_var, indices, updates).eval() + # Compare + self.assertAllClose(new, ref_var.eval()) + + def _VariableRankTests(self, np_scatter, tf_scatter): + for vtype in (np.float32, np.float64): + for itype in (np.int32, np.int64): + for use_gpu in (False, True): + self._VariableRankTest(np_scatter, tf_scatter, vtype, itype, use_gpu) + + def testVariableRankUpdate(self): + self._VariableRankTests(_NumpyUpdate, tf.scatter_nd_update) + + def testVariableRankAdd(self): + self._VariableRankTests(_NumpyAdd, tf.scatter_nd_add) + + def testVariableRankSub(self): + self._VariableRankTests(_NumpySub, tf.scatter_nd_sub) + + def testVariableRankMul(self): + self._VariableRankTests(_NumpyMul, tf.scatter_nd_mul) + + def testVariableRankDiv(self): + self._VariableRankTests(_NumpyDiv, tf.scatter_nd_div) + + def _ScatterRepeatIndicesTest(self, np_scatter, tf_scatter): + for vtype in (np.float32, np.float64): + for itype in (np.int32, np.int64): + for use_gpu in (False, True): + self._VariableRankTest( + np_scatter, + tf_scatter, + vtype, + itype, + use_gpu, + repeat_indices=True) + + def testScatterRepeatIndices(self): + """This tests scatter_add using indices that repeat.""" + self._ScatterRepeatIndicesTest(_NumpyAdd, tf.scatter_nd_add) + self._ScatterRepeatIndicesTest(_NumpySub, tf.scatter_nd_sub) + self._ScatterRepeatIndicesTest(_NumpyMul, tf.scatter_nd_mul) + self._ScatterRepeatIndicesTest(_NumpyDiv, tf.scatter_nd_div) + + def testBooleanScatterUpdate(self): + with self.test_session(use_gpu=False) as session: + var = tf.Variable([True, False]) + update0 = tf.scatter_nd_update(var, [[1]], [True]) + update1 = tf.scatter_nd_update( + var, tf.constant( + [[0]], dtype=tf.int64), [False]) + var.initializer.run() + + session.run([update0, update1]) + + self.assertAllEqual([False, True], var.eval()) + + def testScatterOutOfRangeCpu(self): + for op in (tf.scatter_nd_add, tf.scatter_nd_sub, tf.scatter_nd_mul, + tf.scatter_nd_div, tf.scatter_nd_update): + params = np.array([1, 2, 3, 4, 5, 6]).astype(np.float32) + updates = np.array([-3, -4, -5]).astype(np.float32) + with self.test_session(use_gpu=False): + ref = tf.Variable(params) + ref.initializer.run() + + # Indices all in range, no problem. + indices = np.array([[2], [0], [5]]) + op(ref, indices, updates).eval() + + # Test some out of range errors. 
+ indices = np.array([[-1], [0], [5]]) + with self.assertRaisesOpError( + r"Invalid indices: \[0,0\] = \[-1\] is not in \[0, 6\)"): + op(ref, indices, updates).eval() + + indices = np.array([[2], [0], [6]]) + with self.assertRaisesOpError( + r"Invalid indices: \[2,0\] = \[6\] is not in \[0, 6\)"): + op(ref, indices, updates).eval() + + def testRank3ValidShape(self): + indices = tf.zeros([2, 2, 2], tf.int32) + updates = tf.zeros([2, 2, 2], tf.int32) + shape = np.array([2, 2, 2]) + self.assertAllEqual( + tf.scatter_nd(indices, updates, shape).get_shape().as_list(), shape) + + ref = tf.Variable(tf.zeros(shape, tf.int32)) + self.assertAllEqual( + tf.scatter_nd_update(ref, indices, updates).get_shape().as_list(), + shape) + + def testUndefinedIndicesShape(self): + indices = tf.placeholder(tf.int32, shape=None) + updates = tf.placeholder(tf.int32, shape=[2, 2, 2]) + shape = tf.constant([2, 2, 2], tf.int32) + tf.scatter_nd(indices, updates, shape) + + def testUndefinedUpdatesShape(self): + indices = tf.placeholder(tf.int32, shape=[2, 2, 2]) + updates = tf.placeholder(tf.int32, shape=None) + shape = tf.constant([2, 2, 2], tf.int32) + tf.scatter_nd(indices, updates, shape) + + def testUndefinedOutputShape(self): + indices = tf.placeholder(tf.int32, shape=[2, 2, 2]) + updates = tf.placeholder(tf.int32, shape=[2, 2, 2]) + shape = tf.placeholder(tf.int32, shape=[None]) + tf.scatter_nd(indices, updates, shape) + + def testEmptyoutputShape1(self): + indices = tf.zeros([2, 2, 2], tf.int32) + updates = tf.zeros([2, 2, 2], tf.int32) + shape = tf.constant([0, 3, 2], tf.int32) + + with self.assertRaisesWithPredicateMatch( + ValueError, "Indices and updates specified for empty output shape"): + tf.scatter_nd(indices, updates, shape) + + def testEmptyoutputShape2(self): + indices = tf.placeholder(tf.int32, shape=None) + updates = tf.placeholder(tf.int32, shape=None) + shape = tf.constant([0, 3, 2], tf.int32) + + with self.test_session(): + tf.scatter_nd(indices, updates, shape).eval(feed_dict={ + indices: np.zeros( + [2, 2, 2], dtype=np.int32), + updates: np.zeros( + [2, 2, 2], dtype=np.int32) + }) + + def testEmptyoutputShape3(self): + indices = tf.zeros([0], tf.int32) + updates = tf.zeros([0], tf.int32) + shape = tf.constant([0], tf.int32) + scatter = tf.scatter_nd(indices, updates, shape) + + with self.test_session(): + self.assertEqual(scatter.eval().size, 0) + + def testRank3InvalidShape1(self): + indices = tf.zeros([3, 2, 2], tf.int32) + updates = tf.zeros([2, 2, 2], tf.int32) + shape = np.array([2, 2, 2]) + with self.assertRaisesWithPredicateMatch( + ValueError, "The outer \\d+ dimensions of indices\\.shape="): + tf.scatter_nd(indices, updates, shape) + + ref = tf.Variable(tf.zeros(shape, tf.int32)) + with self.assertRaisesWithPredicateMatch( + ValueError, "The outer \\d+ dimensions of indices\\.shape="): + tf.scatter_nd_update(ref, indices, updates) + + def testRank3InvalidShape2(self): + indices = tf.zeros([2, 2, 1], tf.int32) + updates = tf.zeros([2, 2], tf.int32) + shape = np.array([2, 2, 2]) + with self.assertRaisesWithPredicateMatch( + ValueError, "The inner \\d+ dimensions of output\\.shape="): + tf.scatter_nd(indices, updates, shape) + + ref = tf.Variable(tf.zeros(shape, tf.int32)) + with self.assertRaisesWithPredicateMatch( + ValueError, "The inner \\d+ dimensions of ref\\.shape="): + tf.scatter_nd_update(ref, indices, updates) + + def testGradientsRank2ElementUpdate(self): + indices = tf.constant([[0, 0], [1, 1]], dtype=tf.int32) + updates = tf.constant([1, 4], dtype=tf.float64) + shape = 
tf.constant([2, 2], dtype=tf.int32) + outputs = tf.scatter_nd(indices, updates, shape) + + grad_vals = tf.constant([[1, 2], [3, 4]], dtype=tf.float64) + grads = tf.gradients([outputs], [updates], [grad_vals])[0] + expected_grads = np.array([1, 4], dtype=np.float64) + with self.test_session(): + self.assertAllEqual(expected_grads, grads.eval()) + + def testGradientsRank2SliceUpdate(self): + indices = tf.constant([[1], [0]], dtype=tf.int32) + updates = tf.constant([[3, 4], [1, 2]], dtype=tf.float64) + shape = tf.constant([2, 2], dtype=tf.int32) + outputs = tf.scatter_nd(indices, updates, shape) + + grad_vals = tf.constant([[3, 4], [1, 2]], dtype=tf.float64) + grads = tf.gradients([outputs], [updates], [grad_vals])[0] + expected_grads = np.array([[1, 2], [3, 4]], dtype=np.float64) + with self.test_session(): + self.assertAllEqual(expected_grads, grads.eval()) + + def testGradientsRank3SliceUpdate(self): + indices = tf.constant([[[0, 1], [1, 0]], [[0, 0], [1, 1]]], dtype=tf.int32) + updates = tf.constant( + [[[5, 7], [2, 4]], [[1, 3], [6, 8]]], dtype=tf.float64) + shape = tf.constant([2, 2, 2], dtype=tf.int32) + outputs = tf.scatter_nd(indices, updates, shape) + + grad_vals = tf.constant( + [[[1, 2], [3, 4]], [[5, 6], [7, 8]]], dtype=tf.float64) + grads = tf.gradients([outputs], [updates], [grad_vals])[0] + expected_grads = np.array( + [[[3, 4], [5, 6]], [[1, 2], [7, 8]]], dtype=np.float64) + with self.test_session(): + self.assertAllEqual(expected_grads, grads.eval()) + + def testConcurrentUpdates(self): + num_updates = 10000 + update_values = np.random.rand(num_updates) + ref = tf.Variable(np.zeros([2, 2]), dtype=tf.float64) + indices = tf.constant([[0, 1]] * num_updates, dtype=tf.int32) + updates = tf.constant(update_values, dtype=tf.float64) + + expected_result = np.zeros([2, 2], dtype=np.float64) + expected_result[0, 1] = np.sum(update_values) + + scatter = tf.scatter_nd_add(ref, indices, updates) + init = tf.initialize_all_variables() + + with tf.Session() as sess: + sess.run(init) + result = sess.run(scatter) + assert np.allclose(result, expected_result) + + # TODO(fpmc): Re-enable this test when gpu_pip test actually runs on a GPU. + def _disabledTestScatterOutOfRangeGpu(self): + if not tf.test.IsBuiltWithCuda(): + return + for op in (tf.scatter_nd_add, tf.scatter_nd_sub, tf.scatter_nd_mul, + tf.scatter_nd_div, tf.scatter_nd_update): + params = np.array([1, 2, 3, 4, 5, 6]).astype(np.float32) + updates = np.array([-3, -4, -5]).astype(np.float32) + # With GPU, the code ignores indices that are out of range. + # We don't test the implementation; just check that there are no failures. + with self.test_session(force_gpu=True): + ref = tf.Variable(params) + ref.initializer.run() + + # Indices all in range, no problem. + indices = np.array([2, 0, 5]) + op(ref, indices, updates).eval() + + # Indices out of range should not fail. + indices = np.array([-1, 0, 5]) + op(ref, indices, updates).eval() + indices = np.array([2, 0, 6]) + op(ref, indices, updates).eval() + + +if __name__ == "__main__": + tf.test.main()
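Since the tests above exercise the new op only through a harness, a minimal standalone sketch of the `tf.scatter_nd` semantics they rely on (names as exported by this patch): updates are scattered into a zero-initialized tensor of the given shape at the given index prefixes.

```python
import tensorflow as tf

indices = tf.constant([[0], [2]])              # scatter into rows 0 and 2
updates = tf.constant([[5, 5, 5], [7, 7, 7]])  # one row of updates per index
shape = tf.constant([4, 3])                    # output starts as 4x3 zeros

scattered = tf.scatter_nd(indices, updates, shape)
with tf.Session() as sess:
  print(sess.run(scattered))
  # [[5 5 5]
  #  [0 0 0]
  #  [7 7 7]
  #  [0 0 0]]
```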
diff --git a/tensorflow/python/kernel_tests/shape_ops_test.py b/tensorflow/python/kernel_tests/shape_ops_test.py index 465a02bfe69..67d6fdd96a7 100644 --- a/tensorflow/python/kernel_tests/shape_ops_test.py +++ b/tensorflow/python/kernel_tests/shape_ops_test.py @@ -22,7 +22,6 @@ import numpy as np import tensorflow as tf -from tensorflow.python.framework import ops from tensorflow.python.ops import array_ops @@ -36,7 +35,7 @@ def _sparsify(x, thresh=0.5, index_dtype=np.int64): x_values = x[non_zero] x_shape = x.shape - return ops.SparseTensor( + return tf.SparseTensor( indices=x_indices, values=x_values, shape=x_shape), len(x_values) class ShapeOpsTest(tf.test.TestCase): diff --git a/tensorflow/python/kernel_tests/sparse_ops_test.py b/tensorflow/python/kernel_tests/sparse_ops_test.py index 9f2b9f43eff..554556a65af 100644 --- a/tensorflow/python/kernel_tests/sparse_ops_test.py +++ b/tensorflow/python/kernel_tests/sparse_ops_test.py @@ -24,7 +24,6 @@ import tensorflow as tf from tensorflow.python.framework import constant_op from tensorflow.python.framework import dtypes -from tensorflow.python.framework import ops from tensorflow.python.framework import test_util from tensorflow.python.ops import array_ops from tensorflow.python.ops import sparse_ops @@ -41,7 +40,7 @@ def _sparsify(x, thresh=0.5, index_dtype=np.int64): x_values = x[non_zero] x_shape = x.shape - return ops.SparseTensor( + return tf.SparseTensor( indices=x_indices, values=x_values, shape=x_shape), len(x_values) @@ -54,7 +53,7 @@ class SparseToIndicatorTest(test_util.TensorFlowTestCase): [3, 2], [3, 3]]) val = np.array([0, 10, 13, 14, 32, 33]) shape = np.array([5, 6]) - return ops.SparseTensor( + return tf.SparseTensor( constant_op.constant(ind, dtypes.int64), constant_op.constant(val, dtype), constant_op.constant(shape, dtypes.int64)) @@ -72,7 +71,7 @@ [1, 2, 2]]) val = np.array([1, 10, 12, 103, 150, 149, 150, 122]) shape = np.array([2, 3, 4]) - return ops.SparseTensor( + return tf.SparseTensor( constant_op.constant(ind, dtypes.int64), constant_op.constant(val, dtype), constant_op.constant(shape, dtypes.int64)) @@ -130,11 +129,11 @@ class SparseMergeTest(test_util.TensorFlowTestCase): indices = np.array([0, 13, 10, 33, 32, 14]) values = np.array([-3, 4, 1, 9, 5, 1]) shape = np.array([3, 3]) - indices = ops.SparseTensorValue( + indices = tf.SparseTensorValue( np.array(ind, np.int64), np.array(indices, indices_dtype), np.array(shape, np.int64)) - values = ops.SparseTensorValue( + values = tf.SparseTensorValue( np.array(ind, np.int64), np.array(values, values_dtype), np.array(shape, np.int64)) @@ -143,8 +142,8 @@ def _SparseTensor_3x50(self, indices_dtype, values_dtype): indices, values = self._SparseTensorValue_3x50(indices_dtype, values_dtype) return ( - ops.SparseTensor.from_value(indices), - ops.SparseTensor.from_value(values)) + tf.SparseTensor.from_value(indices), + tf.SparseTensor.from_value(values)) def _AssertResultsSorted(self, output, vocab_size): self.assertAllEqual( @@ -172,8 +171,8 @@ class SparseMergeTest(test_util.TensorFlowTestCase): vocab_size = 50 indices_v, values_v = self._SparseTensorValue_3x50(np.int32, np.float32) with self.test_session(use_gpu=False) as sess: - for indices in (indices_v,
ops.SparseTensor.from_value(indices_v)): - for values in (values_v, ops.SparseTensor.from_value(values_v)): + for indices in (indices_v, tf.SparseTensor.from_value(indices_v)): + for values in (values_v, tf.SparseTensor.from_value(values_v)): sp_output = sparse_ops.sparse_merge(indices, values, vocab_size) output = sess.run(sp_output) @@ -237,13 +236,13 @@ class SparseRetainTest(test_util.TensorFlowTestCase): [3, 2], [3, 3]]) val = np.array([0, 10, 13, 14, 32, 33]) shape = np.array([5, 6]) - return ops.SparseTensorValue( + return tf.SparseTensorValue( np.array(ind, np.int64), np.array(val, np.int32), np.array(shape, np.int64)) def _SparseTensor_5x6(self): - return ops.SparseTensor.from_value(self._SparseTensorValue_5x6()) + return tf.SparseTensor.from_value(self._SparseTensorValue_5x6()) def testBasic(self): with self.test_session(use_gpu=False) as sess: @@ -285,14 +284,14 @@ class SparseResetShapeTest(test_util.TensorFlowTestCase): _SHP_2_5_6 = np.array([2, 5, 6], dtype=np.int64) def _SparseTensor_2x5x6(self): - return ops.SparseTensor( + return tf.SparseTensor( constant_op.constant(self._IND_2_5_6, dtypes.int64), constant_op.constant(self._VAL_2_5_6, dtypes.int32), constant_op.constant(self._SHP_2_5_6, dtypes.int64)) def _SparseTensorValue_2x5x6(self): - return ops.SparseTensorValue(self._IND_2_5_6, self._VAL_2_5_6, - self._SHP_2_5_6) + return tf.SparseTensorValue(self._IND_2_5_6, self._VAL_2_5_6, + self._SHP_2_5_6) def testBasic(self): with self.test_session(use_gpu=False) as sess: @@ -395,13 +394,13 @@ class SparseFillEmptyRowsTest(test_util.TensorFlowTestCase): [3, 2], [3, 3]]) val = np.array([0, 10, 13, 14, 32, 33]) shape = np.array([5, 6]) - return ops.SparseTensorValue( + return tf.SparseTensorValue( np.array(ind, np.int64), np.array(val, np.int32), np.array(shape, np.int64)) def _SparseTensor_5x6(self): - return ops.SparseTensor.from_value(self._SparseTensorValue_5x6()) + return tf.SparseTensor.from_value(self._SparseTensorValue_5x6()) def _SparseTensor_String5x6(self): ind = np.array([ @@ -410,7 +409,7 @@ class SparseFillEmptyRowsTest(test_util.TensorFlowTestCase): [3, 2], [3, 3]]) val = np.array(["a", "b", "c", "d", "e", "f"]) shape = np.array([5, 6]) - return ops.SparseTensor( + return tf.SparseTensor( constant_op.constant(ind, dtypes.int64), constant_op.constant(val, dtypes.string), constant_op.constant(shape, dtypes.int64)) @@ -419,7 +418,7 @@ class SparseFillEmptyRowsTest(test_util.TensorFlowTestCase): ind = np.array([[0, 0], [1, 0], [1, 3], [1, 4]]) val = np.array([0, 10, 13, 14]) shape = np.array([2, 6]) - return ops.SparseTensor( + return tf.SparseTensor( constant_op.constant(ind, dtypes.int64), constant_op.constant(val, dtypes.int32), constant_op.constant(shape, dtypes.int64)) @@ -518,7 +517,7 @@ class SparseReduceSumTest(test_util.TensorFlowTestCase): self._compare(sp_t, reduction_axes, ndims, True) def testSimpleAndRandomInputs(self): - sp_t = ops.SparseTensor(self.ind, self.vals, self.shape) + sp_t = tf.SparseTensor(self.ind, self.vals, self.shape) with self.test_session(use_gpu=False): self._compare_all(sp_t, None, ndims=2) @@ -542,7 +541,7 @@ class SparseReduceSumTest(test_util.TensorFlowTestCase): self._compare_all(sp_t, axes, ndims=len(dims)) def testInvalidAxes(self): - sp_t = ops.SparseTensor(self.ind, self.vals, self.shape) + sp_t = tf.SparseTensor(self.ind, self.vals, self.shape) with self.test_session(use_gpu=False): with self.assertRaisesOpError("Invalid reduction dimension -3"): sparse_ops.sparse_reduce_sum(sp_t, -3).eval() @@ -574,8 +573,8 @@ class 
SparseReduceSumTest(test_util.TensorFlowTestCase): class SparseMathOpsTest(test_util.TensorFlowTestCase): def _check(self, result_tensor, result_np, input_sp_t): - self.assertTrue(isinstance(result_tensor, ops.SparseTensor)) - self.assertTrue(isinstance(input_sp_t, ops.SparseTensor)) + self.assertTrue(isinstance(result_tensor, tf.SparseTensor)) + self.assertTrue(isinstance(input_sp_t, tf.SparseTensor)) self.assertAllEqual(input_sp_t.indices.eval(), result_tensor.indices.eval()) self.assertAllEqual(input_sp_t.shape.eval(), result_tensor.shape.eval()) @@ -725,17 +724,17 @@ class SparseMinimumMaximumTest(test_util.TensorFlowTestCase): def testBasic(self): with self.test_session(use_gpu=False): # 1-D, values at index 0. - sp_zero = ops.SparseTensor([[0]], [0], [7]) - sp_one = ops.SparseTensor([[0]], [1], [7]) + sp_zero = tf.SparseTensor([[0]], [0], [7]) + sp_one = tf.SparseTensor([[0]], [1], [7]) max_tf = tf.sparse_maximum(sp_zero, sp_one).eval() min_tf = tf.sparse_minimum(sp_zero, sp_one).eval() self._assertSparseTensorValueEqual(sp_one.eval(), max_tf) self._assertSparseTensorValueEqual(sp_zero.eval(), min_tf) # Values at different indices. - sp_zero = ops.SparseTensor([[0]], [0], [7]) - sp_zero_2 = ops.SparseTensor([[1]], [0], [7]) - expected = ops.SparseTensor([[0], [1]], [0, 0], [7]) + sp_zero = tf.SparseTensor([[0]], [0], [7]) + sp_zero_2 = tf.SparseTensor([[1]], [0], [7]) + expected = tf.SparseTensor([[0], [1]], [0, 0], [7]) max_tf = tf.sparse_maximum(sp_zero, sp_zero_2).eval() min_tf = tf.sparse_minimum(sp_zero, sp_zero_2).eval() self._assertSparseTensorValueEqual(expected.eval(), max_tf) @@ -767,13 +766,13 @@ class SparseMinimumMaximumTest(test_util.TensorFlowTestCase): def testMismatchedShapes(self): with self.test_session(use_gpu=False): - sp_zero = ops.SparseTensor([[0, 0]], [0], [1, 1]) - sp_one = ops.SparseTensor([[0]], [1], [2]) + sp_zero = tf.SparseTensor([[0, 0]], [0], [1, 1]) + sp_one = tf.SparseTensor([[0]], [1], [2]) with self.assertRaisesOpError("Operands do not have the same ranks"): tf.sparse_maximum(sp_zero, sp_one).eval() - sp_zero = ops.SparseTensor([[0]], [0], [1]) - sp_one = ops.SparseTensor([[0]], [1], [2]) + sp_zero = tf.SparseTensor([[0]], [0], [1]) + sp_one = tf.SparseTensor([[0]], [1], [2]) with self.assertRaisesOpError("Operands' shapes do not match"): tf.sparse_maximum(sp_zero, sp_one).eval() diff --git a/tensorflow/python/kernel_tests/variables_test.py b/tensorflow/python/kernel_tests/variables_test.py index a3cd3240f25..c715e5630d0 100644 --- a/tensorflow/python/kernel_tests/variables_test.py +++ b/tensorflow/python/kernel_tests/variables_test.py @@ -49,7 +49,7 @@ class VariablesTestCase(tf.test.TestCase): with self.assertRaisesOpError("Attempting to use uninitialized value"): var1.eval() - tf.initialize_all_variables().run() + tf.global_variables_initializer().run() self.assertAllClose(0.0, var0.eval()) self.assertAllClose(1.1, var1.eval()) @@ -75,7 +75,7 @@ class VariablesTestCase(tf.test.TestCase): self.assertEqual([3, 6], depdep.get_shape()) self.assertEqual([3, 6], depdep.get_shape()) - tf.initialize_all_variables().run() + tf.global_variables_initializer().run() self.assertAllClose(rnd.eval(), dep.eval()) self.assertAllClose(rnd.eval() + dep.eval() + 2.0, @@ -95,7 +95,7 @@ class VariablesTestCase(tf.test.TestCase): plus_one = var.assign_add(1.0) minus_one = var.assign_sub(2.0) four = var.assign(4.0) - tf.initialize_all_variables().run() + tf.global_variables_initializer().run() self.assertAllClose(0.0, var.eval()) self.assertAllClose(1.0, 
plus_one.eval()) @@ -113,7 +113,7 @@ class VariablesTestCase(tf.test.TestCase): var = tf.Variable(zero) count_up_to = var.count_up_to(3) - tf.initialize_all_variables().run() + tf.global_variables_initializer().run() self.assertEqual(0, var.eval()) self.assertEqual(0, count_up_to.eval()) @@ -193,7 +193,7 @@ class VariablesTestCase(tf.test.TestCase): with self.test_session(): var_x = tf.Variable(2.0) var_y = tf.Variable(3.0) - tf.initialize_all_variables().run() + tf.global_variables_initializer().run() self.assertAllClose(2.0, var_x.eval()) self.assertAllClose(3.0, var_y.eval()) self.assertAllClose(5.0, tf.add(var_x, var_y).eval()) @@ -204,7 +204,7 @@ class VariablesTestCase(tf.test.TestCase): zero_size_const = tf.ones([2, 0]) variable_mul = tf.matmul(zero_size_const, zero_size_var) const_mul = tf.matmul(zero_size_const, zero_size_const, transpose_b=True) - tf.initialize_all_variables().run() + tf.global_variables_initializer().run() variable_output = variable_mul.eval() self.assertAllClose(const_mul.eval(), variable_output) self.assertAllClose([[0., 0.], [0., 0.]], variable_output) @@ -230,7 +230,7 @@ class VariablesTestCase(tf.test.TestCase): 2.0, trainable=True, collections=[tf.GraphKeys.TRAINABLE_VARIABLES, tf.GraphKeys.VARIABLES]) - self.assertEqual([var_x, var_y, var_z, var_t], tf.all_variables()) + self.assertEqual([var_x, var_y, var_z, var_t], tf.global_variables()) self.assertEqual([var_x, var_z, var_t], tf.trainable_variables()) def testOperators(self): @@ -269,7 +269,7 @@ class VariablesTestCase(tf.test.TestCase): var_t = tf.Variable(rnd) slice_v = var_t[2, 0:0] - tf.initialize_all_variables().run() + tf.global_variables_initializer().run() self.assertAllClose([2.0], add.eval()) self.assertAllClose([3.0], radd.eval()) self.assertAllClose([1.0], sub.eval()) @@ -302,7 +302,7 @@ class VariablesTestCase(tf.test.TestCase): def testSession(self): with self.test_session() as sess: var = tf.Variable([1, 12]) - tf.initialize_all_variables().run() + tf.global_variables_initializer().run() self.assertAllClose([1, 12], sess.run(var)) def testDevicePlacement(self): @@ -310,7 +310,7 @@ class VariablesTestCase(tf.test.TestCase): with tf.device("/cpu:0"): var = tf.Variable([1, 12]) init_value = var.initialized_value() - init_op = tf.initialize_all_variables() + init_op = tf.global_variables_initializer() self.assertEqual(var.op.device, init_value.device) self.assertEqual(var.op.device, init_op.device) sess.run(init_op) @@ -348,7 +348,7 @@ class VariablesTestCase(tf.test.TestCase): with self.assertRaises(tf.errors.FailedPreconditionError): v2.eval() - tf.initialize_all_variables().run() + tf.global_variables_initializer().run() self.assertAllClose(np.negative(value), v2.eval()) def testInitializerFunctionDevicePlacement(self): @@ -385,7 +385,7 @@ class IsInitializedTest(tf.test.TestCase): _ = v, w uninited = tf.report_uninitialized_variables() self.assertAllEqual(np.array([b"v", b"w"]), sess.run(uninited)) - tf.initialize_all_variables().run() + tf.global_variables_initializer().run() self.assertEqual(0, sess.run(uninited).size) def testVariableList(self): @@ -411,7 +411,7 @@ class IsInitializedTest(tf.test.TestCase): a = tf.Variable(tf.zeros([0, 2])) b = tf.Variable(tf.ones([2, 2])) objective = tf.reduce_sum(b + tf.matmul(a, a, transpose_a=True)) - tf.initialize_all_variables().run() + tf.global_variables_initializer().run() do_opt = tf.train.GradientDescentOptimizer(0.1).minimize(objective) sess.run([do_opt]) self.assertAllClose([[0.9, 0.9], [0.9, 0.9]], b.eval())
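All of these one-line substitutions follow the same recipe: the newer names tf.global_variables_initializer() and tf.global_variables() replace the deprecated tf.initialize_all_variables() and tf.all_variables(). A minimal sketch of the new spelling (assuming a build where the new names exist, as this patch presupposes):

import tensorflow as tf

v = tf.Variable(tf.zeros([2]))
init = tf.global_variables_initializer()  # was: tf.initialize_all_variables()

with tf.Session() as sess:
    sess.run(init)
    print(sess.run(v))            # [0. 0.]
    print(tf.global_variables())  # was: tf.all_variables()

@@ -431,7 +431,7 @@ class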
ObsoleteIsInitializedTest(tf.test.TestCase): inited = tf.assert_variables_initialized() with self.assertRaisesOpError("Attempting to use uninitialized value"): sess.run(inited) - tf.initialize_all_variables().run() + tf.global_variables_initializer().run() sess.run(inited) def testVariableList(self): diff --git a/tensorflow/python/lib/io/file_io.i b/tensorflow/python/lib/io/file_io.i index d88e6b59b6f..33a0ef64922 100644 --- a/tensorflow/python/lib/io/file_io.i +++ b/tensorflow/python/lib/io/file_io.i @@ -66,6 +66,16 @@ void WriteStringToFile(const string& filename, const string& file_content, } } +std::vector<string> GetChildren(const string& dir, TF_Status* out_status) { + std::vector<string> results; + tensorflow::Status status = tensorflow::Env::Default()->GetChildren( + dir, &results); + if (!status.ok()) { + Set_TF_Status_from_Status(out_status, status); + } + return results; +} + std::vector<string> GetMatchingFiles(const string& filename, TF_Status* out_status) { std::vector<string> results; @@ -233,6 +243,7 @@ inline void DeleteFile(const string& filename, TF_Status* out_status); string ReadFileToString(const string& filename, TF_Status* out_status); void WriteStringToFile(const string& filename, const string& file_content, TF_Status* out_status); +std::vector<string> GetChildren(const string& dir, TF_Status* out_status); std::vector<string> GetMatchingFiles(const string& filename, TF_Status* out_status); void CreateDir(const string& dirname, TF_Status* out_status); diff --git a/tensorflow/python/lib/io/file_io.py b/tensorflow/python/lib/io/file_io.py index 87550bb094f..adce569019e 100644 --- a/tensorflow/python/lib/io/file_io.py +++ b/tensorflow/python/lib/io/file_io.py @@ -388,11 +388,14 @@ def list_directory(dirname): """ if not is_directory(dirname): raise errors.NotFoundError(None, None, "Could not find directory") - file_list = get_matching_files(os.path.join(compat.as_str_any(dirname), "*")) - return [ - compat.as_str_any(pywrap_tensorflow.Basename(compat.as_bytes(filename))) - for filename in file_list - ] + with errors.raise_exception_on_not_ok_status() as status: + # Convert each element to string, since the elements of the returned + # vector of strings should be interpreted as strings, not bytes. + return [ + compat.as_str_any(filename) + for filename in pywrap_tensorflow.GetChildren( + compat.as_bytes(dirname), status) + ] def walk(top, in_order=True):
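The net effect for callers: list_directory() now asks Env::Default()->GetChildren() for the directory entries directly instead of globbing with "*", so it returns files and subdirectories alike, as str. A small usage sketch (the /tmp path is illustrative):

from tensorflow.python.lib.io import file_io

# Names (not full paths) of every entry in the directory; raises
# NotFoundError if the directory does not exist.
if file_io.is_directory("/tmp/my_dir"):
    for name in file_io.list_directory("/tmp/my_dir"):
        print(name)

diff --git a/tensorflow/python/lib/io/python_io.py b/tensorflow/python/lib/io/python_io.py index 7ffb79ef9ae..a4c682aa28a 100644 --- a/tensorflow/python/lib/io/python_io.py +++ b/tensorflow/python/lib/io/python_io.py @@ -21,6 +21,8 @@ suitable if fast sharding or other non-sequential access is desired.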
@@TFRecordWriter @@tf_record_iterator +@@TFRecordCompressionType +@@TFRecordOptions - - - @@ -49,7 +51,8 @@ from __future__ import print_function # pylint: disable=wildcard-import from tensorflow.python.lib.io.tf_record import * # pylint: enable=wildcard-import -from tensorflow.python.util.all_util import make_all +from tensorflow.python.util.all_util import remove_undocumented +_allowed_symbols = [] -__all__ = make_all(__name__) +remove_undocumented(__name__, _allowed_symbols) diff --git a/tensorflow/python/lib/io/tf_record.py b/tensorflow/python/lib/io/tf_record.py index c07ff5c2d3d..9dc3ac52c2a 100644 --- a/tensorflow/python/lib/io/tf_record.py +++ b/tensorflow/python/lib/io/tf_record.py @@ -25,6 +25,7 @@ from tensorflow.python.util import compat class TFRecordCompressionType(object): + """The type of compression for the record.""" NONE = 0 ZLIB = 1 GZIP = 2 diff --git a/tensorflow/python/ops/array_grad.py b/tensorflow/python/ops/array_grad.py index 40f4ceb69d7..d96002169ab 100644 --- a/tensorflow/python/ops/array_grad.py +++ b/tensorflow/python/ops/array_grad.py @@ -23,6 +23,7 @@ from math import ceil from tensorflow.python.framework import constant_op from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.framework import tensor_util from tensorflow.python.ops import array_ops from tensorflow.python.ops import gen_array_ops @@ -301,8 +302,12 @@ def _GatherGrad(op, grad): @ops.RegisterGradient("GatherNd") -def _GatherNdGrad(unused_op, unused_grad): - raise NotImplementedError("Gradient for gather_nd is not implemented.") +def _GatherNdGrad(op, grad): + ref = op.inputs[0] + ref_shape = array_ops.shape(ref) + indices = op.inputs[1] + ref_grad = array_ops.scatter_nd(indices, grad, ref_shape) + return [ref_grad, None] @ops.RegisterGradient("CheckNumerics") @@ -552,7 +557,7 @@ def _ExtractImagePatchesGrad(op, grad): sp_shape = (rows_in * cols_in, rows_out * cols_out * ksize_r * ksize_c) - sp_mat = ops.SparseTensor( + sp_mat = sparse_tensor.SparseTensor( array_ops.constant(idx, dtype=ops.dtypes.int64), array_ops.ones((len(idx),), dtype=ops.dtypes.float32), sp_shape @@ -566,3 +571,10 @@ def _ExtractImagePatchesGrad(op, grad): grad_out = array_ops.transpose(grad_out, (2, 0, 1, 3)) return [grad_out] + + +@ops.RegisterGradient("ScatterNd") +def _ScatterNdGrad(op, grad): + indices = op.inputs[0] + updates_grad = array_ops.gather_nd(grad, indices) + return [None, updates_grad, None] diff --git a/tensorflow/python/ops/array_ops.py b/tensorflow/python/ops/array_ops.py index 6474d54f66f..9206002f5ef 100644 --- a/tensorflow/python/ops/array_ops.py +++ b/tensorflow/python/ops/array_ops.py @@ -71,6 +71,7 @@ or join multiple tensors together. @@gather @@gather_nd @@unique_with_counts +@@scatter_nd @@dynamic_partition @@dynamic_stitch @@boolean_mask @@ -81,6 +82,15 @@ or join multiple tensors together. @@quantized_concat @@setdiff1d +## Fake quantization +Operations used to help train for better quantization accuracy. 
+ +@@fake_quant_with_min_max_args +@@fake_quant_with_min_max_args_gradient +@@fake_quant_with_min_max_vars +@@fake_quant_with_min_max_vars_gradient +@@fake_quant_with_min_max_vars_per_channel +@@fake_quant_with_min_max_vars_per_channel_gradient """ from __future__ import absolute_import from __future__ import division @@ -93,6 +103,7 @@ from tensorflow.python.framework import common_shapes from tensorflow.python.framework import constant_op from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.framework import tensor_shape from tensorflow.python.framework import tensor_util # 'Constant' gets imported in the module 'array_ops'. @@ -176,7 +187,8 @@ def shape_internal(input, name=None, optimize=True, out_type=dtypes.int32): """ with ops.name_scope(name, "Shape", [input]) as name: - if isinstance(input, (ops.SparseTensor, ops.SparseTensorValue)): + if isinstance( + input, (sparse_tensor.SparseTensor, sparse_tensor.SparseTensorValue)): return gen_math_ops.cast(input.shape, out_type) else: input_tensor = ops.convert_to_tensor(input) @@ -227,7 +239,8 @@ def size_internal(input, name=None, optimize=True, out_type=dtypes.int32): A `Tensor` of type `out_type`. """ with ops.name_scope(name, "Size", [input]) as name: - if isinstance(input, (ops.SparseTensor, ops.SparseTensorValue)): + if isinstance( + input, (sparse_tensor.SparseTensor, sparse_tensor.SparseTensorValue)): return gen_math_ops._prod( gen_math_ops.cast(input.shape, out_type), 0, name=name) else: @@ -279,7 +292,8 @@ def rank_internal(input, name=None, optimize=True): A `Tensor` of type `int32`. """ with ops.name_scope(name, "Rank", [input]) as name: - if isinstance(input, (ops.SparseTensor, ops.SparseTensorValue)): + if isinstance( + input, (sparse_tensor.SparseTensor, sparse_tensor.SparseTensorValue)): return gen_array_ops.size(input.shape, name=name) else: input_tensor = ops.convert_to_tensor(input) @@ -1445,6 +1459,17 @@ def placeholder(dtype, shape=None, name=None): return ret +# pylint: disable=redefined-outer-name +def _normalize_sparse_shape(shape, name): + """Takes numpy array or Tensor or None and returns either None or Tensor.""" + if shape is None: return None + if not isinstance(shape, ops.Tensor): + for el in shape: + if el is None: + return None + return ops.convert_to_tensor(shape, name=name) + + def sparse_placeholder(dtype, shape=None, name=None): """Inserts a placeholder for a sparse tensor that will be always fed. @@ -1484,14 +1509,11 @@ def sparse_placeholder(dtype, shape=None, name=None): A `SparseTensor` that may be used as a handle for feeding a value, but not evaluated directly. 
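"""

Worth noting before the implementation: the new _normalize_sparse_shape() above sends a fully known shape through convert_to_tensor, while any shape containing None falls back to an int64 placeholder that must be fed. A hedged sketch of the two paths (names and values illustrative):

import numpy as np
import tensorflow as tf

sp_known = tf.sparse_placeholder(tf.float32, shape=[3, 4])       # shape captured as a constant
sp_dynamic = tf.sparse_placeholder(tf.float32, shape=[None, 4])  # shape must be fed

value = tf.SparseTensorValue(indices=np.array([[0, 0]], np.int64),
                             values=np.array([7.0], np.float32),
                             shape=np.array([3, 4], np.int64))
with tf.Session() as sess:
    total = tf.sparse_reduce_sum(sp_dynamic)
    print(sess.run(total, feed_dict={sp_dynamic: value}))  # 7.0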
""" + shape_name = (name + "/shape") if name is not None else None + shape = _normalize_sparse_shape(shape, shape_name) if shape is None: - shape = placeholder( - dtypes.int64, shape=[None], - name=(name + "/shape") if name is not None else None) - else: - shape = ops.convert_to_tensor( - shape, name=(name + "/shape") if name is not None else None) - return ops.SparseTensor( + shape = placeholder(dtypes.int64, shape=[None], name=shape_name) + return sparse_tensor.SparseTensor( values=placeholder( dtype, shape=[None], name=(name + "/values") if name is not None else None), @@ -1500,6 +1522,7 @@ def sparse_placeholder(dtype, shape=None, name=None): name=(name + "/indices") if name is not None else None), shape=shape ) +# pylint: enable=redefined-outer-name def pad(tensor, paddings, mode="CONSTANT", name=None): # pylint: disable=invalid-name @@ -1774,6 +1797,10 @@ ops.RegisterShape("Bitcast")(common_shapes.call_cpp_shape_fn) @ops.RegisterShape("Reshape") +def _DelegateReshapeShape(op): + return common_shapes.call_cpp_shape_fn(op, input_tensors_as_shapes_needed=[1]) + + def _ReshapeShape(op): """Shape function for Reshape op.""" input_shape = op.inputs[0].get_shape() @@ -1991,9 +2018,13 @@ def edit_distance(hypothesis, truth, normalize=True, name="edit_distance"): Raises: TypeError: If either `hypothesis` or `truth` are not a `SparseTensor`. """ - if not isinstance(hypothesis, (ops.SparseTensor, ops.SparseTensorValue)): + if not isinstance( + hypothesis, (sparse_tensor.SparseTensor, + sparse_tensor.SparseTensorValue)): raise TypeError("Hypothesis must be a SparseTensor.") - if not isinstance(truth, (ops.SparseTensor, ops.SparseTensorValue)): + if not isinstance( + truth, (sparse_tensor.SparseTensor, + sparse_tensor.SparseTensorValue)): raise TypeError("Truth must be a SparseTensor.") return gen_array_ops._edit_distance(hypothesis.indices, @@ -2022,9 +2053,15 @@ def _FakeQuantWithMinMaxArgsGradient(op, grad): ops.RegisterShape("FakeQuantWithMinMaxArgs")(common_shapes.call_cpp_shape_fn) +ops.RegisterShape("FakeQuantWithMinMaxArgsGradient")( + common_shapes.call_cpp_shape_fn) ops.RegisterShape("FakeQuantWithMinMaxVars")(common_shapes.call_cpp_shape_fn) +ops.RegisterShape("FakeQuantWithMinMaxVarsGradient")( + common_shapes.call_cpp_shape_fn) ops.RegisterShape("FakeQuantWithMinMaxVarsPerChannel")( common_shapes.call_cpp_shape_fn) +ops.RegisterShape("FakeQuantWithMinMaxVarsPerChannelGradient")( + common_shapes.call_cpp_shape_fn) @ops.RegisterGradient("FakeQuantWithMinMaxVars") @@ -2516,3 +2553,49 @@ def _QuantizedReshapeShape(op): ops.RegisterShape("QuantizeV2")(None) ops.RegisterShape("QuantizedBatchNormWithGlobalNormalization")(None) ops.RegisterShape("QuantizedConcat")(None) + + +@ops.RegisterShape("ScatterNd") +def _ScatterNdShape(op): + """Shape function for the ScatterNd op. + + The shape of the ouput is defined as a parameter on the Operation. + + Args: + op: A ScatterNd Operation. + + Returns: + A single-element list containing the shape of the output. 
+ + Raises: + ValueError: if the arguments have invalid rank. + """ + indices_shape = op.inputs[0].get_shape() + updates_shape = op.inputs[1].get_shape() + output_shape = tensor_util.constant_value_as_shape(op.inputs[2]) + + if output_shape.num_elements() == 0 and not ( + indices_shape.num_elements() in + (None, 0) and updates_shape.num_elements() in (None, 0)): + raise ValueError("Indices and updates specified for empty output shape") + + if indices_shape.ndims is not None and output_shape is not None: + outer_dims = len(indices_shape) - 1 + ixdim = indices_shape[-1].value or 0 + + if not indices_shape[:outer_dims].is_compatible_with( + updates_shape[:outer_dims]): + raise ValueError("The outer %d dimensions of indices.shape=%s must " + "match the outer %d dimensions of updates.shape=%s" % ( + outer_dims, indices_shape, outer_dims, + updates_shape)) + if output_shape.ndims is not None: + if not output_shape[ixdim:].is_compatible_with(updates_shape[ + outer_dims:]): + raise ValueError("The inner %d dimensions of output.shape=%s must " + "match the inner %d dimensions of updates.shape=%s" % ( + len(output_shape)-ixdim, output_shape, + len(updates_shape)-outer_dims, updates_shape)) + + return [output_shape] + return [None]
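In words, the two checks above are: indices.shape[:-1] must be compatible with updates.shape[:outer_dims], and output_shape[ixdim:] must be compatible with updates.shape[outer_dims:]. A worked example of shapes that pass both checks (values illustrative):

import tensorflow as tf

# indices: (4, 1) -> outer_dims = 1, ixdim = 1
# updates: (4, 3) -> leading (4,) matches indices' leading (4,)
# output:  [5, 3] -> trailing (3,) matches updates' trailing (3,)
indices = tf.constant([[0], [2], [4], [2]])
updates = tf.ones([4, 3])
scattered = tf.scatter_nd(indices, updates, tf.constant([5, 3]))
print(scattered.get_shape())  # (5, 3), inferred without running the op

diff --git a/tensorflow/python/ops/candidate_sampling_ops.py b/tensorflow/python/ops/candidate_sampling_ops.py index a1cd8d803ef..b27167df542 100644 --- a/tensorflow/python/ops/candidate_sampling_ops.py +++ b/tensorflow/python/ops/candidate_sampling_ops.py @@ -13,7 +13,7 @@ # limitations under the License. # ============================================================================== -"""Wrappers for primitive Neural Net (NN) Operations.""" +"""Wrappers for candidate sampling operations.""" from __future__ import absolute_import from __future__ import division diff --git a/tensorflow/python/ops/check_ops.py b/tensorflow/python/ops/check_ops.py index cee1ff47ff0..d4e8e02dec5 100644 --- a/tensorflow/python/ops/check_ops.py +++ b/tensorflow/python/ops/check_ops.py @@ -42,6 +42,7 @@ import numpy as np from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.framework import tensor_util from tensorflow.python.ops import array_ops from tensorflow.python.ops import control_flow_ops @@ -88,7 +89,7 @@ def assert_proper_iterable(values): `Tensor`, `SparseTensor`, `np.array`, `tf.compat.bytes_or_text_types`.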
""" unintentional_iterables = ( - (ops.Tensor, ops.SparseTensor, np.ndarray) + (ops.Tensor, sparse_tensor.SparseTensor, np.ndarray) + compat.bytes_or_text_types ) if isinstance(values, unintentional_iterables): diff --git a/tensorflow/python/ops/control_flow_grad.py b/tensorflow/python/ops/control_flow_grad.py index 55f335120cf..b9750c87826 100644 --- a/tensorflow/python/ops/control_flow_grad.py +++ b/tensorflow/python/ops/control_flow_grad.py @@ -21,6 +21,7 @@ from __future__ import print_function from six.moves import xrange # pylint: disable=redefined-builtin from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import control_flow_ops from tensorflow.python.ops import math_ops # go/tf-wildcard-import @@ -149,7 +150,7 @@ def _ExitGrad(op, grad): if isinstance(grad, ops.Tensor): grad_ctxt.AddName(grad.name) else: - if not isinstance(grad, (ops.IndexedSlices, ops.SparseTensor)): + if not isinstance(grad, (ops.IndexedSlices, sparse_tensor.SparseTensor)): raise TypeError("Type %s not supported" % type(grad)) grad_ctxt.AddName(grad.values.name) grad_ctxt.AddName(grad.indices.name) diff --git a/tensorflow/python/ops/control_flow_ops.py b/tensorflow/python/ops/control_flow_ops.py index bfe5a78ac3c..ec66532afb0 100644 --- a/tensorflow/python/ops/control_flow_ops.py +++ b/tensorflow/python/ops/control_flow_ops.py @@ -80,6 +80,7 @@ from tensorflow.python.framework import common_shapes from tensorflow.python.framework import constant_op from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.framework import tensor_shape from tensorflow.python.ops import array_ops from tensorflow.python.ops import gen_array_ops @@ -165,7 +166,7 @@ def _Identity(data, name=None): else: return array_ops.identity(data, name=name) else: - if not isinstance(data, (ops.IndexedSlices, ops.SparseTensor)): + if not isinstance(data, (ops.IndexedSlices, sparse_tensor.SparseTensor)): raise TypeError("Type %s not supported" % type(data)) values = _Identity(data.values, name=name) indices = array_ops.identity(data.indices, name="indices") @@ -176,7 +177,7 @@ def _Identity(data, name=None): return ops.IndexedSlices(values, indices, dense_shape) else: dense_shape = array_ops.identity(data.shape, name="dense_shape") - return ops.SparseTensor(indices, values, dense_shape) + return sparse_tensor.SparseTensor(indices, values, dense_shape) def _NextIteration(data, name=None): @@ -187,7 +188,7 @@ def _NextIteration(data, name=None): else: return next_iteration(data, name=name) else: - if not isinstance(data, (ops.IndexedSlices, ops.SparseTensor)): + if not isinstance(data, (ops.IndexedSlices, sparse_tensor.SparseTensor)): raise TypeError("Type %s not supported" % type(data)) values = _NextIteration(data.values, name=name) indices = next_iteration(data.indices, name="indices") @@ -198,7 +199,7 @@ def _NextIteration(data, name=None): return ops.IndexedSlices(values, indices, dense_shape) else: dense_shape = next_iteration(data.shape, name="dense_shape") - return ops.SparseTensor(indices, values, dense_shape) + return sparse_tensor.SparseTensor(indices, values, dense_shape) def _Enter(data, frame_name, is_constant=False, parallel_iterations=10, @@ -233,7 +234,7 @@ def _Enter(data, frame_name, is_constant=False, parallel_iterations=10, result.set_shape(data.get_shape()) return result else: - if not isinstance(data, (ops.IndexedSlices, ops.SparseTensor)): + 
if not isinstance(data, (ops.IndexedSlices, sparse_tensor.SparseTensor)): raise TypeError("Type %s not supported" % type(data)) values = _Enter(data.values, frame_name, is_constant, parallel_iterations=parallel_iterations, @@ -255,7 +256,7 @@ def _Enter(data, frame_name, is_constant=False, parallel_iterations=10, parallel_iterations, name="dense_shape") if use_input_shape: dense_shape.set_shape(data.shape.get_shape()) - return ops.SparseTensor(indices, values, dense_shape) + return sparse_tensor.SparseTensor(indices, values, dense_shape) def exit(data, name=None): @@ -277,7 +278,7 @@ def exit(data, name=None): else: return gen_control_flow_ops._exit(data, name) else: - if not isinstance(data, (ops.IndexedSlices, ops.SparseTensor)): + if not isinstance(data, (ops.IndexedSlices, sparse_tensor.SparseTensor)): raise TypeError("Type %s not supported" % type(data)) values = exit(data.values, name=name) indices = gen_control_flow_ops._exit(data.indices, name="indices") @@ -288,7 +289,7 @@ def exit(data, name=None): return ops.IndexedSlices(values, indices, dense_shape) else: dense_shape = gen_control_flow_ops._exit(data.shape, name) - return ops.SparseTensor(indices, values, dense_shape) + return sparse_tensor.SparseTensor(indices, values, dense_shape) def switch(data, pred, dtype=None, name=None): @@ -317,7 +318,7 @@ def switch(data, pred, dtype=None, name=None): if isinstance(data, ops.Tensor): return gen_control_flow_ops._switch(data, pred, name=name) else: - if not isinstance(data, (ops.IndexedSlices, ops.SparseTensor)): + if not isinstance(data, (ops.IndexedSlices, sparse_tensor.SparseTensor)): raise TypeError("Type %s not supported" % type(data)) val, ind = data.values, data.indices val_f, val_t = gen_control_flow_ops._switch(val, pred, name=name) @@ -335,8 +336,8 @@ def switch(data, pred, dtype=None, name=None): dense_shape = data.shape dense_shape_f, dense_shape_t = gen_control_flow_ops._switch( data.shape, pred, name="dense_shape") - return (ops.SparseTensor(ind_f, val_f, dense_shape_f), - ops.SparseTensor(ind_t, val_t, dense_shape_t)) + return (sparse_tensor.SparseTensor(ind_f, val_f, dense_shape_f), + sparse_tensor.SparseTensor(ind_t, val_t, dense_shape_t)) def _SwitchRefOrTensor(data, pred, name="Switch"): @@ -418,14 +419,15 @@ def merge(inputs, name=None): return gen_control_flow_ops._ref_merge(inputs, name) else: return gen_control_flow_ops._merge(inputs, name) - elif all([isinstance(v, ops.SparseTensor) for v in inputs]): + elif all([isinstance(v, sparse_tensor.SparseTensor) for v in inputs]): # Only handle the case when all inputs are SparseTensor. values, _ = merge([inp.values for inp in inputs], name=name) indices, chosen_index = gen_control_flow_ops._merge( [inp.indices for inp in inputs], name="indices") dense_shape, _ = gen_control_flow_ops._merge( [inp.shape for inp in inputs], name="dense_shape") - return ops.SparseTensor(indices, values, dense_shape), chosen_index + return (sparse_tensor.SparseTensor(indices, values, dense_shape), + chosen_index) else: # For now convert all the inputs as IndexedSlices. 
inputs = math_ops._as_indexed_slices_list(inputs, optimize=False) @@ -533,7 +535,7 @@ def _SetShapeInvariants(input_vars, enter_vars, shapes): % (inp.name, inp.get_shape(), shape)) var.set_shape(shape) else: - if not isinstance(var, (ops.IndexedSlices, ops.SparseTensor)): + if not isinstance(var, (ops.IndexedSlices, sparse_tensor.SparseTensor)): raise TypeError("Type %s not supported" % type(var)) if isinstance(var, ops.IndexedSlices): if not _ShapeLessThanOrEqual(inp.values.get_shape(), shape): @@ -584,7 +586,7 @@ def _EnforceShapeInvariant(merge_var, next_var): "argument of tf.while_loop or set_shape() on the loop variables." % (merge_var.name, m_shape, n_shape)) else: - if not isinstance(var, (ops.IndexedSlices, ops.SparseTensor)): + if not isinstance(var, (ops.IndexedSlices, sparse_tensor.SparseTensor)): raise TypeError("Type %s not supported" % type(var)) if isinstance(var, ops.IndexedSlices): m_values_shape = merge_var.values.get_shape() @@ -645,8 +647,8 @@ def _AddNextAndBackEdge(m, v): if v.dense_shape is None: raise ValueError("Must have dense shape: %s" % v.name) m.dense_shape.op._update_input(1, v.dense_shape) - elif isinstance(m, ops.SparseTensor): - if not isinstance(v, ops.SparseTensor): + elif isinstance(m, sparse_tensor.SparseTensor): + if not isinstance(v, sparse_tensor.SparseTensor): raise ValueError("Must be a sparse tensor: %s" % v.name) v = _NextIteration(v) # pylint: disable=protected-access @@ -1687,7 +1689,7 @@ class CondContext(ControlFlowContext): # Use pivot as the proxy for this op. real_v = with_dependencies([v], self._pivot) else: - if isinstance(v, (ops.IndexedSlices, ops.SparseTensor)): + if isinstance(v, (ops.IndexedSlices, sparse_tensor.SparseTensor)): values = self._ProcessOutputTensor(v.values) indices = self._ProcessOutputTensor(v.indices) if isinstance(v, ops.IndexedSlices): @@ -1697,7 +1699,7 @@ class CondContext(ControlFlowContext): real_v = ops.IndexedSlices(values, indices, dense_shape) else: dense_shape = self._ProcessOutputTensor(v.shape) - real_v = ops.SparseTensor(indices, values, dense_shape) + real_v = sparse_tensor.SparseTensor(indices, values, dense_shape) else: real_v = self._ProcessOutputTensor(v) result.append(real_v) @@ -1791,8 +1793,8 @@ def cond(pred, fn1, fn2, name=None): for x, y in zip(res_f, res_t): assert ((isinstance(x, ops.IndexedSlices) and isinstance(y, ops.IndexedSlices)) or - (isinstance(x, ops.SparseTensor) and - isinstance(y, ops.SparseTensor)) or + (isinstance(x, sparse_tensor.SparseTensor) and + isinstance(y, sparse_tensor.SparseTensor)) or (isinstance(x, ops.Tensor) and isinstance(y, ops.Tensor))) val_x = x if isinstance(x, ops.Tensor) else x.values val_y = y if isinstance(y, ops.Tensor) else y.values @@ -2356,7 +2358,7 @@ class WhileContext(ControlFlowContext): self._values.add(x.indices.name) if isinstance(x, ops.IndexedSlices): dense_shape = x.dense_shape - elif isinstance(x, ops.SparseTensor): + elif isinstance(x, sparse_tensor.SparseTensor): dense_shape = x.shape else: raise TypeError("Type %s not supported" % type(x)) @@ -2487,7 +2489,7 @@ class WhileContext(ControlFlowContext): if isinstance(e, ops.Tensor): xs = [e] else: - if not isinstance(e, (ops.IndexedSlices, ops.SparseTensor)): + if not isinstance(e, (ops.IndexedSlices, sparse_tensor.SparseTensor)): raise TypeError("Type %s not supported" % type(e)) xs = [e.values, e.indices] shape = e.dense_shape if isinstance(e, ops.IndexedSlices) else e.shape diff --git a/tensorflow/python/ops/ctc_ops.py b/tensorflow/python/ops/ctc_ops.py index 97b9cecc9e9..cce72d71dc9 
100644 --- a/tensorflow/python/ops/ctc_ops.py +++ b/tensorflow/python/ops/ctc_ops.py @@ -21,6 +21,7 @@ from __future__ import print_function from tensorflow.python.framework import common_shapes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import gen_ctc_ops from tensorflow.python.ops import array_ops @@ -29,7 +30,8 @@ from tensorflow.python.ops.nn_grad import _BroadcastMul # pylint: disable=protected-access, invalid-name def ctc_loss(inputs, labels, sequence_length, - preprocess_collapse_repeated=False, ctc_merge_repeated=True, time_major=True): + preprocess_collapse_repeated=False, + ctc_merge_repeated=True, time_major=True): """Computes the CTC (Connectionist Temporal Classification) Loss. This op implements the CTC loss as presented in the article: @@ -128,7 +130,7 @@ def ctc_loss(inputs, labels, sequence_length, """ # The second, third, etc. output tensors contain the gradients. We use it in # _CTCLossGrad() below. - if not isinstance(labels, ops.SparseTensor): + if not isinstance(labels, sparse_tensor.SparseTensor): raise TypeError("Expected labels to be a SparseTensor") # For internal calculations, we transpose to [time, batch, num_classes] @@ -206,7 +208,7 @@ def ctc_greedy_decoder(inputs, sequence_length, merge_repeated=True): outputs = gen_ctc_ops._ctc_greedy_decoder( inputs, sequence_length, merge_repeated=merge_repeated) (decoded_ix, decoded_val, decoded_shape, log_probabilities) = outputs - return ([ops.SparseTensor(decoded_ix, decoded_val, decoded_shape)], + return ([sparse_tensor.SparseTensor(decoded_ix, decoded_val, decoded_shape)], log_probabilities) @@ -258,7 +260,7 @@ def ctc_beam_search_decoder(inputs, sequence_length, beam_width=100, merge_repeated=merge_repeated)) return ( - [ops.SparseTensor(ix, val, shape) for (ix, val, shape) + [sparse_tensor.SparseTensor(ix, val, shape) for (ix, val, shape) in zip(decoded_ixs, decoded_vals, decoded_shapes)], log_probabilities)
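With this change both CTC decoders hand back first-class SparseTensor objects (now from the sparse_tensor module). A minimal decoding sketch (shapes and num_classes assumed, not taken from this patch):

import tensorflow as tf

# logits: [max_time, batch_size, num_classes]; lengths: [batch_size]
logits = tf.placeholder(tf.float32, [None, None, 10])
lengths = tf.placeholder(tf.int32, [None])

decoded, log_prob = tf.nn.ctc_greedy_decoder(logits, lengths)
# decoded is a single-element list of tf.SparseTensor label sequences.
dense_labels = tf.sparse_tensor_to_dense(decoded[0], default_value=-1)

diff --git a/tensorflow/python/ops/embedding_ops.py b/tensorflow/python/ops/embedding_ops.py index 2e2365e4303..b6e252829ca 100644 --- a/tensorflow/python/ops/embedding_ops.py +++ b/tensorflow/python/ops/embedding_ops.py @@ -23,6 +23,7 @@ from six.moves import xrange # pylint: disable=redefined-builtin from tensorflow.python.framework import constant_op from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import data_flow_ops from tensorflow.python.ops import math_ops @@ -257,11 +258,11 @@ def embedding_lookup_sparse(params, sp_ids, sp_weights, params = list(params) # Iterate to get the underlying Variables.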
if not isinstance(params, list): params = [params] - if not isinstance(sp_ids, ops.SparseTensor): + if not isinstance(sp_ids, sparse_tensor.SparseTensor): raise TypeError("sp_ids must be SparseTensor") ignore_weights = sp_weights is None if not ignore_weights: - if not isinstance(sp_weights, ops.SparseTensor): + if not isinstance(sp_weights, sparse_tensor.SparseTensor): raise TypeError("sp_weights must be either None or SparseTensor") sp_ids.values.get_shape().assert_is_compatible_with( sp_weights.values.get_shape()) diff --git a/tensorflow/python/ops/functional_ops.py b/tensorflow/python/ops/functional_ops.py index 8ef05b03344..f0a21178d18 100644 --- a/tensorflow/python/ops/functional_ops.py +++ b/tensorflow/python/ops/functional_ops.py @@ -33,6 +33,7 @@ from __future__ import print_function from tensorflow.python.framework import common_shapes from tensorflow.python.framework import constant_op from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.framework import tensor_shape from tensorflow.python.ops import array_ops from tensorflow.python.ops import control_flow_ops @@ -301,7 +302,7 @@ def map_fn(fn, elems, dtype=None, parallel_iterations=10, back_prop=True, if not callable(fn): raise TypeError("fn must be callable.") - if isinstance(elems, ops.SparseTensor): + if isinstance(elems, sparse_tensor.SparseTensor): raise TypeError( "To perform a map on the values of a sparse tensor use either " " SparseTensor(input.indices, fn(input.values), input.shape) or " diff --git a/tensorflow/python/ops/gradients.py b/tensorflow/python/ops/gradients.py index 870fed3e188..921fd50aa9f 100644 --- a/tensorflow/python/ops/gradients.py +++ b/tensorflow/python/ops/gradients.py @@ -18,814 +18,17 @@ from __future__ import absolute_import from __future__ import division from __future__ import print_function -import collections -import contextlib -import warnings - -import numpy as np -import six -from six.moves import xrange # pylint: disable=redefined-builtin - -from tensorflow.core.framework import attr_value_pb2 -from tensorflow.python.framework import constant_op -from tensorflow.python.framework import dtypes -from tensorflow.python.framework import ops -from tensorflow.python.framework import tensor_shape -from tensorflow.python.framework import tensor_util -from tensorflow.python.ops import array_grad # pylint: disable=unused-import -from tensorflow.python.ops import array_ops -from tensorflow.python.ops import control_flow_grad # pylint: disable=unused-import -from tensorflow.python.ops import control_flow_ops -from tensorflow.python.ops import image_grad # pylint: disable=unused-import -from tensorflow.python.ops import logging_ops # pylint: disable=unused-import -from tensorflow.python.ops import linalg_grad # pylint: disable=unused-import -from tensorflow.python.ops import math_grad # pylint: disable=unused-import -from tensorflow.python.ops import math_ops -from tensorflow.python.ops import linalg_ops -from tensorflow.python.ops import functional_ops - -from tensorflow.python.platform import tf_logging as logging - -# Warn the user if we convert a sparse representation to dense with at -# least this number of elements. -_LARGE_SPARSE_NUM_ELEMENTS = 100000000 - - -def _IndexedSlicesToTensor(value, dtype=None, name=None, as_ref=False): - """Converts an IndexedSlices object `value` to a Tensor. - - NOTE(mrry): This function is potentially expensive. - - Args: - value: An ops.IndexedSlices object. 
- dtype: The dtype of the Tensor to be returned. - name: Optional name to use for the returned Tensor. - as_ref: True if a ref is requested. - - Returns: - A dense Tensor representing the values in the given IndexedSlices. - - Raises: - ValueError: If the IndexedSlices does not have the same dtype. - """ - _ = as_ref - if dtype and not dtype.is_compatible_with(value.dtype): - raise ValueError( - "Tensor conversion requested dtype %s for IndexedSlices with dtype %s" % - (dtype.name, value.dtype.name)) - if value.dense_shape is None: - raise ValueError( - "Tensor conversion requested for IndexedSlices without dense_shape: %s" - % str(value)) - # TODO(mrry): Consider adding static shape information to - # IndexedSlices, to avoid using numpy here. - dense_shape_value = tensor_util.constant_value(value.dense_shape) - if dense_shape_value is not None: - num_elements = np.prod(dense_shape_value) - if num_elements >= _LARGE_SPARSE_NUM_ELEMENTS: - warnings.warn( - "Converting sparse IndexedSlices to a dense Tensor with %d elements. " - "This may consume a large amount of memory." % num_elements) - else: - warnings.warn( - "Converting sparse IndexedSlices to a dense Tensor of unknown shape. " - "This may consume a large amount of memory.") - return math_ops.unsorted_segment_sum( - value.values, value.indices, value.dense_shape[0], name=name) - - -ops.register_tensor_conversion_function(ops.IndexedSlices, - _IndexedSlicesToTensor) - - -def _MarkReachedOps(from_ops, reached_ops): - """Mark all ops reached from "from_ops". - - Args: - from_ops: list of Operations. - reached_ops: list of booleans, indexed by operation id. - """ - queue = collections.deque() - queue.extend(from_ops) - while queue: - op = queue.popleft() - if not reached_ops[op._id]: - reached_ops[op._id] = True - for output in op.outputs: - queue.extend(output.consumers()) - - -def _GatherInputs(to_ops, reached_ops): - """List all inputs of to_ops that are in reached_ops. - - Args: - to_ops: list of Operations. - reached_ops: list of booleans, indexed by operation id. - - Returns: - The list of all inputs of to_ops that are in reached_ops. - That list includes all elements of to_ops. - """ - inputs = [] - queue = collections.deque() - queue.extend(to_ops) - while queue: - op = queue.popleft() - # We are interested in this op. - if reached_ops[op._id]: - inputs.append(op) - # Clear the boolean so we won't add the inputs again. - reached_ops[op._id] = False - for inp in op.inputs: - queue.append(inp.op) - return inputs - - -def _PendingCount(graph, to_ops, from_ops, colocate_gradients_with_ops): - """Initialize the pending count for ops between two lists of Operations. - - 'pending_count[op._id]' indicates the number of backprop inputs - to this operation. - - Args: - graph: a Graph. - to_ops: list of Operations. - from_ops: list of Operations. - colocate_gradients_with_ops: Python bool. See docstring of gradients(). - - Returns: - A tuple containing: (1) a list of integers indexed by operation id, - indicating the number of backprop inputs to this operation, and (2) - a ControlFlowState object which is not None if the ops between from_ops - and to_ops contain control flow loops. - """ - # Mark reachable ops from from_ops. - reached_ops = [False] * (graph._last_id + 1) - for op in to_ops: - reached_ops[op._id] = True - _MarkReachedOps(from_ops, reached_ops) - - # Mark between ops. 
- between_ops = [False] * (graph._last_id + 1) - between_op_list = [] - queue = collections.deque() - queue.extend(to_ops) - while queue: - op = queue.popleft() - # We are interested in this op. - if reached_ops[op._id]: - between_ops[op._id] = True - between_op_list.append(op) - # Clear the boolean so we won't add the inputs again. - reached_ops[op._id] = False - for inp in op.inputs: - queue.append(inp.op) - - # 'loop_state' is None if there are no while loops. - loop_state = control_flow_ops.MaybeCreateControlFlowState( - between_op_list, between_ops, colocate_gradients_with_ops) - - # Initialize pending count for between ops. - pending_count = [0] * (graph._last_id + 1) - for op in between_op_list: - for x in op.inputs: - if between_ops[x.op._id]: - pending_count[x.op._id] += 1 - - return pending_count, loop_state - - -def _AsList(x): - return x if isinstance(x, (list, tuple)) else [x] - - -def _DefaultGradYs(grad_ys, ys, colocate_gradients_with_ops): - """Fill in default values for grad_ys. - - Args: - grad_ys: List of gradients, can contain None. - ys: List of tensors. - colocate_gradients_with_ops: If True, try colocating gradients with - the corresponding op. - - Returns: - A list of gradients to use, without None. - - Raises: - ValueError: If one of the grad_ys is invalid. - """ - if len(grad_ys) != len(ys): - raise ValueError("Passed %d grad_ys for %d ys" % (len(grad_ys), len(ys))) - grad_ys = ops.convert_n_to_tensor_or_indexed_slices(grad_ys, name="grad_y") - for i in xrange(len(grad_ys)): - grad_y = grad_ys[i] - y = ys[i] - if grad_y is None: - with _maybe_colocate_with(y.op, colocate_gradients_with_ops): - grad_ys[i] = array_ops.fill( - array_ops.shape(y), constant_op.constant( - 1, dtype=y.dtype)) - else: - if grad_y.dtype != y.dtype: - raise ValueError("Y and ys_grad must be of the same type, " - "not y: %s, ys_grad: %s " % - (dtypes.as_dtype(y.dtype).name, - dtypes.as_dtype(grad_y.dtype).name)) - return grad_ys - - -def _IsTrainable(tensor): - dtype = dtypes.as_dtype(tensor.dtype) - return dtype.base_dtype in (dtypes.float16, dtypes.float32, dtypes.float64, - dtypes.complex64, dtypes.complex128) - - -def _VerifyGeneratedGradients(grads, op): - """Verify that gradients are valid in number and type. - - Args: - grads: List of generated gradients. - op: Operation for which the gradients were generated. - - Raises: - ValueError: if the gradients are invalid. - """ - if len(grads) != len(op.inputs): - raise ValueError("Num gradients %d generated for op %s do not match num " - "inputs %d" % (len(grads), op.node_def, len(op.inputs))) - for i in xrange(len(grads)): - grad = grads[i] - inp = op.inputs[i] - if grad is not None: - if not grad.dtype.is_compatible_with(inp.dtype): - raise ValueError("Gradient type %s generated for op %s does " - "not match input type %s" % - (dtypes.as_dtype(grad.dtype).name, op.node_def, - dtypes.as_dtype(inp.dtype).name)) - - -def _StopOps(from_ops, pending_count): - """The set of ops that terminate the gradient computation. - - This computes the frontier of the forward graph *before* which backprop - should stop. Operations in the returned set will not be differentiated. - This set is defined as the subset of `from_ops` containing ops that have - no predecessor in `from_ops`. `pending_count` is the result of - `_PendingCount(g, xs, from_ops)`. An 'op' has predecessors in `from_ops` - iff pending_count[op._id] > 0. - - Args: - from_ops: list of Operations. - pending_count: List of integers, indexed by operation id.
- - Returns: - The set of operations. - """ - stop_ops = set() - for op in from_ops: - is_stop_op = True - for inp in op.inputs: - if pending_count[inp.op._id] > 0: - is_stop_op = False - break - if is_stop_op: - stop_ops.add(op._id) - return stop_ops - - -@contextlib.contextmanager -def _maybe_colocate_with(op, colocate_gradients_with_ops): - """Context to colocate with `op` if `colocate_gradients_with_ops`.""" - if colocate_gradients_with_ops: - with ops.colocate_with(op): - yield - else: - yield - - -def _SymGrad(op, out_grads): - """Backprop through a function call node op given its outputs' gradients.""" - f_in = [x for x in op.inputs] + out_grads - f_types = [x.dtype for x in op.inputs] - f = attr_value_pb2.NameAttrList() - f.name = op.type - for k in op.node_def.attr: - f.attr[k].CopyFrom(op.node_def.attr[k]) - # pylint: disable=protected-access - in_grads = functional_ops._symbolic_gradient(input=f_in, Tout=f_types, f=f) - # pylint: enable=protected-access - return in_grads - - -def gradients(ys, - xs, - grad_ys=None, - name="gradients", - colocate_gradients_with_ops=False, - gate_gradients=False, - aggregation_method=None): - """Constructs symbolic partial derivatives of sum of `ys` w.r.t. x in `xs`. - - `ys` and `xs` are each a `Tensor` or a list of tensors. `grad_ys` - is a list of `Tensor`, holding the gradients received by the - `ys`. The list must be the same length as `ys`. - - `gradients()` adds ops to the graph to output the partial - derivatives of `ys` with respect to `xs`. It returns a list of - `Tensor` of length `len(xs)` where each tensor is the `sum(dy/dx)` - for y in `ys`. - - `grad_ys` is a list of tensors of the same length as `ys` that holds - the initial gradients for each y in `ys`. When `grad_ys` is None, - we fill in a tensor of '1's of the shape of y for each y in `ys`. A - user can provide their own initial `grad_ys` to compute the - derivatives using a different initial gradient for each y (e.g., if - one wanted to weight the gradient differently for each value in - each y). - - Args: - ys: A `Tensor` or list of tensors to be differentiated. - xs: A `Tensor` or list of tensors to be used for differentiation. - grad_ys: Optional. A `Tensor` or list of tensors the same size as - `ys` and holding the gradients computed for each y in `ys`. - name: Optional name to use for grouping all the gradient ops together. - Defaults to 'gradients'. - colocate_gradients_with_ops: If True, try colocating gradients with - the corresponding op. - gate_gradients: If True, add a tuple around the gradients returned - for an operation. This avoids some race conditions. - aggregation_method: Specifies the method used to combine gradient terms. - Accepted values are constants defined in the class `AggregationMethod`. - - Returns: - A list of `sum(dy/dx)` for each x in `xs`. - - Raises: - LookupError: if one of the operations between `x` and `y` does not - have a registered gradient function. - ValueError: if the arguments are invalid. - - """ - ys = _AsList(ys) - xs = _AsList(xs) - if grad_ys is None: - grad_ys = [None] * len(ys) - else: - grad_ys = _AsList(grad_ys) - - with ops.name_scope(name, "gradients", ys + xs + grad_ys): - ys = ops.convert_n_to_tensor_or_indexed_slices(ys, name="y") - xs = ops.convert_n_to_tensor_or_indexed_slices(xs, name="x") - grad_ys = _DefaultGradYs(grad_ys, ys, colocate_gradients_with_ops) -
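A caller-level note on the docstring above (this code is being deleted here, but the documented semantics are unchanged): grad_ys seeds the backward pass with custom initial gradients instead of ones, and aggregation_method picks how multiple gradient contributions are combined. A small sketch of both knobs against the public API (values illustrative):

import tensorflow as tf

x = tf.Variable([1.0, 2.0])
y = 3.0 * x

# Seed dy/dx with [0.5, 2.0] instead of ones, and combine any repeated
# contributions with the default AddN aggregation.
g = tf.gradients([y], [x],
                 grad_ys=[tf.constant([0.5, 2.0])],
                 aggregation_method=tf.AggregationMethod.ADD_N)[0]
# After initialization, g evaluates to [1.5, 6.0].

- # The approach we take here is as follows: Create a list of all ops in the - # subgraph between the ys and xs.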
Visit these ops in reverse order of ids - # to ensure that when we visit an op the gradients w.r.t. its outputs have - # been collected. Then aggregate these gradients if needed, call the op's - # gradient function, and add the generated gradients to the gradients for - # its input. - - # Initialize the pending count for ops in the connected subgraph from ys - # to the xs. - to_ops = [t.op for t in ys] - from_ops = [t.op for t in xs] - pending_count, loop_state = _PendingCount(ops.get_default_graph(), to_ops, - from_ops, - colocate_gradients_with_ops) - - # Iterate over the collected ops. - # - # grads: op => list of gradients received on each output endpoint of the - # op. The gradients for each endpoint are initially collected as a list. - # When it is time to call the op's gradient function, for each endpoint we - # aggregate the list of received gradients into an Add() Operation if there - # is more than one. - grads = {} - - # Add the initial gradients for the ys. - for y, grad_y in zip(ys, grad_ys): - _SetGrad(grads, y, grad_y) - - # Initialize queue with to_ops. - queue = collections.deque() - # Add the ops in 'to_ops' into the queue. - to_ops_set = set() - for op in to_ops: - # 'ready' handles the case where one output gradient relies on - # another output's gradient. - # pylint: disable=protected-access - ready = (pending_count[op._id] == 0) - if ready and op._id not in to_ops_set: - to_ops_set.add(op._id) - queue.append(op) - # pylint: enable=protected-access - - if loop_state: - loop_exits = loop_state.ProcessUnusedLoopExits(pending_count, to_ops_set) - for y in loop_exits: - if _IsTrainable(y): - _SetGrad(grads, y, loop_state.ZerosLikeForExit(y)) - queue.append(y.op) - - # The set of 'from_ops'. - stop_ops = _StopOps(from_ops, pending_count) - while queue: - # generate gradient subgraph for op. - op = queue.popleft() - with _maybe_colocate_with(op, colocate_gradients_with_ops): - if loop_state: - loop_state.EnterGradWhileContext(op, before=True) - out_grads = _AggregatedGrads(grads, op, loop_state, aggregation_method) - if loop_state: - loop_state.ExitGradWhileContext(op, before=True) - - grad_fn = None - # pylint: disable=protected-access - is_func_call = ops.get_default_graph()._is_function(op.type) - has_out_grads = any(isinstance(g, ops.Tensor) or g for g in out_grads) - if has_out_grads and (op._id not in stop_ops): - if is_func_call: - grad_fn = ops.get_default_graph()._get_function( - op.type).python_grad_func - # pylint: enable=protected-access - else: - # A grad_fn must be defined, either as a function or as None - # for ops that do not have gradients. - try: - grad_fn = ops.get_gradient_function(op) - except LookupError: - raise LookupError( - "No gradient defined for operation '%s' (op type: %s)" % - (op.name, op.type)) - if loop_state: - loop_state.EnterGradWhileContext(op, before=False) - if (grad_fn or is_func_call) and has_out_grads: - # NOTE: If _AggregatedGrads didn't compute a value for the i'th - # output, it means that the cost does not depend on output[i], - # therefore dC/doutput[i] is 0. - for i, out_grad in enumerate(out_grads): - if (not isinstance(out_grad, ops.Tensor) and - not out_grad) and _IsTrainable(op.outputs[i]): - # Only floating-point outputs get a zero gradient. Gradient - # functions should ignore the gradient for other outputs.
- if loop_state: - out_grads[i] = loop_state.ZerosLike(op, i) - else: - out_grads[i] = control_flow_ops.ZerosLikeOutsideLoop(op, i) - with ops.name_scope(op.name + "_grad"): - # pylint: disable=protected-access - with ops.get_default_graph()._original_op(op): - # pylint: enable=protected-access - if grad_fn: - # If grad_fn was found, do not use SymbolicGradient even for - # functions. - in_grads = grad_fn(op, *out_grads) - else: - # For function call ops, we add a 'SymbolicGradient' - # node to the graph to compute gradients. - in_grads = _SymGrad(op, out_grads) - in_grads = _AsList(in_grads) - _VerifyGeneratedGradients(in_grads, op) - if gate_gradients and len( - [x for x in in_grads if x is not None]) > 1: - in_grads = control_flow_ops.tuple(in_grads) - _LogOpGradients(op, out_grads, in_grads) - else: - # If no grad_fn is defined or none of out_grads is available, - # just propagate a list of None backwards. - in_grads = [None] * len(op.inputs) - for t_in, in_grad in zip(op.inputs, in_grads): - if in_grad is not None: - if isinstance(in_grad, ops.Tensor): - in_grad.set_shape(t_in.get_shape()) - _SetGrad(grads, t_in, in_grad) - if loop_state: - loop_state.ExitGradWhileContext(op, before=False) - - # Update pending count for the inputs of op and enqueue ready ops. - _UpdatePendingAndEnqueueReady(grads, op, queue, pending_count, loop_state) - - if loop_state: - loop_state.PostProcessing() - return [_GetGrad(grads, x) for x in xs] - - -def _HasAnyNotNoneGrads(grads, op): - """Return true iff op has real gradient.""" - out_grads = _GetGrads(grads, op) - for out_grad in out_grads: - if isinstance(out_grad, (ops.Tensor, ops.IndexedSlices)): - return True - if out_grad and isinstance(out_grad, collections.Sequence): - if any([g is not None for g in out_grad]): - return True - return False - - -def _UpdatePendingAndEnqueueReady(grads, op, queue, pending_count, loop_state): - """Update pending count for the inputs of op and enqueue ready ops.""" - for x in op.inputs: - # pylint: disable=protected-access - pending_count[x.op._id] -= 1 - ready = (pending_count[x.op._id] == 0) - if loop_state and not ready: - ready = (pending_count[x.op._id] > 0 and - control_flow_ops.IsLoopSwitch(x.op)) - # pylint: enable=protected-access - if ready: - if control_flow_ops.IsLoopExit(x.op): - # if x is an exit without real gradient, defer processing it. - grad_state = loop_state.GetGradState(x.op, before=False) - grad_state.deferred_exits.append(x) - grad_state.pending_exits_count -= 1 - if grad_state.pending_exits_count == 0: - # We now have all the exits so process them. - has_real_grad = False - for y in grad_state.deferred_exits: - if _HasAnyNotNoneGrads(grads, y.op): - has_real_grad = True - queue.append(y.op) - else: - grad_state.unused_exits.append(y) - if has_real_grad: - # For an unused exit, if it has floating-point outputs, backprop - # a zero gradient. Otherwise, just ignore it. - for y in grad_state.unused_exits: - if _IsTrainable(y): - _SetGrad(grads, y, loop_state.ZerosLikeForExit(y)) - queue.append(y.op) - else: - # All exits are "unused" so use None as gradient.
- for y in grad_state.unused_exits: - queue.append(y.op) - else: - queue.append(x.op) - - -def _SetGrad(grads, t, grad): - """Sets gradient "grad" in "grads" for tensor "t".""" - op = t.op - op_grads = grads.get(op) - if not op_grads: - op_grads = [[] for _ in xrange(len(op.outputs))] - grads[op] = op_grads - t_grads = op_grads[t.value_index] - if isinstance(t_grads, list): - t_grads.append(grad) - else: - assert control_flow_ops.IsLoopSwitch(op) - op_grads[t.value_index] = grad - - -def _GetGrad(grads, t): - """Gets gradient for tensor "t".""" - op = t.op - op_grads = grads.get(op) - if not op_grads: - return None - t_grad = op_grads[t.value_index] - assert not isinstance(t_grad, list), ( - "gradients list should have been aggregated by now.") - return t_grad - - -def _GetGrads(grads, op): - """Gets all gradients for op.""" - if op in grads: - return grads[op] - else: - return [[] for _ in xrange(len(op.outputs))] - - -def _HandleNestedIndexedSlices(grad): - assert isinstance(grad, ops.IndexedSlices) - if isinstance(grad.values, ops.Tensor): - return grad - else: - assert isinstance(grad.values, ops.IndexedSlices) - g = _HandleNestedIndexedSlices(grad.values) - return ops.IndexedSlices(g.values, - array_ops.gather(grad.indices, g.indices), - g.dense_shape) - - -def _AccumulatorShape(inputs): - shape = tensor_shape.unknown_shape() - for i in inputs: - if isinstance(i, ops.Tensor): - shape = shape.merge_with(i.get_shape()) - return shape - - -def _LogOpGradients(op, out_grads, in_grads): - """Log the in and out grads of an op.""" - logging.vlog(1, "Gradient for '" + op.name + "'") - - def _FilterGrad(x): - if x is None: - return False - if isinstance(x, (list, tuple)): - return bool(x) - else: - return True - - logging.vlog(1, " in --> %s", - ", ".join([x.name for x in out_grads if _FilterGrad(x)])) - logging.vlog(1, " out --> %s", - ", ".join([x.name for x in in_grads if _FilterGrad(x)])) - - -def _MultiDeviceAddN(tensor_list): - """Adds tensors from potentially multiple devices.""" - # Basic function structure comes from control_flow_ops.group(). - # Sort tensors according to their devices. - tensors_on_device = collections.defaultdict(lambda: []) - for tensor in tensor_list: - tensors_on_device[tensor.device].append(tensor) - - # For each device, add the tensors on that device first. - # Then gather the partial sums from multiple devices. - # TODO(sjhwang): Create hierarchical aggregation tree as pbar's suggestion. - # E.g., aggregate per GPU, then per task, and so on. - summands = [] - - def DeviceKey(dev): - return "" if dev is None else dev - - for dev in sorted(six.iterkeys(tensors_on_device), key=DeviceKey): - tensors = tensors_on_device[dev] - with ops.colocate_with(tensors[0].op, ignore_existing=True): - summands.append(math_ops.add_n(tensors)) - - return math_ops.add_n(summands) - - -class AggregationMethod(object): - """A class listing aggregation methods used to combine gradients. - - Computing partial derivatives can require aggregating gradient - contributions. This class lists the various methods that can - be used to combine gradients in the graph: - - * `ADD_N`: All of the gradient terms are summed as part of one - operation using the "AddN" op. It has the property that all - gradients must be ready before any aggregation is performed. - * `DEFAULT`: The system-chosen default aggregation method. - """ - ADD_N = 0 - DEFAULT = ADD_N - # The following are experimental and may not be supported in future releases. 
- EXPERIMENTAL_TREE = 1 - EXPERIMENTAL_ACCUMULATE_N = 2 - - -def _AggregatedGrads(grads, op, loop_state, aggregation_method=None): - """Get the aggregated gradients for op. - - Args: - grads: The map of memoized gradients. - op: The op to get gradients for. - loop_state: An object for maintaining the state of the while loops in the - graph. It is of type ControlFlowState. None if the graph - contains no while loops. - aggregation_method: Specifies the method used to combine gradient terms. - Accepted values are constants defined in the class `AggregationMethod`. - - Returns: - A list of gradients, one per each output of `op`. If the gradients - for a particular output is a list, this function aggregates it - before returning. - - Raises: - TypeError: if the incoming grads are not Tensors or IndexedSlices. - ValueError: if the arguments are invalid. - - """ - if aggregation_method is None: - aggregation_method = AggregationMethod.DEFAULT - if aggregation_method not in [ - AggregationMethod.ADD_N, AggregationMethod.EXPERIMENTAL_TREE, - AggregationMethod.EXPERIMENTAL_ACCUMULATE_N - ]: - raise ValueError("Invalid aggregation_method specified %s." % - aggregation_method) - out_grads = _GetGrads(grads, op) - for i, out_grad in enumerate(out_grads): - if loop_state: - if isinstance(out_grad, (ops.Tensor, ops.IndexedSlices)): - assert control_flow_ops.IsLoopSwitch(op) - continue - # Grads have to be Tensors or IndexedSlices - if (isinstance(out_grad, collections.Sequence) and not all([ - isinstance(g, (ops.Tensor, ops.IndexedSlices)) for g in out_grad - if g is not None - ])): - raise TypeError("gradients have to be either all Tensors " - "or all IndexedSlices") - # Aggregate multiple gradients, and convert [] to None. - if out_grad: - if len(out_grad) < 2: - used = "nop" - out_grads[i] = out_grad[0] - elif all([isinstance(g, ops.Tensor) for g in out_grad if g is not None]): - tensor_shape = _AccumulatorShape(out_grad) - if (aggregation_method == AggregationMethod.EXPERIMENTAL_ACCUMULATE_N - and len(out_grad) > 2 and tensor_shape.is_fully_defined()): - # The benefit of using AccumulateN is that its inputs can be combined - # in any order and this can allow the expression to be evaluated with - # a smaller memory footprint. When used with gpu_allocator_retry, - # it is possible to compute a sum of terms which are much larger than - # total GPU memory. - # AccumulateN can currently only be used if we know the shape for - # an accumulator variable. If this is not known, or if we only have - # 2 grads then we fall through to the "tree" case below. - used = "accumulate_n" - out_grads[i] = math_ops.accumulate_n(out_grad) - elif aggregation_method in [ - AggregationMethod.EXPERIMENTAL_TREE, - AggregationMethod.EXPERIMENTAL_ACCUMULATE_N - ]: - # Aggregate all gradients by doing pairwise sums: this may - # reduce performance, but it can improve memory because the - # gradients can be released earlier. - # - # TODO(vrv): Consider replacing this with a version of - # tf.AddN() that eagerly frees its inputs as soon as they are - # ready, so the order of this tree does not become a problem. 
- used = "tree" - with ops.name_scope(op.name + "_gradient_sum"): - running_sum = out_grad[0] - for grad in out_grad[1:]: - running_sum = math_ops.add_n([running_sum, grad]) - out_grads[i] = running_sum - else: - used = "add_n" - out_grads[i] = _MultiDeviceAddN(out_grad) - logging.vlog(2, " _AggregatedGrads %d x %s using %s", - len(out_grad), tensor_shape, used) - else: - out_grad = math_ops._as_indexed_slices_list( - [g for g in out_grad if g is not None]) - out_grad = [_HandleNestedIndexedSlices(x) for x in out_grad] - # Form IndexedSlices out of the concatenated values and - # indices. - out_grads[i] = ops.IndexedSlices( - array_ops.concat(0, [x.values for x in out_grad]), - array_ops.concat(0, [x.indices for x in out_grad]), - out_grad[0].dense_shape) - else: - out_grads[i] = [] - return out_grads - - -# TODO(vrv): Make this available when we want to make it public. -def _hessian_vector_product(ys, xs, v): - """Multiply the Hessian of `ys` wrt `xs` by `v`. - - This is an efficient construction that uses a backprop-like approach - to compute the product between the Hessian and another vector. The - Hessian is usually too large to be explicitly computed or even - represented, but this method allows us to at least multiply by it - for the same big-O cost as backprop. - - Implicit Hessian-vector products are the main practical, scalable way - of using second derivatives with neural networks. They allow us to - do things like construct Krylov subspaces and approximate conjugate - gradient descent. - - Example: if `y` = 1/2 `x`^T A `x`, then `hessian_vector_product(y, - x, v)` will return an expression that evaluates to the same values - as (A + A.T) `v`. - - Args: - ys: A scalar value, or a tensor or list of tensors to be summed to - yield a scalar. - xs: A list of tensors that we should construct the Hessian over. - v: A list of tensors, with the same shapes as xs, that we want to - multiply by the Hessian. - - Returns: - A list of tensors (or if the list would be length 1, a single tensor) - containing the product between the Hessian and `v`. - - Raises: - ValueError: `xs` and `v` have different length. - - """ - - # Validate the input - length = len(xs) - if len(v) != length: - raise ValueError("xs and v must have the same length.") - - # First backprop - grads = gradients(ys, xs) - - assert len(grads) == length - elemwise_products = [ - math_ops.mul(grad_elem, array_ops.stop_gradient(v_elem)) - for grad_elem, v_elem in zip(grads, v) if grad_elem is not None - ] - - # Second backprop - return gradients(elemwise_products, xs) +# pylint: disable=unused-import +from tensorflow.python.ops.gradients_impl import AggregationMethod +from tensorflow.python.ops.gradients_impl import gradients +from tensorflow.python.ops.gradients_impl import hessians +# pylint: enable=unused-import +from tensorflow.python.util.all_util import remove_undocumented + +_allowed_symbols = [ + # TODO(drpng): find a good place to reference this. + "AggregationMethod", + "gradients", # tf.gradients.gradients. + "hessians", # tf.gradients.hessians +] +remove_undocumented(__name__, _allowed_symbols) diff --git a/tensorflow/python/ops/gradients_impl.py b/tensorflow/python/ops/gradients_impl.py new file mode 100644 index 00000000000..5db3dd77228 --- /dev/null +++ b/tensorflow/python/ops/gradients_impl.py @@ -0,0 +1,895 @@ +# Copyright 2015 The TensorFlow Authors. All Rights Reserved. +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== +"""Implements the graph generation for computation of gradients.""" + +from __future__ import absolute_import +from __future__ import division +from __future__ import print_function + +import collections +import contextlib +import warnings + +import numpy as np +import six +from six.moves import xrange # pylint: disable=redefined-builtin + +from tensorflow.core.framework import attr_value_pb2 +from tensorflow.python.framework import constant_op +from tensorflow.python.framework import dtypes +from tensorflow.python.framework import ops +from tensorflow.python.framework import tensor_shape +from tensorflow.python.framework import tensor_util +from tensorflow.python.ops import array_grad # pylint: disable=unused-import +from tensorflow.python.ops import array_ops +from tensorflow.python.ops import control_flow_grad # pylint: disable=unused-import +from tensorflow.python.ops import control_flow_ops +from tensorflow.python.ops import image_grad # pylint: disable=unused-import +from tensorflow.python.ops import logging_ops # pylint: disable=unused-import +from tensorflow.python.ops import linalg_grad # pylint: disable=unused-import +from tensorflow.python.ops import math_grad # pylint: disable=unused-import +from tensorflow.python.ops import math_ops +from tensorflow.python.ops import linalg_ops +from tensorflow.python.ops import functional_ops +from tensorflow.python.platform import tf_logging as logging + + +# Warn the user if we convert a sparse representation to dense with at +# least this number of elements. +_LARGE_SPARSE_NUM_ELEMENTS = 100000000 + + +def _IndexedSlicesToTensor(value, dtype=None, name=None, as_ref=False): + """Converts an IndexedSlices object `value` to a Tensor. + + NOTE(mrry): This function is potentially expensive. + + Args: + value: An ops.IndexedSlices object. + dtype: The dtype of the Tensor to be returned. + name: Optional name to use for the returned Tensor. + as_ref: True if a ref is requested. + + Returns: + A dense Tensor representing the values in the given IndexedSlices. + + Raises: + ValueError: If the IndexedSlices does not have the same dtype. + """ + _ = as_ref + if dtype and not dtype.is_compatible_with(value.dtype): + raise ValueError( + "Tensor conversion requested dtype %s for IndexedSlices with dtype %s" % + (dtype.name, value.dtype.name)) + if value.dense_shape is None: + raise ValueError( + "Tensor conversion requested for IndexedSlices without dense_shape: %s" + % str(value)) + # TODO(mrry): Consider adding static shape information to + # IndexedSlices, to avoid using numpy here. + dense_shape_value = tensor_util.constant_value(value.dense_shape) + if dense_shape_value is not None: + num_elements = np.prod(dense_shape_value) + if num_elements >= _LARGE_SPARSE_NUM_ELEMENTS: + warnings.warn( + "Converting sparse IndexedSlices to a dense Tensor with %d elements. " + "This may consume a large amount of memory." % num_elements) + else: + warnings.warn( + "Converting sparse IndexedSlices to a dense Tensor of unknown shape. 
" + "This may consume a large amount of memory.") + return math_ops.unsorted_segment_sum( + value.values, value.indices, value.dense_shape[0], name=name) + + +ops.register_tensor_conversion_function(ops.IndexedSlices, + _IndexedSlicesToTensor) + + +def _MarkReachedOps(from_ops, reached_ops): + """Mark all ops reached from "from_ops". + + Args: + from_ops: list of Operations. + reached_ops: list of booleans, indexed by operation id. + """ + queue = collections.deque() + queue.extend(from_ops) + while queue: + op = queue.popleft() + if not reached_ops[op._id]: + reached_ops[op._id] = True + for output in op.outputs: + queue.extend(output.consumers()) + + +def _GatherInputs(to_ops, reached_ops): + """List all inputs of to_ops that are in reached_ops. + + Args: + to_ops: list of Operations. + reached_ops: list of booleans, indexed by operation id. + + Returns: + The list of all inputs of to_ops that are in reached_ops. + That list includes all elements of to_ops. + """ + inputs = [] + queue = collections.deque() + queue.extend(to_ops) + while queue: + op = queue.popleft() + # We are interested in this op. + if reached_ops[op._id]: + inputs.append(op) + # Clear the boolean so we won't add the inputs again. + reached_ops[op._id] = False + for inp in op.inputs: + queue.append(inp.op) + return inputs + + +def _PendingCount(graph, to_ops, from_ops, colocate_gradients_with_ops): + """Initialize the pending count for ops between two lists of Operations. + + 'pending_count[op._id]' indicates the number of backprop inputs + to this operation. + + Args: + graph: a Graph. + to_ops: list of Operations. + from_ops: list of Operations. + colocate_gradients_with_ops: Python bool. See docstring of gradients(). + + Returns: + A tuple containing: (1) a list of integers indexed by operation id, + indicating the number of backprop inputs to this operation, and (2) + a ControlFlowState object which is not None if the ops between from_ops + and to_ops contain control flow loops. + """ + # Mark reachable ops from from_ops. + reached_ops = [False] * (graph._last_id + 1) + for op in to_ops: + reached_ops[op._id] = True + _MarkReachedOps(from_ops, reached_ops) + + # Mark between ops. + between_ops = [False] * (graph._last_id + 1) + between_op_list = [] + queue = collections.deque() + queue.extend(to_ops) + while queue: + op = queue.popleft() + # We are interested in this op. + if reached_ops[op._id]: + between_ops[op._id] = True + between_op_list.append(op) + # Clear the boolean so we won't add the inputs again. + reached_ops[op._id] = False + for inp in op.inputs: + queue.append(inp.op) + + # 'loop_state' is None if there are no while loops. + loop_state = control_flow_ops.MaybeCreateControlFlowState( + between_op_list, between_ops, colocate_gradients_with_ops) + + # Initialize pending count for between ops. + pending_count = [0] * (graph._last_id + 1) + for op in between_op_list: + for x in op.inputs: + if between_ops[x.op._id]: + pending_count[x.op._id] += 1 + + return pending_count, loop_state + + +def _AsList(x): + return x if isinstance(x, (list, tuple)) else [x] + + +def _DefaultGradYs(grad_ys, ys, colocate_gradients_with_ops): + """Fill in default values for grad_ys. + + Args: + grad_ys: List of gradients, can contain None. + ys: List of tensors. + colocate_gradients_with_ops: If True, try colocating gradients with + the corresponding op. + + Returns: + A list of gradients to use, without None. + + Raises: + ValueError: If one of the grad_ys is invalid. 
+ """ + if len(grad_ys) != len(ys): + raise ValueError("Passed %d grad_ys for %d ys" % (len(grad_ys), len(ys))) + grad_ys = ops.convert_n_to_tensor_or_indexed_slices(grad_ys, name="grad_y") + for i in xrange(len(grad_ys)): + grad_y = grad_ys[i] + y = ys[i] + if grad_y is None: + with _maybe_colocate_with(y.op, colocate_gradients_with_ops): + grad_ys[i] = array_ops.fill( + array_ops.shape(y), constant_op.constant( + 1, dtype=y.dtype)) + else: + if grad_y.dtype != y.dtype: + raise ValueError("Y and ys_grad must be of the same type, " + "not y: %s, ys_grad: %s " % + (dtypes.as_dtype(y.dtype).name, + dtypes.as_dtype(grad_y.dtype).name)) + return grad_ys + + +def _IsTrainable(tensor): + dtype = dtypes.as_dtype(tensor.dtype) + return dtype.base_dtype in (dtypes.float16, dtypes.float32, dtypes.float64, + dtypes.complex64, dtypes.complex128) + + +def _VerifyGeneratedGradients(grads, op): + """Verify that gradients are valid in number and type. + + Args: + grads: List of generated gradients. + op: Operation for which the gradients where generated. + + Raises: + ValueError: if the gradients are invalid. + """ + if len(grads) != len(op.inputs): + raise ValueError("Num gradients %d generated for op %s do not match num " + "inputs %d" % (len(grads), op.node_def, len(op.inputs))) + for i in xrange(len(grads)): + grad = grads[i] + inp = op.inputs[i] + if grad is not None: + if not grad.dtype.is_compatible_with(inp.dtype): + raise ValueError("Gradient type %s generated for op %s does " + "not match input type %s" % + (dtypes.as_dtype(grad.dtype).name, op.node_def, + dtypes.as_dtype(inp.dtype).name)) + + +def _StopOps(from_ops, pending_count): + """The set of ops that terminate the gradient computation. + + This computes the frontier of the forward graph *before* which backprop + should stop. Operations in the returned set will not be differentiated. + This set is defined as the subset of `from_ops` containing ops that have + no predecessor in `from_ops`. `pending_count` is the result of + `_PendingCount(g, xs, from_ops)`. An 'op' has predecessors in `from_ops` + iff pending_count[op._id] > 0. + + Args: + from_ops: list of Operations. + pending_count: List of integers, indexed by operation id. + + Returns: + The set of operations. + """ + stop_ops = set() + for op in from_ops: + is_stop_op = True + for inp in op.inputs: + if pending_count[inp.op._id] > 0: + is_stop_op = False + break + if is_stop_op: + stop_ops.add(op._id) + return stop_ops + + +@contextlib.contextmanager +def _maybe_colocate_with(op, colocate_gradients_with_ops): + """Context to colocate with `op` if `colocate_gradients_with_ops`.""" + if colocate_gradients_with_ops: + with ops.colocate_with(op): + yield + else: + yield + + +def _SymGrad(op, out_grads): + """Backprop through a function call node op given its outputs' gradients.""" + f_in = [x for x in op.inputs] + out_grads + f_types = [x.dtype for x in op.inputs] + f = attr_value_pb2.NameAttrList() + f.name = op.type + for k in op.node_def.attr: + f.attr[k].CopyFrom(op.node_def.attr[k]) + # pylint: disable=protected-access + in_grads = functional_ops._symbolic_gradient(input=f_in, Tout=f_types, f=f) + # pylint: enable=protected-access + return in_grads + + +def gradients(ys, + xs, + grad_ys=None, + name="gradients", + colocate_gradients_with_ops=False, + gate_gradients=False, + aggregation_method=None): + """Constructs symbolic partial derivatives of sum of `ys` w.r.t. x in `xs`. + + `ys` and `xs` are each a `Tensor` or a list of tensors. 
`grad_ys` + is a list of `Tensor`, holding the gradients received by the + `ys`. The list must be the same length as `ys`. + + `gradients()` adds ops to the graph to output the partial + derivatives of `ys` with respect to `xs`. It returns a list of + `Tensor` of length `len(xs)` where each tensor is the `sum(dy/dx)` + for y in `ys`. + + `grad_ys` is a list of tensors of the same length as `ys` that holds + the initial gradients for each y in `ys`. When `grad_ys` is None, + we fill in a tensor of '1's of the shape of y for each y in `ys`. A + user can provide their own initial `grad_ys` to compute the + derivatives using a different initial gradient for each y (e.g., if + one wanted to weight the gradient differently for each value in + each y). + + Args: + ys: A `Tensor` or list of tensors to be differentiated. + xs: A `Tensor` or list of tensors to be used for differentiation. + grad_ys: Optional. A `Tensor` or list of tensors the same size as + `ys` and holding the gradients computed for each y in `ys`. + name: Optional name to use for grouping all the gradient ops together. + defaults to 'gradients'. + colocate_gradients_with_ops: If True, try colocating gradients with + the corresponding op. + gate_gradients: If True, add a tuple around the gradients returned + for an operations. This avoids some race conditions. + aggregation_method: Specifies the method used to combine gradient terms. + Accepted values are constants defined in the class `AggregationMethod`. + + Returns: + A list of `sum(dy/dx)` for each x in `xs`. + + Raises: + LookupError: if one of the operations between `x` and `y` does not + have a registered gradient function. + ValueError: if the arguments are invalid. + + """ + ys = _AsList(ys) + xs = _AsList(xs) + if grad_ys is None: + grad_ys = [None] * len(ys) + else: + grad_ys = _AsList(grad_ys) + + with ops.name_scope(name, "gradients", ys + xs + grad_ys): + ys = ops.convert_n_to_tensor_or_indexed_slices(ys, name="y") + xs = ops.convert_n_to_tensor_or_indexed_slices(xs, name="x") + grad_ys = _DefaultGradYs(grad_ys, ys, colocate_gradients_with_ops) + + # The approach we take here is as follows: Create a list of all ops in the + # subgraph between the ys and xs. Visit these ops in reverse order of ids + # to ensure that when we visit an op the gradients w.r.t its outputs have + # been collected. Then aggregate these gradients if needed, call the op's + # gradient function, and add the generated gradients to the gradients for + # its input. + + # Initialize the pending count for ops in the connected subgraph from ys + # to the xs. + to_ops = [t.op for t in ys] + from_ops = [t.op for t in xs] + pending_count, loop_state = _PendingCount(ops.get_default_graph(), to_ops, + from_ops, + colocate_gradients_with_ops) + + # Iterate over the collected ops. + # + # grads: op => list of gradients received on each output endpoint of the + # op. The gradients for each endpoint are initially collected as a list. + # When it is time to call the op's gradient function, for each endpoint we + # aggregate the list of received gradients into a Add() Operation if there + # is more than one. + grads = {} + + # Add the initial gradients for the ys. + for y, grad_y in zip(ys, grad_ys): + _SetGrad(grads, y, grad_y) + + # Initialize queue with to_ops. + queue = collections.deque() + # Add the ops in 'to_ops' into the queue. + to_ops_set = set() + for op in to_ops: + # 'ready' handles the case where one output gradient relies on + # another output's gradient. 
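A minimal sketch of the grad_ys behavior described in the docstring above (TF 0.11-era API): seeding backprop with per-element initial gradients instead of the implicit ones.

import tensorflow as tf

x = tf.constant([1.0, 2.0, 3.0])
y = 2.0 * x
w = tf.constant([0.1, 1.0, 10.0])
# d(sum(w * 2x))/dx == 2 * w, so each y is weighted differently.
g = tf.gradients(y, [x], grad_ys=[w])[0]

with tf.Session() as sess:
    print(sess.run(g))   # [0.2, 2.0, 20.0]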
+ # pylint: disable=protected-access + ready = (pending_count[op._id] == 0) + if ready and op._id not in to_ops_set: + to_ops_set.add(op._id) + queue.append(op) + # pylint: enable=protected-access + + if loop_state: + loop_exits = loop_state.ProcessUnusedLoopExits(pending_count, to_ops_set) + for y in loop_exits: + if _IsTrainable(y): + _SetGrad(grads, y, loop_state.ZerosLikeForExit(y)) + queue.append(y.op) + + # The set of 'from_ops'. + stop_ops = _StopOps(from_ops, pending_count) + while queue: + # generate gradient subgraph for op. + op = queue.popleft() + with _maybe_colocate_with(op, colocate_gradients_with_ops): + if loop_state: + loop_state.EnterGradWhileContext(op, before=True) + out_grads = _AggregatedGrads(grads, op, loop_state, aggregation_method) + if loop_state: + loop_state.ExitGradWhileContext(op, before=True) + + grad_fn = None + # pylint: disable=protected-access + is_func_call = ops.get_default_graph()._is_function(op.type) + has_out_grads = any(isinstance(g, ops.Tensor) or g for g in out_grads) + if has_out_grads and (op._id not in stop_ops): + if is_func_call: + grad_fn = ops.get_default_graph()._get_function( + op.type).python_grad_func + # pylint: enable=protected-access + else: + # A grad_fn must be defined, either as a function or as None + # for ops that do not have gradients. + try: + grad_fn = ops.get_gradient_function(op) + except LookupError: + raise LookupError( + "No gradient defined for operation '%s' (op type: %s)" % + (op.name, op.type)) + if loop_state: + loop_state.EnterGradWhileContext(op, before=False) + if (grad_fn or is_func_call) and has_out_grads: + # NOTE: If _AggregatedGrads didn't compute a value for the i'th + # output, it means that the cost does not depend on output[i], + # therefore dC/doutput[i] is 0. + for i, out_grad in enumerate(out_grads): + if (not isinstance(out_grad, ops.Tensor) and + not out_grad) and _IsTrainable(op.outputs[i]): + # Only floating-point outputs get a zero gradient. Gradient + # functions should ignore the gradient for other outputs. + if loop_state: + out_grads[i] = loop_state.ZerosLike(op, i) + else: + out_grads[i] = control_flow_ops.ZerosLikeOutsideLoop(op, i) + with ops.name_scope(op.name + "_grad"): + # pylint: disable=protected-access + with ops.get_default_graph()._original_op(op): + # pylint: enable=protected-access + if grad_fn: + # If grad_fn was found, do not use SymbolicGradient even for + # functions. + in_grads = grad_fn(op, *out_grads) + else: + # For function call ops, we add a 'SymbolicGradient' + # node to the graph to compute gradients. + in_grads = _SymGrad(op, out_grads) + in_grads = _AsList(in_grads) + _VerifyGeneratedGradients(in_grads, op) + if gate_gradients and len( + [x for x in in_grads if x is not None]) > 1: + in_grads = control_flow_ops.tuple(in_grads) + _LogOpGradients(op, out_grads, in_grads) + else: + # If no grad_fn is defined or none of out_grads is available, + # just propagates a list of None backwards. + in_grads = [None] * len(op.inputs) + for t_in, in_grad in zip(op.inputs, in_grads): + if in_grad is not None: + if isinstance(in_grad, ops.Tensor): + in_grad.set_shape(t_in.get_shape()) + _SetGrad(grads, t_in, in_grad) + if loop_state: + loop_state.ExitGradWhileContext(op, before=False) + + # Update pending count for the inputs of op and enqueue ready ops. 
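The queue discipline above dequeues an op only once gradients for all of its consumed outputs have arrived, which is what the pending counts track. A library-free sketch of the same scheduling on a toy four-op graph (names are illustrative only):

import collections

# Toy forward graph: x feeds a and b, and both feed y.
consumers = {"x": ["a", "b"], "a": ["y"], "b": ["y"], "y": []}
producers = {"x": [], "a": ["x"], "b": ["x"], "y": ["a", "b"]}

pending = {op: len(outs) for op, outs in consumers.items()}
queue = collections.deque(["y"])   # backprop starts at the output op
order = []
while queue:
    op = queue.popleft()
    order.append(op)               # safe to visit: all out-grads are ready
    for inp in producers[op]:
        pending[inp] -= 1
        if pending[inp] == 0:
            queue.append(inp)

print(order)   # ['y', 'a', 'b', 'x'] -- x waits until both a and b are done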
+ _UpdatePendingAndEnqueueReady(grads, op, queue, pending_count, loop_state) + + if loop_state: + loop_state.PostProcessing() + return [_GetGrad(grads, x) for x in xs] + + +def _HasAnyNotNoneGrads(grads, op): + """Return true iff op has real gradient.""" + out_grads = _GetGrads(grads, op) + for out_grad in out_grads: + if isinstance(out_grad, (ops.Tensor, ops.IndexedSlices)): + return True + if out_grad and isinstance(out_grad, collections.Sequence): + if any([g is not None for g in out_grad]): + return True + return False + + +def _UpdatePendingAndEnqueueReady(grads, op, queue, pending_count, loop_state): + """Update pending count for the inputs of op and enqueue ready ops.""" + for x in op.inputs: + # pylint: disable=protected-access + pending_count[x.op._id] -= 1 + ready = (pending_count[x.op._id] == 0) + if loop_state and not ready: + ready = (pending_count[x.op._id] > 0 and + control_flow_ops.IsLoopSwitch(x.op)) + # pylint: enable=protected-access + if ready: + if control_flow_ops.IsLoopExit(x.op): + # if x is an exit without real gradient, defer processing them. + grad_state = loop_state.GetGradState(x.op, before=False) + grad_state.deferred_exits.append(x) + grad_state.pending_exits_count -= 1 + if grad_state.pending_exits_count == 0: + # We now have all the exits so process them. + has_real_grad = False + for y in grad_state.deferred_exits: + if _HasAnyNotNoneGrads(grads, y.op): + has_real_grad = True + queue.append(y.op) + else: + grad_state.unused_exits.append(y) + if has_real_grad: + # For an unused exit, if it has floating-point outputs, backprop + # a zero gradient. Otherwise, just ignore it. + for y in grad_state.unused_exits: + if _IsTrainable(y): + _SetGrad(grads, y, loop_state.ZerosLikeForExit(y)) + queue.append(y.op) + else: + # All exits are "unused" so use None as gradient. 
+ for y in grad_state.unused_exits: + queue.append(y.op) + else: + queue.append(x.op) + + +def _SetGrad(grads, t, grad): + """Sets gradient "grad" in "grads" for tensor "t".""" + op = t.op + op_grads = grads.get(op) + if not op_grads: + op_grads = [[] for _ in xrange(len(op.outputs))] + grads[op] = op_grads + t_grads = op_grads[t.value_index] + if isinstance(t_grads, list): + t_grads.append(grad) + else: + assert control_flow_ops.IsLoopSwitch(op) + op_grads[t.value_index] = grad + + +def _GetGrad(grads, t): + """Gets gradient for tensor "t".""" + op = t.op + op_grads = grads.get(op) + if not op_grads: + return None + t_grad = op_grads[t.value_index] + assert not isinstance(t_grad, list), ( + "gradients list should have been aggregated by now.") + return t_grad + + +def _GetGrads(grads, op): + """Gets all gradients for op.""" + if op in grads: + return grads[op] + else: + return [[] for _ in xrange(len(op.outputs))] + + +def _HandleNestedIndexedSlices(grad): + assert isinstance(grad, ops.IndexedSlices) + if isinstance(grad.values, ops.Tensor): + return grad + else: + assert isinstance(grad.values, ops.IndexedSlices) + g = _HandleNestedIndexedSlices(grad.values) + return ops.IndexedSlices(g.values, + array_ops.gather(grad.indices, g.indices), + g.dense_shape) + + +def _AccumulatorShape(inputs): + shape = tensor_shape.unknown_shape() + for i in inputs: + if isinstance(i, ops.Tensor): + shape = shape.merge_with(i.get_shape()) + return shape + + +def _LogOpGradients(op, out_grads, in_grads): + """Log the in and out grads of an op.""" + logging.vlog(1, "Gradient for '" + op.name + "'") + + def _FilterGrad(x): + if x is None: + return False + if isinstance(x, (list, tuple)): + return bool(x) + else: + return True + + logging.vlog(1, " in --> %s", + ", ".join([x.name for x in out_grads if _FilterGrad(x)])) + logging.vlog(1, " out --> %s", + ", ".join([x.name for x in in_grads if _FilterGrad(x)])) + + +def _MultiDeviceAddN(tensor_list): + """Adds tensors from potentially multiple devices.""" + # Basic function structure comes from control_flow_ops.group(). + # Sort tensors according to their devices. + tensors_on_device = collections.defaultdict(lambda: []) + for tensor in tensor_list: + tensors_on_device[tensor.device].append(tensor) + + # For each device, add the tensors on that device first. + # Then gather the partial sums from multiple devices. + # TODO(sjhwang): Create hierarchical aggregation tree as pbar's suggestion. + # E.g., aggregate per GPU, then per task, and so on. + summands = [] + + def DeviceKey(dev): + return "" if dev is None else dev + + for dev in sorted(six.iterkeys(tensors_on_device), key=DeviceKey): + tensors = tensors_on_device[dev] + with ops.colocate_with(tensors[0].op, ignore_existing=True): + summands.append(math_ops.add_n(tensors)) + + return math_ops.add_n(summands) + + +class AggregationMethod(object): + """A class listing aggregation methods used to combine gradients. + + Computing partial derivatives can require aggregating gradient + contributions. This class lists the various methods that can + be used to combine gradients in the graph: + + * `ADD_N`: All of the gradient terms are summed as part of one + operation using the "AddN" op. It has the property that all + gradients must be ready before any aggregation is performed. + * `DEFAULT`: The system-chosen default aggregation method. + """ + ADD_N = 0 + DEFAULT = ADD_N + # The following are experimental and may not be supported in future releases. 
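A sketch of selecting one of the aggregation strategies listed above when a tensor feeds several consumers, so its gradient arrives as multiple terms (TF 0.11-era API; AggregationMethod is re-exported publicly by the shim):

import tensorflow as tf

x = tf.constant(2.0)
y = x * x + 3.0 * x + tf.sin(x)   # three ops consume x: three gradient terms
g = tf.gradients(
    y, [x], aggregation_method=tf.AggregationMethod.EXPERIMENTAL_TREE)[0]

with tf.Session() as sess:
    print(sess.run(g))   # 2*x + 3 + cos(x), evaluated at x = 2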
+ EXPERIMENTAL_TREE = 1 + EXPERIMENTAL_ACCUMULATE_N = 2 + + +def _AggregatedGrads(grads, op, loop_state, aggregation_method=None): + """Get the aggregated gradients for op. + + Args: + grads: The map of memoized gradients. + op: The op to get gradients for. + loop_state: An object for maintaining the state of the while loops in the + graph. It is of type ControlFlowState. None if the graph + contains no while loops. + aggregation_method: Specifies the method used to combine gradient terms. + Accepted values are constants defined in the class `AggregationMethod`. + + Returns: + A list of gradients, one per each output of `op`. If the gradients + for a particular output is a list, this function aggregates it + before returning. + + Raises: + TypeError: if the incoming grads are not Tensors or IndexedSlices. + ValueError: if the arguments are invalid. + + """ + if aggregation_method is None: + aggregation_method = AggregationMethod.DEFAULT + if aggregation_method not in [ + AggregationMethod.ADD_N, AggregationMethod.EXPERIMENTAL_TREE, + AggregationMethod.EXPERIMENTAL_ACCUMULATE_N + ]: + raise ValueError("Invalid aggregation_method specified %s." % + aggregation_method) + out_grads = _GetGrads(grads, op) + for i, out_grad in enumerate(out_grads): + if loop_state: + if isinstance(out_grad, (ops.Tensor, ops.IndexedSlices)): + assert control_flow_ops.IsLoopSwitch(op) + continue + # Grads have to be Tensors or IndexedSlices + if (isinstance(out_grad, collections.Sequence) and not all([ + isinstance(g, (ops.Tensor, ops.IndexedSlices)) for g in out_grad + if g is not None + ])): + raise TypeError("gradients have to be either all Tensors " + "or all IndexedSlices") + # Aggregate multiple gradients, and convert [] to None. + if out_grad: + if len(out_grad) < 2: + used = "nop" + out_grads[i] = out_grad[0] + elif all([isinstance(g, ops.Tensor) for g in out_grad if g is not None]): + tensor_shape = _AccumulatorShape(out_grad) + if (aggregation_method == AggregationMethod.EXPERIMENTAL_ACCUMULATE_N + and len(out_grad) > 2 and tensor_shape.is_fully_defined()): + # The benefit of using AccumulateN is that its inputs can be combined + # in any order and this can allow the expression to be evaluated with + # a smaller memory footprint. When used with gpu_allocator_retry, + # it is possible to compute a sum of terms which are much larger than + # total GPU memory. + # AccumulateN can currently only be used if we know the shape for + # an accumulator variable. If this is not known, or if we only have + # 2 grads then we fall through to the "tree" case below. + used = "accumulate_n" + out_grads[i] = math_ops.accumulate_n(out_grad) + elif aggregation_method in [ + AggregationMethod.EXPERIMENTAL_TREE, + AggregationMethod.EXPERIMENTAL_ACCUMULATE_N + ]: + # Aggregate all gradients by doing pairwise sums: this may + # reduce performance, but it can improve memory because the + # gradients can be released earlier. + # + # TODO(vrv): Consider replacing this with a version of + # tf.AddN() that eagerly frees its inputs as soon as they are + # ready, so the order of this tree does not become a problem. 
+ used = "tree" + with ops.name_scope(op.name + "_gradient_sum"): + running_sum = out_grad[0] + for grad in out_grad[1:]: + running_sum = math_ops.add_n([running_sum, grad]) + out_grads[i] = running_sum + else: + used = "add_n" + out_grads[i] = _MultiDeviceAddN(out_grad) + logging.vlog(2, " _AggregatedGrads %d x %s using %s", + len(out_grad), tensor_shape, used) + else: + out_grad = math_ops._as_indexed_slices_list( + [g for g in out_grad if g is not None]) + out_grad = [_HandleNestedIndexedSlices(x) for x in out_grad] + # Form IndexedSlices out of the concatenated values and + # indices. + out_grads[i] = ops.IndexedSlices( + array_ops.concat(0, [x.values for x in out_grad]), + array_ops.concat(0, [x.indices for x in out_grad]), + out_grad[0].dense_shape) + else: + out_grads[i] = [] + return out_grads + + +# TODO(vrv): Make this available when we want to make it public. +def _hessian_vector_product(ys, xs, v): + """Multiply the Hessian of `ys` wrt `xs` by `v`. + + This is an efficient construction that uses a backprop-like approach + to compute the product between the Hessian and another vector. The + Hessian is usually too large to be explicitly computed or even + represented, but this method allows us to at least multiply by it + for the same big-O cost as backprop. + + Implicit Hessian-vector products are the main practical, scalable way + of using second derivatives with neural networks. They allow us to + do things like construct Krylov subspaces and approximate conjugate + gradient descent. + + Example: if `y` = 1/2 `x`^T A `x`, then `hessian_vector_product(y, + x, v)` will return an expression that evaluates to the same values + as (A + A.T) `v`. + + Args: + ys: A scalar value, or a tensor or list of tensors to be summed to + yield a scalar. + xs: A list of tensors that we should construct the Hessian over. + v: A list of tensors, with the same shapes as xs, that we want to + multiply by the Hessian. + + Returns: + A list of tensors (or if the list would be length 1, a single tensor) + containing the product between the Hessian and `v`. + + Raises: + ValueError: `xs` and `v` have different length. + + """ + + # Validate the input + length = len(xs) + if len(v) != length: + raise ValueError("xs and v must have the same length.") + + # First backprop + grads = gradients(ys, xs) + + assert len(grads) == length + elemwise_products = [ + math_ops.mul(grad_elem, array_ops.stop_gradient(v_elem)) + for grad_elem, v_elem in zip(grads, v) if grad_elem is not None + ] + + # Second backprop + return gradients(elemwise_products, xs) + + +def hessians(ys, xs, name="hessians", colocate_gradients_with_ops=False, + gate_gradients=False, aggregation_method=None): + """Constructs the Hessian of sum of `ys` with respect to `x` in `xs`. + + `hessians()` adds ops to the graph to output the Hessian matrix of `ys` + with respect to `xs`. It returns a list of `Tensor` of length `len(xs)` + where each tensor is the Hessian of `sum(ys)`. This function currently + only supports evaluating the Hessian with respect to (a list of) one- + dimensional tensors. + + The Hessian is a matrix of second-order partial derivatives of a scalar + tensor (see https://en.wikipedia.org/wiki/Hessian_matrix for more details). + + Args: + ys: A `Tensor` or list of tensors to be differentiated. + xs: A `Tensor` or list of tensors to be used for differentiation. + name: Optional name to use for grouping all the gradient ops together. + defaults to 'hessians'. 
+ colocate_gradients_with_ops: See `gradients()` documentation for details. + gate_gradients: See `gradients()` documentation for details. + aggregation_method: See `gradients()` documentation for details. + + Returns: + A list of Hessian matrices of `sum(y)` for each `x` in `xs`. + + Raises: + LookupError: if one of the operations between `xs` and `ys` does not + have a registered gradient function. + ValueError: if the arguments are invalid or not supported. Currently, + this function only supports one-dimensional `x` in `xs`. + """ + xs = _AsList(xs) + kwargs = { + 'colocate_gradients_with_ops': colocate_gradients_with_ops, + 'gate_gradients': gate_gradients, + 'aggregation_method': aggregation_method + } + # Compute a hessian matrix for each x in xs + hessians = [] + for i, x in enumerate(xs): + # Check dimensions + ndims = x.get_shape().ndims + if ndims is None: + raise ValueError('Cannot compute Hessian because the dimensionality of ' + 'element number %d of `xs` cannot be determined' % i) + elif ndims != 1: + raise ValueError('Computing hessians is currently only supported for ' + 'one-dimensional tensors. Element number %d of `xs` has ' + '%d dimensions.' % (i, ndims)) + with ops.name_scope(name + '_first_derivative'): + # Compute the partial derivatives of the input with respect to all + # elements of `x` + _gradients = gradients(ys, x, **kwargs)[0] + # Unpack the gradients into a list so we can take derivatives with + # respect to each element + _gradients = array_ops.unpack(_gradients) + with ops.name_scope(name + '_second_derivative'): + # Compute the partial derivatives with respect to each element of the list + _hess = [gradients(_gradient, x, **kwargs)[0] for _gradient in _gradients] + # Pack the list into a matrix and add to the list of hessians + hessians.append(array_ops.pack(_hess, name=name)) + return hessians diff --git a/tensorflow/python/ops/gradients_test.py b/tensorflow/python/ops/gradients_test.py index 1c444de510c..1743cd8caaa 100644 --- a/tensorflow/python/ops/gradients_test.py +++ b/tensorflow/python/ops/gradients_test.py @@ -34,6 +34,7 @@ from tensorflow.python.ops import array_ops from tensorflow.python.ops import data_flow_grad # pylint: disable=unused-import from tensorflow.python.ops import data_flow_ops # pylint: disable=unused-import from tensorflow.python.ops import gradients +from tensorflow.python.ops import gradients_impl from tensorflow.python.ops import math_grad # pylint: disable=unused-import from tensorflow.python.ops import math_ops from tensorflow.python.ops import nn_grad # pylint: disable=unused-import @@ -66,8 +67,8 @@ def _OpsBetween(graph, to_ops, from_ops): # output ops as reached to avoid recursing past them. 
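A compact usage sketch of the hessians() entry point added above, called through the gradients module exactly as the shim re-exports it (TF 0.11-era API assumed):

import numpy as np
import tensorflow as tf
from tensorflow.python.ops import gradients

a = tf.constant(np.array([[2.0, 1.0], [0.0, 3.0]], dtype=np.float32))
x = tf.constant(np.array([1.0, -1.0], dtype=np.float32))
quad = tf.reduce_sum(x[:, None] * a * x[None, :])   # x^T A x, a scalar

hess = gradients.hessians(quad, x)[0]   # expected: A + A^T

with tf.Session() as sess:
    print(sess.run(hess))   # [[4. 1.], [1. 6.]]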
for op in to_ops: reached_ops[op._id] = True - gradients._MarkReachedOps(from_ops, reached_ops) - between_ops = gradients._GatherInputs(to_ops, reached_ops) + gradients_impl._MarkReachedOps(from_ops, reached_ops) + between_ops = gradients_impl._GatherInputs(to_ops, reached_ops) between_ops.sort(key=lambda x: -x._id) return between_ops @@ -414,11 +415,57 @@ class HessianVectorProductTest(test_util.TensorFlowTestCase): x = constant_op.constant(x_value) mat_x = math_ops.matmul(mat, x, name="Ax") x_mat_x = math_ops.matmul(array_ops.transpose(x), mat_x, name="xAx") - hess_v = gradients._hessian_vector_product(x_mat_x, [x], [v])[0] + hess_v = gradients_impl._hessian_vector_product(x_mat_x, [x], [v])[0] hess_v_actual = hess_v.eval() self.assertAllClose(hess_v_value, hess_v_actual) +class HessianTest(test_util.TensorFlowTestCase): + + def testHessian1D(self): + # Manually compute the Hessian explicitly for a low-dimensional problem + # and check that `hessian` matches. Specifically, the Hessian of + # f(x) = x^T A x is H = A + A^T. + m = 4 + rng = np.random.RandomState([1, 2, 3]) + mat_value = rng.randn(m, m).astype("float32") + x_value = rng.randn(m).astype("float32") + hess_value = mat_value + mat_value.T + with self.test_session(use_gpu=True): + mat = constant_op.constant(mat_value) + x = constant_op.constant(x_value) + x_mat_x = math_ops.reduce_sum(x[:, None] * mat * x[None, :]) + hess = gradients.hessians(x_mat_x, x)[0] + hess_actual = hess.eval() + self.assertAllClose(hess_value, hess_actual) + + def testHessian1D_multi(self): + # Test the computation of the hessian with respect to multiple tensors + m = 4 + n = 3 + rng = np.random.RandomState([1, 2, 3]) + mat_values = [rng.randn(m, m).astype("float32") for _ in range(n)] + x_values = [rng.randn(m).astype("float32") for _ in range(n)] + hess_values = [mat_value + mat_value.T for mat_value in mat_values] + with self.test_session(use_gpu=True): + mats = [constant_op.constant(mat_value) for mat_value in mat_values] + xs = [constant_op.constant(x_value) for x_value in x_values] + xs_mats_xs = [math_ops.reduce_sum(x[:, None] * mat * x[None, :]) + for x, mat in zip(xs, mats)] + hessians = gradients.hessians(xs_mats_xs, xs) + hessians_actual = [hess.eval() for hess in hessians] + for hess_value, hess_actual in zip(hess_values, hessians_actual): + self.assertAllClose(hess_value, hess_actual) + + def testHessianInvalidDimension(self): + for shape in [(10, 10), None]: + with self.test_session(use_gpu=True): + x = array_ops.placeholder(tf.float32, shape) + # Expect a ValueError because the dimensions are wrong + with self.assertRaises(ValueError): + gradients.hessians(x, x) + + class IndexedSlicesToTensorTest(test_util.TensorFlowTestCase): def testIndexedSlicesToTensor(self): diff --git a/tensorflow/python/ops/io_ops.py b/tensorflow/python/ops/io_ops.py index 15605ee42a4..7daf7c8cc82 100644 --- a/tensorflow/python/ops/io_ops.py +++ b/tensorflow/python/ops/io_ops.py @@ -92,6 +92,7 @@ Queues](../../how_tos/threading_and_queues/index.md). 
@@matching_files @@read_file +@@write_file ## Input pipeline @@ -521,4 +522,5 @@ ops.RegisterShape("ReaderReadUpTo")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("ReaderReset")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("ReaderRestoreState")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("ReadFile")(common_shapes.call_cpp_shape_fn) +ops.RegisterShape("WriteFile")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("MatchingFiles")(common_shapes.call_cpp_shape_fn) diff --git a/tensorflow/python/ops/linalg_grad.py b/tensorflow/python/ops/linalg_grad.py index 604fd4b3aa1..4b680c69464 100644 --- a/tensorflow/python/ops/linalg_grad.py +++ b/tensorflow/python/ops/linalg_grad.py @@ -74,6 +74,92 @@ def _MatrixSolveGrad(op, grad): return (grad_a, grad_b) +@ops.RegisterGradient("MatrixSolveLs") +def _MatrixSolveLsGrad(op, grad): + """Gradients for MatrixSolveLs.""" + + # TODO(rmlarsen): The implementation could be more efficient: + # a) Output the Cholesky factorization from forward op instead of + # recomputing it here. + # b) Implement a symmetric rank-k update op instead of computing + # x*z + transpose(x*z). This pattern occurs other places in TensorFlow. + + def _overdetermined(op, grad): + """Gradients for the overdetermined case of MatrixSolveLs. + + This is the backprop for the solution to the normal equations of the first + kind: + X = F(A, B) = (A^T * A + lambda * I)^{-1} * A^T * B + which solve the least squares problem + min ||A * X - B||_F^2 + lambda ||X||_F^2. + """ + a = op.inputs[0] + b = op.inputs[1] + l2_regularizer = op.inputs[2] + x = op.outputs[0] + a_shape = array_ops.shape(a) + batch_shape = a_shape[:-2] + n = a_shape[-1] + + identity = linalg_ops.eye(n, batch_shape=batch_shape, dtype=a.dtype) + gramian = math_ops.batch_matmul( + a, a, adj_x=True) + l2_regularizer * identity + chol = linalg_ops.cholesky(gramian) + # Temporary z = (A^T * A + lambda * I)^{-1} * grad. + z = linalg_ops.cholesky_solve(chol, grad) + xzt = math_ops.batch_matmul(x, z, adj_y=True) + zx_sym = xzt + array_ops.matrix_transpose(xzt) + grad_a = -math_ops.batch_matmul(a, zx_sym) + math_ops.batch_matmul( + b, z, adj_y=True) + grad_b = math_ops.batch_matmul(a, z) + return (grad_a, grad_b, None) + + def _underdetermined(op, grad): + """Gradients for the underdetermined case of MatrixSolveLs. + + This is the backprop for the solution to the normal equations of the second + kind: + X = F(A, B) = A * (A*A^T + lambda*I)^{-1} * B + that (for lambda=0) solve the least squares problem + min ||X||_F subject to A*X = B. + """ + a = op.inputs[0] + b = op.inputs[1] + l2_regularizer = op.inputs[2] + a_shape = array_ops.shape(a) + batch_shape = a_shape[:-2] + m = a_shape[-2] + + identity = linalg_ops.eye(m, batch_shape=batch_shape, dtype=a.dtype) + gramian = math_ops.batch_matmul( + a, a, adj_y=True) + l2_regularizer * identity + chol = linalg_ops.cholesky(gramian) + grad_b = linalg_ops.cholesky_solve(chol, math_ops.batch_matmul(a, grad)) + # Temporary z = (A * A^T + lambda * I)^{-1} * B. 
+ z = linalg_ops.cholesky_solve(chol, b) + bz = -math_ops.batch_matmul(grad_b, z, adj_y=True) + bz_sym = bz + array_ops.matrix_transpose(bz) + grad_a = math_ops.batch_matmul(bz_sym, a) + math_ops.batch_matmul(z, grad) + return (grad_a, grad_b, None) + + fast = op.get_attr("fast") + if fast is False: + raise ValueError("Gradient not defined for fast=False") + matrix_shape = op.inputs[0].get_shape()[-2:] + if matrix_shape.is_fully_defined(): + if matrix_shape[-2] >= matrix_shape[-1]: + return _overdetermined(op, grad) + else: + return _underdetermined(op, grad) + else: + # We have to defer determining the shape to runtime and use + # conditional execution of the appropriate graph. + matrix_shape = array_ops.shape(op.inputs[0])[-2:] + return control_flow_ops.cond(matrix_shape[-2] >= matrix_shape[-1], + lambda: _overdetermined(op, grad), + lambda: _underdetermined(op, grad)) + + @ops.RegisterGradient("MatrixTriangularSolve") def _MatrixTriangularSolveGrad(op, grad): """Gradient for MatrixTriangularSolve.""" @@ -129,6 +215,6 @@ def _SelfAdjointEigV2Grad(op, grad_e, grad_v): # symmetrize and take the lower triangle grad_a = array_ops.matrix_band_part( grad_a + array_ops.matrix_transpose(grad_a), -1, 0) - grad_a = array_ops.matrix_set_diag(grad_a, 0.5 * - array_ops.matrix_diag_part(grad_a)) + grad_a = array_ops.matrix_set_diag(grad_a, + 0.5 * array_ops.matrix_diag_part(grad_a)) return grad_a diff --git a/tensorflow/python/ops/linalg_ops.py b/tensorflow/python/ops/linalg_ops.py index da411044384..36cdcc7dc4c 100644 --- a/tensorflow/python/ops/linalg_ops.py +++ b/tensorflow/python/ops/linalg_ops.py @@ -239,7 +239,7 @@ def self_adjoint_eigvals(tensor, name=None): return e -def svd(tensor, compute_uv=True, full_matrices=False, name=None): +def svd(tensor, full_matrices=False, compute_uv=True, name=None): """Computes the singular value decompositions of one or more matrices. Computes the SVD of each inner matrix in `tensor` such that @@ -258,12 +258,12 @@ def svd(tensor, compute_uv=True, full_matrices=False, name=None): Args: matrix: `Tensor` of shape `[..., M, N]`. Let `P` be the minimum of `M` and `N`. - compute_uv: If `True` then left and right singular vectors will be - computed and returned in `u` and `v`, respectively. Otherwise, only the - singular values will be computed, which can be significantly faster. full_matrices: If true, compute full-sized `u` and `v`. If false (the default), compute only the leading `P` singular vectors. Ignored if `compute_uv` is `False`. + compute_uv: If `True` then left and right singular vectors will be + computed and returned in `u` and `v`, respectively. Otherwise, only the + singular values will be computed, which can be significantly faster. name: string, optional name of the operation. 
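The _MatrixSolveLsGrad registration above makes the least-squares solver differentiable (on the fast=True path only, with a shape-based dispatch between the two normal-equation forms). A sketch of differentiating through it, assuming the TF 0.11-era API:

import tensorflow as tf

a = tf.constant([[1.0, 0.0], [0.0, 2.0], [1.0, 1.0]])   # 3x2: overdetermined
b = tf.constant([[1.0], [2.0], [3.0]])
x = tf.matrix_solve_ls(a, b, l2_regularizer=0.1)        # fast=True by default

loss = tf.reduce_sum(tf.square(x))
grad_a, grad_b = tf.gradients(loss, [a, b])             # uses the gradient above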
Returns: diff --git a/tensorflow/python/ops/math_grad.py b/tensorflow/python/ops/math_grad.py index 7d8d2390b17..00fb343d47f 100644 --- a/tensorflow/python/ops/math_grad.py +++ b/tensorflow/python/ops/math_grad.py @@ -326,6 +326,15 @@ def _LogGrad(op, grad): return grad * math_ops.inv(x) +@ops.RegisterGradient("Log1p") +def _Log1pGrad(op, grad): + """Returns grad * (1/(1 + x)).""" + x = op.inputs[0] + with ops.control_dependencies([grad.op]): + x = math_ops.conj(x) + return grad * math_ops.inv(1 + x) + + @ops.RegisterGradient("Tanh") def _TanhGrad(op, grad): """Returns grad * (1 - tanh(x) * tanh(x)).""" diff --git a/tensorflow/python/ops/math_ops.py b/tensorflow/python/ops/math_ops.py index cf4b47757eb..0bd93abc1ed 100644 --- a/tensorflow/python/ops/math_ops.py +++ b/tensorflow/python/ops/math_ops.py @@ -51,6 +51,7 @@ mathematical functions to your graph. @@pow @@exp @@log +@@log1p @@ceil @@floor @@maximum @@ -217,6 +218,7 @@ from tensorflow.python.framework import constant_op from tensorflow.python.framework import dtypes from tensorflow.python.framework import graph_util from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.framework import tensor_shape from tensorflow.python.ops import array_ops from tensorflow.python.ops import gen_control_flow_ops @@ -258,13 +260,15 @@ def abs(x, name=None): values. """ with ops.name_scope(name, "Abs", [x]) as name: - if isinstance(x, ops.SparseTensor): + if isinstance(x, sparse_tensor.SparseTensor): if x.values.dtype in (dtypes.complex64, dtypes.complex128): x_abs = gen_math_ops.complex_abs(x.values, Tout=x.values.dtype.real_dtype, name=name) - return ops.SparseTensor(indices=x.indices, values=x_abs, shape=x.shape) + return sparse_tensor.SparseTensor( + indices=x.indices, values=x_abs, shape=x.shape) x_abs = gen_math_ops._abs(x.values, name=name) - return ops.SparseTensor(indices=x.indices, values=x_abs, shape=x.shape) + return sparse_tensor.SparseTensor( + indices=x.indices, values=x_abs, shape=x.shape) else: x = ops.convert_to_tensor(x, name="x") if x.dtype in (dtypes.complex64, dtypes.complex128): @@ -297,9 +301,10 @@ def neg(x, name=None): A `Tensor` or `SparseTensor`, respectively. Has the same type as `x`. """ with ops.name_scope(name, "Neg", [x]) as name: - if isinstance(x, ops.SparseTensor): + if isinstance(x, sparse_tensor.SparseTensor): x_neg = gen_math_ops.neg(x.values, name=name) - return ops.SparseTensor(indices=x.indices, values=x_neg, shape=x.shape) + return sparse_tensor.SparseTensor( + indices=x.indices, values=x_neg, shape=x.shape) else: return gen_math_ops.neg(x, name=name) @@ -320,9 +325,10 @@ def sign(x, name=None): A `Tensor` or `SparseTensor`, respectively. Has the same type as `x`. """ with ops.name_scope(name, "Sign", [x]) as name: - if isinstance(x, ops.SparseTensor): + if isinstance(x, sparse_tensor.SparseTensor): x_sign = gen_math_ops.sign(x.values, name=name) - return ops.SparseTensor(indices=x.indices, values=x_sign, shape=x.shape) + return sparse_tensor.SparseTensor( + indices=x.indices, values=x_sign, shape=x.shape) else: return gen_math_ops.sign(x, name=name) @@ -341,9 +347,10 @@ def square(x, name=None): A `Tensor` or `SparseTensor`. Has the same type as `x`. 
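A quick numeric check of the Log1p gradient registered above, which returns grad * 1/(1 + x) (TF 0.11-era API; log1p is the op this change exposes):

import tensorflow as tf

x = tf.constant([0.0, 1.0, 9.0])
y = tf.log1p(x)                  # log(1 + x)
g = tf.gradients(y, [x])[0]      # 1 / (1 + x)

with tf.Session() as sess:
    print(sess.run(g))           # [1.0, 0.5, 0.1]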
""" with ops.name_scope(name, "Square", [x]) as name: - if isinstance(x, ops.SparseTensor): + if isinstance(x, sparse_tensor.SparseTensor): x_square = gen_math_ops.square(x.values, name=name) - return ops.SparseTensor(indices=x.indices, values=x_square, shape=x.shape) + return sparse_tensor.SparseTensor( + indices=x.indices, values=x_square, shape=x.shape) else: return gen_math_ops.square(x, name=name) @@ -362,9 +369,10 @@ def sqrt(x, name=None): A `Tensor` or `SparseTensor`, respectively. Has the same type as `x`. """ with ops.name_scope(name, "Sqrt", [x]) as name: - if isinstance(x, ops.SparseTensor): + if isinstance(x, sparse_tensor.SparseTensor): x_sqrt = gen_math_ops.sqrt(x.values, name=name) - return ops.SparseTensor(indices=x.indices, values=x_sqrt, shape=x.shape) + return sparse_tensor.SparseTensor( + indices=x.indices, values=x_sqrt, shape=x.shape) else: return gen_math_ops.sqrt(x, name=name) @@ -381,9 +389,10 @@ def erf(x, name=None): A `Tensor` or `SparseTensor`, respectively. Has the same type as `x`. """ with ops.name_scope(name, "Erf", [x]) as name: - if isinstance(x, ops.SparseTensor): + if isinstance(x, sparse_tensor.SparseTensor): x_erf = gen_math_ops.erf(x.values, name=name) - return ops.SparseTensor(indices=x.indices, values=x_erf, shape=x.shape) + return sparse_tensor.SparseTensor( + indices=x.indices, values=x_erf, shape=x.shape) else: return gen_math_ops.erf(x, name=name) @@ -624,9 +633,9 @@ def cast(x, dtype, name=None): """ base_type = dtypes.as_dtype(dtype).base_dtype with ops.name_scope(name, "Cast", [x]) as name: - if isinstance(x, ops.SparseTensor): + if isinstance(x, sparse_tensor.SparseTensor): values_cast = cast(x.values, base_type, name=name) - return ops.SparseTensor(x.indices, values_cast, x.shape) + return sparse_tensor.SparseTensor(x.indices, values_cast, x.shape) else: # TODO(touts): Handle what Josh said. # @@ -769,16 +778,17 @@ def _OverrideBinaryOperatorHelper(func, op_name, clazz_object=ops.Tensor): """ def binary_op_wrapper(x, y): with ops.name_scope(None, op_name, [x, y]) as name: - if not isinstance(y, ops.SparseTensor): + if not isinstance(y, sparse_tensor.SparseTensor): y = ops.convert_to_tensor(y, dtype=x.dtype.base_dtype, name="y") return func(x, y, name=name) def binary_op_wrapper_sparse(sp_x, y): with ops.name_scope(None, op_name, [sp_x, y]) as name: y = ops.convert_to_tensor(y, dtype=sp_x.dtype.base_dtype, name="y") - return ops.SparseTensor(sp_x.indices, func(sp_x.indices, sp_x.values, - sp_x.shape, y, name=name), - sp_x.shape) + return sparse_tensor.SparseTensor( + sp_x.indices, func(sp_x.indices, sp_x.values, + sp_x.shape, y, name=name), + sp_x.shape) def r_binary_op_wrapper(y, x): with ops.name_scope(None, op_name, [x, y]) as name: @@ -934,18 +944,18 @@ def _mul_dispatch(x, y, name=None): if is_tensor_y: return gen_math_ops.mul(x, y, name=name) else: - assert isinstance(y, ops.SparseTensor) # Case: Dense * Sparse. + assert isinstance(y, sparse_tensor.SparseTensor) # Case: Dense * Sparse. 
new_vals = gen_sparse_ops.sparse_dense_cwise_mul(y.indices, y.values, y.shape, x, name) - return ops.SparseTensor(y.indices, new_vals, y.shape) + return sparse_tensor.SparseTensor(y.indices, new_vals, y.shape) _OverrideBinaryOperatorHelper(gen_sparse_ops.sparse_dense_cwise_div, "div", - ops.SparseTensor) + sparse_tensor.SparseTensor) _OverrideBinaryOperatorHelper(_sparse_dense_truediv, "truediv", - ops.SparseTensor) + sparse_tensor.SparseTensor) _OverrideBinaryOperatorHelper(gen_sparse_ops.sparse_dense_cwise_mul, "mul", - ops.SparseTensor) + sparse_tensor.SparseTensor) _OverrideBinaryOperatorHelper(gen_math_ops.add, "add") @@ -1060,7 +1070,7 @@ def _ReductionDims(x, reduction_indices): if isinstance(x, ops.Tensor) and x.get_shape().ndims is not None: return constant_op.constant(np.arange(x.get_shape().ndims), dtype=dtypes.int32) - if (isinstance(x, ops.SparseTensor) and + if (isinstance(x, sparse_tensor.SparseTensor) and x.shape.get_shape().is_fully_defined()): rank = x.shape.get_shape()[0].value # sparse.shape is a 1-D tensor. return constant_op.constant(np.arange(rank), dtype=dtypes.int32) @@ -1534,19 +1544,6 @@ def _calc_mat_mul_flops(graph, node): return ops.OpStats("flops", (k * output_count * 2)) -@ops.RegisterStatistics("MatMul", "weight_parameters") -def _calc_mat_mul_weight_parameters(graph, node): - """Calculates the on-disk size of the weights for MatMul.""" - # We assume here that the weights are always in the second input to the op, - # which is generally true by convention for fully-connected layers, but not - # enforced or checked. - weights_shape = graph_util.tensor_shape_from_node_def_name(graph, - node.input[1]) - weights_shape.assert_is_fully_defined() - return ops.OpStats("weight_parameters", - (int(weights_shape[1]) * int(weights_shape[0]))) - - def _as_indexed_slices(x, optimize=True): """Convert 'x' to IndexedSlices. @@ -1738,9 +1735,10 @@ def tanh(x, name=None): `x.dtype != qint32` otherwise the return type is `quint8`.
""" with ops.name_scope(name, "Tanh", [x]) as name: - if isinstance(x, ops.SparseTensor): + if isinstance(x, sparse_tensor.SparseTensor): x_tanh = gen_math_ops._tanh(x.values, name=name) - return ops.SparseTensor(indices=x.indices, values=x_tanh, shape=x.shape) + return sparse_tensor.SparseTensor( + indices=x.indices, values=x_tanh, shape=x.shape) else: return gen_math_ops._tanh(x, name=name) @@ -1888,6 +1886,7 @@ ops.RegisterShape("IsFinite")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("IsInf")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("IsNan")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("Log")(common_shapes.call_cpp_shape_fn) +ops.RegisterShape("Log1p")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("LogicalNot")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("Neg")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("Real")(common_shapes.call_cpp_shape_fn) diff --git a/tensorflow/python/ops/nn.py b/tensorflow/python/ops/nn.py index ceb55d6daf7..71296ea7986 100644 --- a/tensorflow/python/ops/nn.py +++ b/tensorflow/python/ops/nn.py @@ -454,7 +454,7 @@ def sigmoid_cross_entropy_with_logits(logits, targets, name=None): relu_logits = math_ops.select(cond, logits, zeros) neg_abs_logits = math_ops.select(cond, -logits, logits) return math_ops.add(relu_logits - logits * targets, - math_ops.log(1 + math_ops.exp(neg_abs_logits)), + math_ops.log1p(math_ops.exp(neg_abs_logits)), name=name) @@ -522,7 +522,7 @@ def weighted_cross_entropy_with_logits(logits, targets, pos_weight, name=None): log_weight = 1 + (pos_weight - 1) * targets return math_ops.add( (1 - targets) * logits, - log_weight * (math_ops.log(1 + math_ops.exp(-math_ops.abs(logits))) + + log_weight * (math_ops.log1p(math_ops.exp(-math_ops.abs(logits))) + nn_ops.relu(-logits)), name=name) diff --git a/tensorflow/python/ops/nn_ops.py b/tensorflow/python/ops/nn_ops.py index 5b08dcdfb5d..0fdb98f172e 100644 --- a/tensorflow/python/ops/nn_ops.py +++ b/tensorflow/python/ops/nn_ops.py @@ -1809,24 +1809,6 @@ def _calc_conv_flops(graph, node): filter_width * 2)) -@ops.RegisterStatistics("Conv2D", "weight_parameters") -def _calc_conv_weight_params(graph, node): - """Calculates the on-disk size of the weights for Conv2D.""" - input_shape = graph_util.tensor_shape_from_node_def_name(graph, node.input[0]) - input_shape.assert_is_fully_defined() - filter_shape = graph_util.tensor_shape_from_node_def_name(graph, - node.input[1]) - filter_shape.assert_is_fully_defined() - output_shape = graph_util.tensor_shape_from_node_def_name(graph, node.name) - output_shape.assert_is_fully_defined() - filter_height = int(filter_shape[0]) - filter_width = int(filter_shape[1]) - filter_in_depth = int(filter_shape[2]) - filter_out_depth = int(filter_shape[3]) - return ops.OpStats("weight_parameters", (filter_height * filter_width * - filter_in_depth * filter_out_depth)) - - @ops.RegisterStatistics("DepthwiseConv2dNative", "flops") def _calc_depthwise_conv_flops(graph, node): """Calculates the compute resources needed for DepthwiseConv2dNative.""" @@ -1843,25 +1825,6 @@ def _calc_depthwise_conv_flops(graph, node): return ops.OpStats("flops", (output_count * filter_height * filter_width * 2)) -@ops.RegisterStatistics("DepthwiseConv2dNative", "weight_parameters") -def _calc_depthwise_conv_weight_params(graph, node): - """Calculates the on-disk size of the weights for DepthwiseConv2dNative.""" - input_shape = graph_util.tensor_shape_from_node_def_name(graph, node.input[0]) - input_shape.assert_is_fully_defined() - filter_shape = 
graph_util.tensor_shape_from_node_def_name(graph, - node.input[1]) - filter_shape.assert_is_fully_defined() - output_shape = graph_util.tensor_shape_from_node_def_name(graph, node.name) - output_shape.assert_is_fully_defined() - filter_height = int(filter_shape[0]) - filter_width = int(filter_shape[1]) - filter_in_depth = int(filter_shape[2]) - filter_channel_multiplier = int(filter_shape[3]) - return ops.OpStats("weight_parameters", (filter_height * filter_width * - filter_in_depth * - filter_channel_multiplier)) - - ops.RegisterShape("Conv3D")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("MaxPool3D")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("AvgPool3D")(common_shapes.call_cpp_shape_fn) @@ -1882,15 +1845,6 @@ def _calc_bias_add_flops(graph, node): return ops.OpStats("flops", input_count) -@ops.RegisterStatistics("BiasAdd", "weight_parameters") -def _calc_bias_add_weight_params(graph, node): - """Calculates the on-disk weight parameters for BiasAdd.""" - bias_shape = graph_util.tensor_shape_from_node_def_name(graph, node.input[1]) - bias_shape.assert_is_fully_defined() - bias_count = np.prod(bias_shape.as_list()) - return ops.OpStats("weight_parameters", bias_count) - - def xw_plus_b(x, weights, biases, name=None): # pylint: disable=invalid-name """Computes matmul(x, weights) + biases. @@ -2112,19 +2066,6 @@ def _calc_dilation2d_flops(graph, node): return ops.OpStats("flops", (output_count * filter_height * filter_width * 2)) -@ops.RegisterStatistics("Dilation2D", "weight_parameters") -def _calc_dilation2d_weight_params(graph, node): - """Calculates the on-disk size of the weights for Dilation2D.""" - filter_shape = graph_util.tensor_shape_from_node_def_name(graph, - node.input[1]) - filter_shape.assert_is_fully_defined() - filter_height = int(filter_shape[0]) - filter_width = int(filter_shape[1]) - filter_depth = int(filter_shape[2]) - return ops.OpStats("weight_parameters", - (filter_height * filter_width * filter_depth)) - - def erosion2d(value, kernel, strides, rates, padding, name=None): """Computes the grayscale erosion of 4-D `value` and 3-D `kernel` tensors. 
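The `log1p` plumbing introduced above (a registered gradient, the `@@log1p` documentation entry, a `Log1p` shape registration, and the `math_ops.log1p` substitutions in `sigmoid_cross_entropy_with_logits` and `weighted_cross_entropy_with_logits`) is about numerical accuracy: computing `log(1 + x)` directly rounds `1 + x` first, which discards `x` entirely once it falls below machine epsilon, whereas `log1p(x)` evaluates the same quantity without that rounding. A minimal NumPy sketch of the effect (illustrative only; not part of this change):

```python
import numpy as np

x = 1e-18  # well below float64 machine epsilon (~2.2e-16)

# Naive form: 1.0 + 1e-18 rounds to exactly 1.0, so the log collapses to 0.
print(np.log(1.0 + x))  # 0.0

# log1p evaluates log(1 + x) without forming 1 + x, so precision survives.
print(np.log1p(x))      # 1e-18
```

The new gradient follows directly from d/dx log(1 + x) = 1/(1 + x), which is exactly what `_Log1pGrad` returns.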
diff --git a/tensorflow/python/ops/parsing_ops.py b/tensorflow/python/ops/parsing_ops.py index 992fe0c331c..c8bea69aee8 100644 --- a/tensorflow/python/ops/parsing_ops.py +++ b/tensorflow/python/ops/parsing_ops.py @@ -24,6 +24,7 @@ import re from tensorflow.python.framework import common_shapes from tensorflow.python.framework import constant_op from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.framework import tensor_shape from tensorflow.python.ops import array_ops from tensorflow.python.ops import control_flow_ops @@ -406,8 +407,9 @@ def _parse_example_raw(serialized, (sparse_indices, sparse_values, sparse_shapes, dense_values) = outputs - sparse_tensors = [ops.SparseTensor(ix, val, shape) for (ix, val, shape) - in zip(sparse_indices, sparse_values, sparse_shapes)] + sparse_tensors = [ + sparse_tensor.SparseTensor(ix, val, shape) for (ix, val, shape) + in zip(sparse_indices, sparse_values, sparse_shapes)] return dict( zip(sparse_keys + dense_keys, sparse_tensors + dense_values)) @@ -530,7 +532,7 @@ def _parse_single_example_raw(serialized, if sparse_keys is not None: for s in sparse_keys: s_name = re.sub("[^A-Za-z0-9_.\\-/]", "_", s) - outputs[s] = ops.SparseTensor( + outputs[s] = sparse_tensor.SparseTensor( array_ops.slice(outputs[s].indices, [0, 1], [-1, -1], name="Slice_Indices_%s" % s_name), outputs[s].values, @@ -841,13 +843,13 @@ def _parse_single_sequence_example_raw(serialized, feature_list_sparse_shapes, feature_list_dense_values) = outputs context_sparse_tensors = [ - ops.SparseTensor(ix, val, shape) for (ix, val, shape) + sparse_tensor.SparseTensor(ix, val, shape) for (ix, val, shape) in zip(context_sparse_indices, context_sparse_values, context_sparse_shapes)] feature_list_sparse_tensors = [ - ops.SparseTensor(ix, val, shape) for (ix, val, shape) + sparse_tensor.SparseTensor(ix, val, shape) for (ix, val, shape) in zip(feature_list_sparse_indices, feature_list_sparse_values, feature_list_sparse_shapes)] diff --git a/tensorflow/python/ops/resource_variable_ops.py b/tensorflow/python/ops/resource_variable_ops.py index 7db9731e198..0057f86486b 100644 --- a/tensorflow/python/ops/resource_variable_ops.py +++ b/tensorflow/python/ops/resource_variable_ops.py @@ -28,3 +28,6 @@ from tensorflow.python.ops.gen_resource_variable_ops import * ops.RegisterShape("VarHandleOp")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("CreateVariableOp")(common_shapes.call_cpp_shape_fn) +ops.RegisterShape("ReadVariableOp")(common_shapes.call_cpp_shape_fn) +ops.RegisterShape("AssignVariableOp")(common_shapes.call_cpp_shape_fn) +ops.RegisterShape("AssignAddVariableOp")(common_shapes.call_cpp_shape_fn) diff --git a/tensorflow/python/ops/rnn.py b/tensorflow/python/ops/rnn.py index cc5464d5720..f67f4f35e88 100644 --- a/tensorflow/python/ops/rnn.py +++ b/tensorflow/python/ops/rnn.py @@ -1057,8 +1057,8 @@ def raw_rnn(cell, loop_fn, time=time + 1, cell_output=output, cell_state=cell_state, loop_state=loop_state) # Emit zeros and copy forward state for minibatch entries that are finished. - state = tf.select(finished, state, next_state) - emit = tf.select(finished, tf.zeros_like(emit), emit) + state = tf.where(finished, state, next_state) + emit = tf.where(finished, tf.zeros_like(emit), emit) emit_ta = emit_ta.write(time, emit) # If any new minibatch entries are marked as finished, mark these. 
finished = tf.logical_or(finished, next_finished) diff --git a/tensorflow/python/ops/sparse_grad.py b/tensorflow/python/ops/sparse_grad.py index f15f3f5b749..0c4041ce545 100644 --- a/tensorflow/python/ops/sparse_grad.py +++ b/tensorflow/python/ops/sparse_grad.py @@ -19,6 +19,7 @@ from __future__ import division from __future__ import print_function from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import gen_sparse_ops from tensorflow.python.ops import math_ops @@ -51,7 +52,8 @@ def _SparseReorderGrad(op, unused_output_indices_grad, output_values_grad): num_entries = array_ops.shape(input_indices)[0] entry_indices = math_ops.range(num_entries) - sp_unordered = ops.SparseTensor(input_indices, entry_indices, input_shape) + sp_unordered = sparse_tensor.SparseTensor( + input_indices, entry_indices, input_shape) sp_ordered = sparse_ops.sparse_reorder(sp_unordered) inverted_permutation = array_ops.invert_permutation(sp_ordered.values) @@ -134,7 +136,7 @@ def _SparseTensorDenseMatMulGrad(op, grad): Raises: TypeError: When the two operands don't have the same type. """ - sp_t = ops.SparseTensor(*op.inputs[:3]) + sp_t = sparse_tensor.SparseTensor(*op.inputs[:3]) adj_a = op.get_attr("adjoint_a") adj_b = op.get_attr("adjoint_b") @@ -209,7 +211,7 @@ def _SparseDenseCwiseMulOrDivGrad(op, grad, is_mul): # indices can repeat after scaling, so we can't use sparse_to_dense(). dy = sparse_ops.sparse_add( array_ops.zeros_like(y), - ops.SparseTensor(scaled_indices, dy_val, y_shape)) + sparse_tensor.SparseTensor(scaled_indices, dy_val, y_shape)) # (sp_indices, sp_vals, sp_shape, dense) return (None, dx, None, dy) @@ -246,9 +248,9 @@ def _SparseSoftmaxGrad(op, grad): """ indices, shape = op.inputs[0], op.inputs[2] out_vals = op.outputs[0] - sp_output = ops.SparseTensor(indices, out_vals, shape) - sp_grad = ops.SparseTensor(indices, grad, shape) - sp_product = ops.SparseTensor( + sp_output = sparse_tensor.SparseTensor(indices, out_vals, shape) + sp_grad = sparse_tensor.SparseTensor(indices, grad, shape) + sp_product = sparse_tensor.SparseTensor( indices, sp_output.values * sp_grad.values, shape) # [..., B, 1], dense. diff --git a/tensorflow/python/ops/sparse_ops.py b/tensorflow/python/ops/sparse_ops.py index 0648662ef0b..990c4861350 100644 --- a/tensorflow/python/ops/sparse_ops.py +++ b/tensorflow/python/ops/sparse_ops.py @@ -62,6 +62,7 @@ import numpy as np from tensorflow.python.framework import common_shapes from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.ops import array_ops from tensorflow.python.ops import check_ops from tensorflow.python.ops import control_flow_ops @@ -86,9 +87,9 @@ def _convert_to_sparse_tensor(sp_input): Raises: ValueError: if `sp_input` is neither `SparseTensor` nor `SparseTensorValue`. 
""" - if isinstance(sp_input, ops.SparseTensorValue): - return ops.SparseTensor.from_value(sp_input) - if not isinstance(sp_input, ops.SparseTensor): + if isinstance(sp_input, sparse_tensor.SparseTensorValue): + return sparse_tensor.SparseTensor.from_value(sp_input) + if not isinstance(sp_input, sparse_tensor.SparseTensor): raise TypeError("Input must be a SparseTensor.") return sp_input @@ -232,7 +233,7 @@ def sparse_concat(concat_dim, sp_inputs, name=None, expand_nonconcat_dim=False): output_ind, output_val, output_shape = (gen_sparse_ops._sparse_concat( inds, vals, shapes, concat_dim, name=name)) - return ops.SparseTensor(output_ind, output_val, output_shape) + return sparse_tensor.SparseTensor(output_ind, output_val, output_shape) def sparse_add(a, b, thresh=0): @@ -284,7 +285,7 @@ def sparse_add(a, b, thresh=0): Raises: TypeError: If both `a` and `b` are `Tensor`s. Use `tf.add()` instead. """ - sparse_classes = (ops.SparseTensor, ops.SparseTensorValue) + sparse_classes = (sparse_tensor.SparseTensor, sparse_tensor.SparseTensorValue) if not any(isinstance(inp, sparse_classes) for inp in [a, b]): raise TypeError("At least one input should be SparseTensor; do you mean to" " use tf.add()?") @@ -295,7 +296,7 @@ def sparse_add(a, b, thresh=0): thresh, dtype=a.values.dtype.real_dtype, name="thresh") output_ind, output_val, output_shape = (gen_sparse_ops._sparse_add( a.indices, a.values, a.shape, b.indices, b.values, b.shape, thresh)) - return ops.SparseTensor(output_ind, output_val, output_shape) + return sparse_tensor.SparseTensor(output_ind, output_val, output_shape) else: # swap to make `a` the SparseTensor. if isinstance(b, sparse_classes): @@ -329,7 +330,7 @@ def sparse_dense_cwise_add(sp_t, dense_t): """ result = gen_sparse_ops.sparse_dense_cwise_add(sp_t.indices, sp_t.values, sp_t.shape, dense_t) - return ops.SparseTensor(sp_t.indices, result, sp_t.shape) + return sparse_tensor.SparseTensor(sp_t.indices, result, sp_t.shape) ops.RegisterShape("SparseTensorDenseAdd")(common_shapes.call_cpp_shape_fn) @@ -377,8 +378,8 @@ def sparse_reorder(sp_input, name=None): reordered_ind, reordered_val = (gen_sparse_ops._sparse_reorder( sp_input.indices, sp_input.values, sp_input.shape, name=name)) - return ops.SparseTensor(reordered_ind, reordered_val, - array_ops.identity(sp_input.shape)) + return sparse_tensor.SparseTensor(reordered_ind, reordered_val, + array_ops.identity(sp_input.shape)) ops.RegisterShape("SparseReorder")(common_shapes.call_cpp_shape_fn) @@ -435,8 +436,9 @@ def sparse_reshape(sp_input, shape, name=None): reshaped_ind, reshaped_shape = gen_sparse_ops._sparse_reshape( sp_input.indices, sp_input.shape, shape, name=name) - return ops.SparseTensor(reshaped_ind, array_ops.identity(sp_input.values), - reshaped_shape) + return sparse_tensor.SparseTensor( + reshaped_ind, array_ops.identity(sp_input.values), + reshaped_shape) ops.RegisterShape("SparseReshape")(common_shapes.call_cpp_shape_fn) @@ -488,7 +490,8 @@ def sparse_split(split_dim, num_split, sp_input, name=None): sparse_tensors = [] for i in range(0, num_split): sparse_tensors.append( - ops.SparseTensor(output_inds[i], output_vals[i], output_shapes[i])) + sparse_tensor.SparseTensor( + output_inds[i], output_vals[i], output_shapes[i])) return sparse_tensors @@ -633,7 +636,7 @@ def sparse_reduce_sum_sparse(sp_input, reduction_axes=None, keep_dims=False): sp_input.shape, math_ops._ReductionDims(sp_input, reduction_axes), keep_dims)) - return ops.SparseTensor(output_ind, output_val, output_shape) + return 
sparse_tensor.SparseTensor(output_ind, output_val, output_shape) ops.RegisterShape("SparseReduceSumSparse")(common_shapes.call_cpp_shape_fn) @@ -741,7 +744,8 @@ def sparse_to_indicator(sp_input, vocab_size, name=None): with ops.name_scope(name, "SparseToIndicator", [sp_input]) as name: num_entries = array_ops.shape(sp_input.indices)[0] new_values = array_ops.fill(array_ops.expand_dims(num_entries, 0), True) - sp_values = ops.SparseTensor(sp_input.indices, new_values, sp_input.shape) + sp_values = sparse_tensor.SparseTensor( + sp_input.indices, new_values, sp_input.shape) sp_new = sparse_merge(sp_input, sp_values, vocab_size, name) @@ -851,7 +855,7 @@ def sparse_merge(sp_ids, sp_values, vocab_size, name=None, [array_ops.slice(sp_ids.shape, [0], array_ops.expand_dims(rank - 1, 0)), math_ops.cast(array_ops.pack([vocab_size]), dtypes.int64)]) - result = ops.SparseTensor(new_indices, new_values, new_shape) + result = sparse_tensor.SparseTensor(new_indices, new_values, new_shape) return result if already_sorted else sparse_reorder(result) @@ -894,8 +898,8 @@ def sparse_retain(sp_input, to_retain): where_true = array_ops.reshape(array_ops.where(to_retain), [-1]) new_indices = array_ops.gather(sp_input.indices, where_true) new_values = array_ops.gather(sp_input.values, where_true) - return ops.SparseTensor(new_indices, new_values, - array_ops.identity(sp_input.shape)) + return sparse_tensor.SparseTensor(new_indices, new_values, + array_ops.identity(sp_input.shape)) def sparse_reset_shape(sp_input, new_shape=None): @@ -967,7 +971,7 @@ def sparse_reset_shape(sp_input, new_shape=None): output_shape_tensor.get_shape().assert_has_rank(1) output_shape_tensor = math_ops.cast(output_shape_tensor, dtypes.int64) # For cases when shape is known during graph construction, this catches the - # error before the ops.SparseTensor catches it. + # error before the sparse_tensor.SparseTensor catches it. output_shape_tensor.get_shape()[0].merge_with(in_shape.get_shape()[0]) # For cases where shape is not known during graph construction. 
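The `sparse_ops.py` hunks here are mechanical: every internal `ops.SparseTensor` construction is repointed at the new `tensorflow.python.framework.sparse_tensor` module. User-facing behavior is unchanged; as a sanity check, a short sketch of the public API these functions back (hypothetical values, and assuming the 0.11-era constructor whose third argument was still named `shape` rather than the later `dense_shape`):

```python
import tensorflow as tf

# A 3x4 sparse tensor with two nonzero entries (hypothetical values).
sp = tf.SparseTensor(indices=[[0, 0], [1, 2]], values=[1.0, 2.0], shape=[3, 4])

# Densify to inspect it; positions not listed in `indices` default to 0.
dense = tf.sparse_tensor_to_dense(sp)

with tf.Session() as sess:
    print(sess.run(dense))  # [[1. 0. 0. 0.] [0. 0. 2. 0.] [0. 0. 0. 0.]]
```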
@@ -979,7 +983,7 @@ def sparse_reset_shape(sp_input, new_shape=None): [check_ops.assert_less_equal(in_shape, output_shape_tensor)], output_shape_tensor) - return ops.SparseTensor(in_indices, in_values, output_shape_tensor) + return sparse_tensor.SparseTensor(in_indices, in_values, output_shape_tensor) def sparse_fill_empty_rows(sp_input, default_value, name=None): @@ -1054,8 +1058,9 @@ def sparse_fill_empty_rows(sp_input, default_value, name=None): additional_indices]) all_values_unordered = array_ops.concat(0, [sp_input.values, additional_values]) - sp_unordered_output = ops.SparseTensor(all_indices_unordered, - all_values_unordered, sp_input.shape) + sp_unordered_output = sparse_tensor.SparseTensor( + all_indices_unordered, + all_values_unordered, sp_input.shape) sp_ordered_output = sparse_reorder(sp_unordered_output) return sp_ordered_output, empty_row_indicator @@ -1182,7 +1187,7 @@ def deserialize_many_sparse(serialized_sparse, dtype, rank=None, name=None): output_indices.set_shape([None, rank]) output_shape.set_shape([rank]) - return ops.SparseTensor(output_indices, output_values, output_shape) + return sparse_tensor.SparseTensor(output_indices, output_values, output_shape) ops.RegisterShape("DeserializeManySparse")(common_shapes.call_cpp_shape_fn) @@ -1423,7 +1428,8 @@ def sparse_softmax(sp_input, name=None): [sp_input.indices, sp_input.values]) as name: out_vals = gen_sparse_ops.sparse_softmax(sp_input.indices, sp_input.values, sp_input.shape) - return ops.SparseTensor(sp_input.indices, out_vals, sp_input.shape) + return sparse_tensor.SparseTensor( + sp_input.indices, out_vals, sp_input.shape) ops.RegisterShape("SparseSoftmax")(common_shapes.call_cpp_shape_fn) @@ -1436,8 +1442,8 @@ def sparse_maximum(sp_a, sp_b, name=None): Example: ```python - sp_zero = ops.SparseTensor([[0]], [0], [7]) - sp_one = ops.SparseTensor([[1]], [1], [7]) + sp_zero = sparse_tensor.SparseTensor([[0]], [0], [7]) + sp_one = sparse_tensor.SparseTensor([[1]], [1], [7]) res = tf.sparse_maximum(sp_zero, sp_one).eval() # "res" should be equal to SparseTensor([[0], [1]], [0, 1], [7]). ``` @@ -1462,7 +1468,7 @@ def sparse_maximum(sp_a, sp_b, name=None): sp_b.values, sp_b.shape, name=name) - return ops.SparseTensor(out_indices, out_values, sp_a.shape) + return sparse_tensor.SparseTensor(out_indices, out_values, sp_a.shape) def sparse_minimum(sp_a, sp_b, name=None): @@ -1472,8 +1478,8 @@ def sparse_minimum(sp_a, sp_b, name=None): Example: ```python - sp_zero = ops.SparseTensor([[0]], [0], [7]) - sp_one = ops.SparseTensor([[1]], [1], [7]) + sp_zero = sparse_tensor.SparseTensor([[0]], [0], [7]) + sp_one = sparse_tensor.SparseTensor([[1]], [1], [7]) res = tf.sparse_minimum(sp_zero, sp_one).eval() # "res" should be equal to SparseTensor([[0], [1]], [0, 0], [7]). 
``` @@ -1498,7 +1504,7 @@ def sparse_minimum(sp_a, sp_b, name=None): sp_b.values, sp_b.shape, name=name) - return ops.SparseTensor(out_indices, out_values, sp_a.shape) + return sparse_tensor.SparseTensor(out_indices, out_values, sp_a.shape) ops.RegisterShape("SparseSparseMaximum")(common_shapes.call_cpp_shape_fn) @@ -1547,8 +1553,9 @@ def sparse_transpose(sp_input, perm=None, name=None): array_ops.gather(array_ops.transpose(indices), perm)) dense_shape = sp_input.shape transposed_dense_shape = array_ops.gather(dense_shape, perm) - transposed_st = ops.SparseTensor(transposed_indices, sp_input.values, - transposed_dense_shape) + transposed_st = sparse_tensor.SparseTensor( + transposed_indices, sp_input.values, + transposed_dense_shape) transposed_st = sparse_reorder(transposed_st) return transposed_st @@ -1691,7 +1698,7 @@ def _take_many_sparse_from_tensors_map( output_indices.set_shape([None, rank]) output_shape.set_shape([rank]) - return ops.SparseTensor(output_indices, output_values, output_shape) + return sparse_tensor.SparseTensor(output_indices, output_values, output_shape) ops.RegisterShape("AddSparseToTensorsMap")(common_shapes.call_cpp_shape_fn) diff --git a/tensorflow/python/ops/standard_ops.py b/tensorflow/python/ops/standard_ops.py index 9267b8ef2ee..847d1b99c83 100644 --- a/tensorflow/python/ops/standard_ops.py +++ b/tensorflow/python/ops/standard_ops.py @@ -67,6 +67,11 @@ from tensorflow.python.ops.state_ops import scatter_div from tensorflow.python.ops.state_ops import scatter_mul from tensorflow.python.ops.state_ops import scatter_sub from tensorflow.python.ops.state_ops import scatter_update +from tensorflow.python.ops.state_ops import scatter_nd_add +from tensorflow.python.ops.state_ops import scatter_nd_sub +from tensorflow.python.ops.state_ops import scatter_nd_mul +from tensorflow.python.ops.state_ops import scatter_nd_div +from tensorflow.python.ops.state_ops import scatter_nd_update from tensorflow.python.ops.string_ops import * from tensorflow.python.ops.template import * from tensorflow.python.ops.tensor_array_ops import * diff --git a/tensorflow/python/ops/state_grad.py b/tensorflow/python/ops/state_grad.py index 871ce780c5c..314f9f0c1af 100644 --- a/tensorflow/python/ops/state_grad.py +++ b/tensorflow/python/ops/state_grad.py @@ -20,7 +20,7 @@ from __future__ import division from __future__ import print_function from tensorflow.python.framework import ops -from tensorflow.python.ops import state_ops + # TODO(b/31222613): These ops may be differentiable, and there may be # latent bugs here. @@ -43,3 +43,14 @@ ops.NotDifferentiable("ScatterMul") ops.NotDifferentiable("ScatterDiv") + + +ops.NotDifferentiable("ScatterNdUpdate") + +ops.NotDifferentiable("ScatterNdAdd") + +ops.NotDifferentiable("ScatterNdSub") + +ops.NotDifferentiable("ScatterNdMul") + +ops.NotDifferentiable("ScatterNdDiv") diff --git a/tensorflow/python/ops/state_ops.py b/tensorflow/python/ops/state_ops.py index 636acc3e2ad..2c12865df06 100644 --- a/tensorflow/python/ops/state_ops.py +++ b/tensorflow/python/ops/state_ops.py @@ -22,15 +22,15 @@ TensorFlow provides a set of functions to help manage the set of variables collected in the graph. 
-@@all_variables -@@trainable_variables +@@global_variables @@local_variables @@model_variables +@@trainable_variables @@moving_average_variables -@@initialize_all_variables -@@initialize_variables -@@initialize_local_variables +@@global_variables_initializer +@@local_variables_initializer +@@variables_initializer @@is_variable_initialized @@report_uninitialized_variables @@assert_variables_initialized @@ -95,6 +95,11 @@ automatically by the optimizers in most cases. @@scatter_sub @@scatter_mul @@scatter_div +@@scatter_nd_update +@@scatter_nd_add +@@scatter_nd_sub +@@scatter_nd_mul +@@scatter_nd_div @@sparse_mask @@IndexedSlices @@ -108,6 +113,13 @@ automatically by the optimizers in most cases. @@export_meta_graph @@import_meta_graph +# Deprecated functions (removed after 2017-03-02). Please don't use them. + +@@all_variables +@@initialize_all_variables +@@initialize_local_variables +@@initialize_variables + """ from __future__ import absolute_import @@ -209,3 +221,34 @@ ops.RegisterShape("ScatterDiv")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("ScatterMul")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("ScatterSub")(common_shapes.call_cpp_shape_fn) ops.RegisterShape("ScatterUpdate")(common_shapes.call_cpp_shape_fn) + + +@ops.RegisterShape("ScatterNdAdd") +@ops.RegisterShape("ScatterNdSub") +@ops.RegisterShape("ScatterNdMul") +@ops.RegisterShape("ScatterNdDiv") +@ops.RegisterShape("ScatterNdUpdate") +def scatter_nd_update_shape(op): + """Shape function for the ScatterNd update ops.""" + ref_shape = op.inputs[0].get_shape() + indices_shape = op.inputs[1].get_shape() + updates_shape = op.inputs[2].get_shape() + + if indices_shape.ndims is not None and ref_shape.ndims is not None: + outer_dims = len(indices_shape) - 1 + ixdim = indices_shape[-1].value or 0 + + if not indices_shape[:outer_dims].is_compatible_with( + updates_shape[:outer_dims]): + raise ValueError("The outer %d dimensions of indices.shape=%s must " + "match the outer %d dimensions of updates.shape=%s" % ( + outer_dims, indices_shape, outer_dims, + updates_shape)) + + if not ref_shape[ixdim:].is_compatible_with(updates_shape[outer_dims:]): + raise ValueError("The inner %d dimensions of ref.shape=%s must match " + "the inner %d dimensions of updates.shape=%s" % ( + len(ref_shape)-ixdim, ref_shape, + len(updates_shape)-outer_dims, updates_shape)) + + return [ref_shape] diff --git a/tensorflow/python/ops/string_ops.py b/tensorflow/python/ops/string_ops.py index c3eef9813c3..830134da9f8 100644 --- a/tensorflow/python/ops/string_ops.py +++ b/tensorflow/python/ops/string_ops.py @@ -50,6 +50,7 @@ import six from tensorflow.python.framework import common_shapes from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor # pylint: disable=unused-import from tensorflow.python.ops import gen_string_ops @@ -107,7 +108,7 @@ def string_split(source, delimiter=" "): # pylint: disable=invalid-name indices.set_shape([None, 2]) values.set_shape([None]) shape.set_shape([2]) - return ops.SparseTensor(indices, values, shape) + return sparse_tensor.SparseTensor(indices, values, shape) ops.NotDifferentiable("StringToHashBucket") diff --git a/tensorflow/python/ops/variables.py b/tensorflow/python/ops/variables.py index 9eec0d215dc..45261ecaac9 100644 --- a/tensorflow/python/ops/variables.py +++ b/tensorflow/python/ops/variables.py @@ -26,6 +26,7 @@ from tensorflow.python.ops import control_flow_ops from tensorflow.python.ops import gen_state_ops from 
tensorflow.python.ops import math_ops from tensorflow.python.ops import state_ops +from tensorflow.python.util.deprecation import deprecated class Variable(object): @@ -82,16 +83,16 @@ class Variable(object): ``` The most common initialization pattern is to use the convenience function - `initialize_all_variables()` to add an Op to the graph that initializes + `global_variables_initializer()` to add an Op to the graph that initializes all the variables. You then run that Op after launching the graph. ```python - # Add an Op to initialize all variables. - init_op = tf.initialize_all_variables() + # Add an Op to initialize global variables. + init_op = tf.global_variables_initializer() # Launch the graph in a session. with tf.Session() as sess: - # Run the Op that initializes all variables. + # Run the Op that initializes global variables. sess.run(init_op) # ...you can now run any Op that uses variable values... ``` @@ -102,8 +103,8 @@ class Variable(object): All variables are automatically collected in the graph where they are created. By default, the constructor adds the new variable to the graph - collection `GraphKeys.VARIABLES`. The convenience function - `all_variables()` returns the contents of that collection. + collection `GraphKeys.GLOBAL_VARIABLES`. The convenience function + `global_variables()` returns the contents of that collection. When building a machine learning model it is often convenient to distinguish between variables holding the trainable model parameters and other variables @@ -159,7 +160,7 @@ class Variable(object): """Creates a new variable with value `initial_value`. The new variable is added to the graph collections listed in `collections`, - which defaults to `[GraphKeys.VARIABLES]`. + which defaults to `[GraphKeys.GLOBAL_VARIABLES]`. If `trainable` is `True` the variable is also added to the graph collection `GraphKeys.TRAINABLE_VARIABLES`. @@ -178,7 +179,7 @@ class Variable(object): collection `GraphKeys.TRAINABLE_VARIABLES`. This collection is used as the default list of variables to use by the `Optimizer` classes. collections: List of graph collections keys. The new variable is added to - these collections. Defaults to `[GraphKeys.VARIABLES]`. + these collections. Defaults to `[GraphKeys.GLOBAL_VARIABLES]`. validate_shape: If `False`, allows the variable to be initialized with a value of unknown shape. If `True`, the default, the shape of `initial_value` must be known. @@ -245,7 +246,7 @@ class Variable(object): collection `GraphKeys.TRAINABLE_VARIABLES`. This collection is used as the default list of variables to use by the `Optimizer` classes. collections: List of graph collections keys. The new variable is added to - these collections. Defaults to `[GraphKeys.VARIABLES]`. + these collections. Defaults to `[GraphKeys.GLOBAL_VARIABLES]`. validate_shape: If `False`, allows the variable to be initialized with a value of unknown shape. If `True`, the default, the shape of `initial_value` must be known.
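The docstring edits above track the collection rename (`GraphKeys.VARIABLES` to `GraphKeys.GLOBAL_VARIABLES`) and the initializer rename. A sketch of the initialization idiom the revised docstrings describe, assuming the renamed functions are re-exported at the top level as `tf.global_variables_initializer` (as the docstrings imply):

```python
import tensorflow as tf

v = tf.Variable([1, 2], name="v")

# Replaces the now-deprecated tf.initialize_all_variables().
init_op = tf.global_variables_initializer()

with tf.Session() as sess:
    sess.run(init_op)   # initializes every variable in GLOBAL_VARIABLES
    print(sess.run(v))  # [1 2]
```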
@@ -275,7 +276,7 @@ class Variable(object): "dtype must also be specified when initial_value is callable.") if collections is None: - collections = [ops.GraphKeys.VARIABLES] + collections = [ops.GraphKeys.GLOBAL_VARIABLES] if not isinstance(collections, (list, tuple, set)): raise ValueError( "collections argument to Variable constructor must be a list, tuple, " @@ -479,7 +480,7 @@ class Variable(object): ```python v = tf.Variable([1, 2]) - init = tf.initialize_all_variables() + init = tf.global_variables_initializer() with tf.Session() as sess: sess.run(init) @@ -1037,17 +1038,28 @@ class PartitionedVariable(object): "assign() has not been implemented for PartitionedVariable.") -def all_variables(): - """Returns all variables that must be saved/restored. +def global_variables(): + """Returns global variables. - The `Variable()` constructor automatically adds new variables to the graph - collection `GraphKeys.VARIABLES`. This convenience function returns the - contents of that collection. + Global variables are variables that are shared across machines in a + distributed environment. The `Variable()` constructor or `get_variable()` + automatically adds new variables to the graph collection + `GraphKeys.GLOBAL_VARIABLES`. + This convenience function returns the contents of that collection. + + An alternative to global variables is local variables. See + [`tf.local_variables()`](../../api_docs/python/state_ops.md#local_variables) Returns: A list of `Variable` objects. """ - return ops.get_collection(ops.GraphKeys.VARIABLES) + return ops.get_collection(ops.GraphKeys.GLOBAL_VARIABLES) + + +@deprecated("2017-03-02", "Please use tf.global_variables instead.") +def all_variables(): + """See `tf.global_variables`.""" + return global_variables() def _all_saveable_objects(): @@ -1057,8 +1069,37 @@ def _all_saveable_objects(): A list of `Variable` and `SaveableObject` to be checkpointed """ # TODO(andreasst): make this function public once things are settled. - return ops.get_collection(ops.GraphKeys.VARIABLES) + ops.get_collection( - ops.GraphKeys.SAVEABLE_OBJECTS) + return (ops.get_collection(ops.GraphKeys.GLOBAL_VARIABLES) + + ops.get_collection(ops.GraphKeys.SAVEABLE_OBJECTS)) + + +def local_variables(): + """Returns local variables. + + Local variables are per-process variables, usually not saved or restored + to checkpoint, and used for temporary or intermediate values. + For example, they can be used as counters for metrics computation or the + number of epochs this machine has read data. + The `local_variable()` function automatically adds a new variable to + `GraphKeys.LOCAL_VARIABLES`. + This convenience function returns the contents of that collection. + + An alternative to local variables is global variables. See + [`tf.global_variables()`](../../api_docs/python/state_ops.md#global_variables) + + Returns: + A list of local `Variable` objects. + """ + return ops.get_collection(ops.GraphKeys.LOCAL_VARIABLES) + + +def model_variables(): + """Returns all variables in the MODEL_VARIABLES collection. + + Returns: + A list of `Variable` objects. + """ + return ops.get_collection(ops.GraphKeys.MODEL_VARIABLES) def trainable_variables(): @@ -1075,24 +1116,6 @@ def trainable_variables(): return ops.get_collection(ops.GraphKeys.TRAINABLE_VARIABLES) -def local_variables(): - """Returns all variables created with collection=[LOCAL_VARIABLES]. - - Returns: - A list of local Variable objects.
- """ - return ops.get_collection(ops.GraphKeys.LOCAL_VARIABLES) - - -def model_variables(): - """Returns all variables in the MODEL_VARIABLES collection. - - Returns: - A list of local Variable objects. - """ - return ops.get_collection(ops.GraphKeys.MODEL_VARIABLES) - - def moving_average_variables(): """Returns all variables that maintain their moving averages. @@ -1107,7 +1130,7 @@ def moving_average_variables(): return ops.get_collection(ops.GraphKeys.MOVING_AVERAGE_VARIABLES) -def initialize_variables(var_list, name="init"): +def variables_initializer(var_list, name="init"): """Returns an Op that initializes a list of variables. After you launch the graph in a session, you can run the returned Op to @@ -1132,26 +1155,44 @@ def initialize_variables(var_list, name="init"): return control_flow_ops.no_op(name=name) -def initialize_all_variables(): - """Returns an Op that initializes all variables. +@deprecated("2017-03-02", "Use `tf.variables_initializer` instead.") +def initialize_variables(var_list, name="init"): + """See `tf.variables_initializer`.""" + return variables_initializer(var_list, name=name) - This is just a shortcut for `initialize_variables(all_variables())` + +def global_variables_initializer(): + """Returns an Op that initializes global variables. + + This is just a shortcut for `variable_initializers(global_variables())` Returns: - An Op that initializes all variables in the graph. + An Op that initializes global variables in the graph. """ - return initialize_variables(all_variables()) + return variables_initializer(global_variables()) -def initialize_local_variables(): +@deprecated("2017-03-02", "Use `tf.global_variables_initializer` instead.") +def initialize_all_variables(): + """See `tf.global_variables_initializer`.""" + return global_variables_initializer() + + +def local_variables_initializer(): """Returns an Op that initializes all local variables. - This is just a shortcut for `initialize_variables(local_variables())` + This is just a shortcut for `variable_initializers(local_variables())` Returns: An Op that initializes all local variables in the graph. """ - return initialize_variables(local_variables()) + return variables_initializer(local_variables()) + + +@deprecated("2017-03-02", "Use `tf.local_variables_initializer` instead.") +def initialize_local_variables(): + """See `tf.local_variables_initializer`.""" + return local_variables_initializer() def is_variable_initialized(variable): @@ -1182,13 +1223,13 @@ def assert_variables_initialized(var_list=None): Args: var_list: List of `Variable` objects to check. Defaults to the - value of `all_variables().` + value of `global_variables().` Returns: An Op, or None if there are no variables. """ if var_list is None: - var_list = all_variables() + local_variables() + var_list = global_variables() + local_variables() # Backwards compatibility for old-style variables. TODO(touts): remove. if not var_list: var_list = [] @@ -1217,7 +1258,7 @@ def report_uninitialized_variables(var_list=None, Args: var_list: List of `Variable` objects to check. Defaults to the - value of `all_variables() + local_variables()` + value of `global_variables() + local_variables()` name: Optional name of the `Operation`. Returns: @@ -1225,7 +1266,7 @@ def report_uninitialized_variables(var_list=None, 1-D tensor if there are no variables or no uninitialized variables. 
""" if var_list is None: - var_list = all_variables() + local_variables() + var_list = global_variables() + local_variables() # Backwards compatibility for old-style variables. TODO(touts): remove. if not var_list: var_list = [] @@ -1257,7 +1298,7 @@ ops.register_tensor_conversion_function( ops.register_dense_tensor_like_type(Variable) ops.register_proto_function( - ops.GraphKeys.VARIABLES, + ops.GraphKeys.GLOBAL_VARIABLES, proto_type=variable_pb2.VariableDef, to_proto=Variable.to_proto, from_proto=Variable.from_proto) diff --git a/tensorflow/python/platform/gfile.py b/tensorflow/python/platform/gfile.py index 16aab787731..33efb0aefaa 100644 --- a/tensorflow/python/platform/gfile.py +++ b/tensorflow/python/platform/gfile.py @@ -14,23 +14,37 @@ # ============================================================================== """Import router for file_io.""" -# pylint: disable=wildcard-import from __future__ import absolute_import from __future__ import division from __future__ import print_function -from tensorflow.python.lib.io import file_io +# pylint: disable=unused-import +from tensorflow.python.lib.io.file_io import copy as Copy +from tensorflow.python.lib.io.file_io import create_dir as MkDir +from tensorflow.python.lib.io.file_io import delete_file as Remove +from tensorflow.python.lib.io.file_io import delete_recursively as DeleteRecursively +from tensorflow.python.lib.io.file_io import file_exists as Exists +from tensorflow.python.lib.io.file_io import FileIO as _FileIO +from tensorflow.python.lib.io.file_io import get_matching_files as Glob +from tensorflow.python.lib.io.file_io import is_directory as IsDirectory +from tensorflow.python.lib.io.file_io import list_directory as ListDirectory +from tensorflow.python.lib.io.file_io import recursive_create_dir as MakeDirs +from tensorflow.python.lib.io.file_io import rename as Rename +from tensorflow.python.lib.io.file_io import stat as Stat +from tensorflow.python.lib.io.file_io import walk as Walk +# pylint: enable=unused-import +from tensorflow.python.util.all_util import remove_undocumented -class GFile(file_io.FileIO): - """File I/O wrappers with thread locking.""" +class GFile(_FileIO): + """File I/O wrappers without thread locking.""" def __init__(self, name, mode='r'): mode = mode.replace('b', '') super(GFile, self).__init__(name=name, mode=mode) -class FastGFile(file_io.FileIO): +class FastGFile(_FileIO): """File I/O wrappers without thread locking.""" def __init__(self, name, mode='r'): @@ -38,23 +52,27 @@ class FastGFile(file_io.FileIO): super(FastGFile, self).__init__(name=name, mode=mode) -# This should be kept consistent with the OSS implementation -# of the gfile interface. - # Does not alias to Open so that we use our version of GFile to strip # 'b' mode. Open = GFile -# pylint: disable=invalid-name -Exists = file_io.file_exists -IsDirectory = file_io.is_directory -Glob = file_io.get_matching_files -MkDir = file_io.create_dir -MakeDirs = file_io.recursive_create_dir -Remove = file_io.delete_file -DeleteRecursively = file_io.delete_recursively -ListDirectory = file_io.list_directory -Walk = file_io.walk -Stat = file_io.stat -Rename = file_io.rename -Copy = file_io.copy +# TODO(drpng): Find the right place to document these. 
+_allowed_symbols = [ + 'Copy', + 'DeleteRecursively', + 'Exists', + 'FastGFile', + 'GFile', + 'Glob', + 'IsDirectory', + 'ListDirectory', + 'Open', + 'MakeDirs', + 'MkDir', + 'Remove', + 'Rename', + 'Stat', + 'Walk', +] + +remove_undocumented(__name__, _allowed_symbols) diff --git a/tensorflow/python/saved_model/README.md b/tensorflow/python/saved_model/README.md new file mode 100644 index 00000000000..1323c91f86a --- /dev/null +++ b/tensorflow/python/saved_model/README.md @@ -0,0 +1,155 @@ +# TensorFlow SavedModel + +[TOC] + +## Overview +This document describes SavedModel, the universal serialization format for +[TensorFlow](https://www.tensorflow.org/) models. + +SavedModel provides a language-neutral format to save machine-learned models +that is recoverable and hermetic. It enables higher-level systems and tools to +produce, consume and transform TensorFlow models. + +## Features + +The following is a summary of the features in SavedModel: + +* Multiple graphs sharing a single set of variables and assets can be added to a + single SavedModel. Each graph is associated with a specific set of tags to + allow identification during a load or restore operation. +* Support for `SignatureDefs` + * Graphs that are used for inference tasks typically have a set of inputs + and outputs. This is called a `Signature`. + * SavedModel uses [SignatureDefs](https://github.com/tensorflow/tensorflow/blob/master/tensorflow/core/protobuf/meta_graph.proto) + to allow generic support for signatures that may need to be saved with the graphs. +* Support for `Assets`. + * Ops may depend on external files for initialization, such as + vocabularies; SavedModel supports these via `assets`. + * Assets are copied to the SavedModel location and can be read when loading + a specific meta graph def. +* Support for clearing devices before generating the SavedModel. + +The following is a summary of features that are NOT supported in SavedModel. +Higher-level frameworks and tools that use SavedModel may provide these. + +* Implicit versioning. +* Garbage collection. +* Atomic writes to the SavedModel location. + +## Background +SavedModel manages and builds upon existing TensorFlow primitives such as +`TensorFlow Saver` and `MetaGraphDef`. Specifically, SavedModel wraps a [TensorFlow Saver](https://github.com/tensorflow/tensorflow/tree/master/tensorflow/python/training/saver.py). +The Saver is primarily used to generate the variable checkpoints. SavedModel +will replace the existing [TensorFlow Inference Model Format](https://github.com/tensorflow/tensorflow/blob/master/tensorflow/contrib/session_bundle/README.md) +as the canonical way to export TensorFlow graphs for serving. + +## Components +A SavedModel directory has the following structure: + +``` +assets/ +assets.extra/ +variables/ + variables.data-?????-of-????? + variables.index +saved_model.pb +``` + +* SavedModel protocol buffer + * `saved_model.pb` or `saved_model.pbtxt` + * Includes the graph definitions as `MetaGraphDef` protocol buffers. +* Assets + * Subfolder called `assets`. + * Contains auxiliary files such as vocabularies, etc. +* Extra assets + * Subfolder where higher-level libraries and users can add their own assets + that co-exist with the model, but are not loaded by the graph. + * This subfolder is not managed by the SavedModel libraries. +* Variables + * Subfolder called `variables`. + * Includes output from the [TensorFlow Saver](https://github.com/tensorflow/tensorflow/tree/master/tensorflow/python/training/saver.py).
+ * `variables.data-?????-of-?????` + * `variables.index` + +## APIs +The APIs for building and loading a SavedModel are described in this section. + +### Builder +The SavedModel [builder](https://github.com/tensorflow/tensorflow/blob/master/tensorflow/python/saved_model/builder.py) +is implemented in Python. + +The `SavedModelBuilder` class provides functionality to save multiple meta graph +defs, associated variables and assets. + +To build a SavedModel, the first meta graph must be saved with variables. +Subsequent meta graphs will simply be saved with their graph definitions. If +assets need to be saved and written or copied to disk, they can be provided +when the meta graph def is added. If multiple meta graph defs are associated +with an asset of the same name, only the first version is retained. + +#### Tags +Each meta graph added to the SavedModel must be annotated with user-specified +tags. The tags provide a means to identify the specific meta graph to load and +restore, along with the shared set of variables and assets. These tags +typically annotate a MetaGraph with its functionality (e.g. serving or +training), and possibly hardware-specific aspects such as GPU. + +A subset of commonly used tags is specified in [Python](https://github.com/tensorflow/tensorflow/blob/master/tensorflow/python/saved_model/tag_constants.py) +and [C++](https://github.com/tensorflow/tensorflow/blob/master/tensorflow/cc/saved_model/tag_constants.h) +for the purpose of easy and consistent usability. + +#### Usage +The typical usage of `builder` is as follows: + +~~~python +export_dir = ... +... +builder = saved_model_builder.SavedModelBuilder(export_dir) +with tf.Session(graph=tf.Graph()) as sess: + ... + builder.add_meta_graph_and_variables(sess, + [tag_constants.TRAINING], + signature_def_map=foo_signatures, + assets_collection=foo_assets) +... +with tf.Session(graph=tf.Graph()) as sess: + ... + builder.add_meta_graph(["bar-tag", "baz-tag"]) +... +builder.save() +~~~ + +### Loader +The SavedModel loader is implemented in C++ and Python. + +#### Python +The Python version of the SavedModel [loader](https://github.com/tensorflow/tensorflow/blob/master/tensorflow/python/saved_model/loader.py) +provides load and restore capability for a SavedModel. The `load` operation +requires the session in which to restore the graph definition and variables, the +tags used to identify the meta graph def to load, and the location of the +SavedModel. Upon a load, the subset of variables and assets supplied as part of +the specific meta graph def will be restored into the supplied session. + +~~~python +export_dir = ... +... +with tf.Session(graph=tf.Graph()) as sess: + loader.load(sess, [tag_constants.TRAINING], export_dir) + ... +~~~ + +#### C++ +The C++ version of the SavedModel [loader](https://github.com/tensorflow/tensorflow/blob/master/tensorflow/cc/saved_model/loader.h) +provides an API to load a SavedModel from a path, while allowing +`SessionOptions` and `RunOptions`. As in the Python version, the tags +associated with the graph to be loaded must be specified. The loaded version of +SavedModel is referred to as `SavedModelBundle` +and contains the meta graph def and the session within which it is loaded. + +~~~c++ +const string export_dir = ... +SavedModelBundle bundle; +...
+LoadSavedModel(session_options, run_options, export_dir, {kSavedModelTagTrain}, + &bundle); +~~~ diff --git a/tensorflow/python/saved_model/builder.py b/tensorflow/python/saved_model/builder.py index 43b97cf70c6..523dd501ba6 100644 --- a/tensorflow/python/saved_model/builder.py +++ b/tensorflow/python/saved_model/builder.py @@ -49,10 +49,9 @@ class SavedModelBuilder(object): To build a SavedModel, the first meta graph must be saved with variables. Subsequent meta graphs will simply be saved with their graph definitions. If - assets need to be saved and written or copied to disk, they must be provided - as part of the first meta graph to be saved. Subsequent meta graphs can - provide a subset of the initial assets to be added to the SavedModel - definition. + assets need to be saved and written or copied to disk, they can be provided + when the meta graph def is added. If multiple meta graph defs are associated + with an asset of the same name, only the first version is retained. Each meta graph added to the SavedModel must be annotated with tags. The tags provide a means to identify the specific meta graph to load and restore, along @@ -253,7 +252,8 @@ class SavedModelBuilder(object): tags, signature_def_map=None, assets_collection=None, - legacy_init_op=None): + legacy_init_op=None, + clear_devices=False): """Adds the current meta graph to the SavedModel. Creates a Saver in the current scope and uses the Saver to export the meta @@ -268,7 +268,9 @@ class SavedModelBuilder(object): that this collection should be a subset of the assets saved as part of the first meta graph in the SavedModel. legacy_init_op: Op or group of ops to execute after the restore op upon a - load. + load. + clear_devices: Set to true if the device info on the default graph should + be cleared. Raises: AssertionError: If the variables for the SavedModel have not been saved @@ -290,7 +292,7 @@ class SavedModelBuilder(object): sharded=True, write_version=saver_pb2.SaverDef.V2) - meta_graph_def = saver.export_meta_graph() + meta_graph_def = saver.export_meta_graph(clear_devices=clear_devices) # Tag the meta graph def and add it to the SavedModel. self._tag_and_add_meta_graph(meta_graph_def, tags, signature_def_map) @@ -300,7 +302,8 @@ class SavedModelBuilder(object): tags, signature_def_map=None, assets_collection=None, - legacy_init_op=None): + legacy_init_op=None, + clear_devices=False): """Adds the current meta graph to the SavedModel and saves variables. Creates a Saver to save the variables from the provided session. Exports the @@ -318,6 +321,8 @@ class SavedModelBuilder(object): assets_collection: Assets collection to be saved with SavedModel. legacy_init_op: Op or group of ops to execute after the restore op upon a load. + clear_devices: Set to true if the device info on the default graph should + be cleared. """ if self._has_saved_variables: raise AssertionError("Variables and assets have already been saved. " @@ -346,7 +351,7 @@ class SavedModelBuilder(object): sharded=True, write_version=saver_pb2.SaverDef.V2) saver.save(sess, variables_path, write_meta_graph=False) - meta_graph_def = saver.export_meta_graph() + meta_graph_def = saver.export_meta_graph(clear_devices=clear_devices) # Tag the meta graph def and add it to the SavedModel.
self._tag_and_add_meta_graph(meta_graph_def, tags, signature_def_map) diff --git a/tensorflow/python/saved_model/saved_model_test.py b/tensorflow/python/saved_model/saved_model_test.py index a50620e113c..6f2132b4924 100644 --- a/tensorflow/python/saved_model/saved_model_test.py +++ b/tensorflow/python/saved_model/saved_model_test.py @@ -553,6 +553,29 @@ class SavedModelTest(tf.test.TestCase): tf.get_collection("init_op")[0].run() self.assertEqual(3, tf.get_collection("v")[2].eval()) + def testClearDevices(self): + export_dir = os.path.join(tf.test.get_temp_dir(), "test_clear_devices") + builder = saved_model_builder.SavedModelBuilder(export_dir) + + # Specify a device and save a variable. + tf.reset_default_graph() + with tf.Session( + target="", + config=config_pb2.ConfigProto(device_count={"CPU": 2})) as sess: + with sess.graph.device("/cpu:0"): + self._init_and_validate_variable(sess, "v", 42) + builder.add_meta_graph_and_variables( + sess, [tag_constants.TRAINING], clear_devices=True) + + # Save the SavedModel to disk. + builder.save() + + # Restore the graph with a single predefined tag whose variables were saved + # without any device information. + with self.test_session(graph=tf.Graph()) as sess: + loader.load(sess, [tag_constants.TRAINING], export_dir) + self.assertEqual(42, tf.get_collection(tf.GraphKeys.VARIABLES)[0].eval()) + if __name__ == "__main__": tf.test.main() diff --git a/tensorflow/python/summary/event_accumulator.py b/tensorflow/python/summary/event_accumulator.py index 063f100b94f..4c042218c8e 100644 --- a/tensorflow/python/summary/event_accumulator.py +++ b/tensorflow/python/summary/event_accumulator.py @@ -19,6 +19,7 @@ from __future__ import print_function import collections import os.path +import re import threading import numpy as np @@ -98,10 +99,18 @@ STORE_EVERYTHING_SIZE_GUIDANCE = { HISTOGRAMS: 0, } +# When files on Colossus are deleted, they are actually renamed. 
+_CNS_DELETED_FILE_PATTERN = re.compile(r'\.~\d+~(/|$)') + def IsTensorFlowEventsFile(path): """Check the path name to see if it is probably a TF Events file.""" - return 'tfevents' in compat.as_str_any(os.path.basename(path)) + if 'tfevents' not in compat.as_str_any(os.path.basename(path)): + return False + if _CNS_DELETED_FILE_PATTERN.search(path): + logging.info('Ignoring deleted Colossus file: %s', path) + return False + return True class EventAccumulator(object): diff --git a/tensorflow/python/summary/summary.py b/tensorflow/python/summary/summary.py index a6b348cc991..b5db6b802fa 100644 --- a/tensorflow/python/summary/summary.py +++ b/tensorflow/python/summary/summary.py @@ -35,8 +35,6 @@ from __future__ import print_function import re as _re -import six - from google.protobuf import json_format as _json_format from tensorflow.core.framework import summary_pb2 as _summary_pb2 from tensorflow.python.framework import dtypes as _dtypes @@ -47,8 +45,8 @@ from tensorflow.python.ops import gen_logging_ops as _gen_logging_ops from tensorflow.python.ops.summary_ops import tensor_summary # pylint: enable=unused-import from tensorflow.python.platform import tf_logging as _logging -from tensorflow.python.util.all_util import remove_undocumented from tensorflow.python.util import compat as _compat +from tensorflow.python.util.all_util import remove_undocumented def _collect(val, collections, default_collections): @@ -60,6 +58,7 @@ def _collect(val, collections, default_collections): _INVALID_TAG_CHARACTERS = _re.compile(r'[^-/\w\.]') + def _clean_tag(name): # In the past, the first argument to summary ops was a tag, which allowed # arbitrary characters. Now we are changing the first argument to be the node diff --git a/tensorflow/python/tools/BUILD b/tensorflow/python/tools/BUILD index cf944423087..6ddba9e510d 100644 --- a/tensorflow/python/tools/BUILD +++ b/tensorflow/python/tools/BUILD @@ -41,41 +41,6 @@ py_test( ], ) -py_library( - name = "graph_metrics_lib", - srcs = ["graph_metrics.py"], - srcs_version = "PY2AND3", - deps = [ - "//tensorflow:tensorflow_py", - ], -) - -py_binary( - name = "graph_metrics", - srcs = [ - "graph_metrics.py", - ], - main = "graph_metrics.py", - srcs_version = "PY2AND3", - deps = [ - "//tensorflow:tensorflow_py", - ], -) - -py_test( - name = "graph_metrics_test", - size = "small", - srcs = [ - "graph_metrics_test.py", - ], - srcs_version = "PY2AND3", - deps = [ - ":graph_metrics_lib", - "//tensorflow/python:framework_test_lib", - "//tensorflow/python:platform_test", - ], -) - py_binary( name = "inspect_checkpoint", srcs = [ diff --git a/tensorflow/python/tools/graph_metrics.py b/tensorflow/python/tools/graph_metrics.py deleted file mode 100644 index ecb0f091f6a..00000000000 --- a/tensorflow/python/tools/graph_metrics.py +++ /dev/null @@ -1,141 +0,0 @@ -# Copyright 2015 The TensorFlow Authors. All Rights Reserved. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. 
-# ============================================================================== - -"""Gives estimates of computation and parameter sizes for a GraphDef. - -This script takes a GraphDef representing a network, and produces rough -estimates of the number of floating-point operations needed to implement it and -how many parameters are stored. You need to pass in the input size, and the -results are only approximate, since it only calculates them for a subset of -common operations. - -If you have downloaded the Inception graph for the label_image example, an -example of using this script would be: - -bazel-bin/third_party/tensorflow/python/tools/graph_metrics \ ---graph tensorflow_inception_graph.pb \ ---statistics=weight_parameters,flops - -""" -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import locale - -import tensorflow as tf - -from google.protobuf import text_format - -from tensorflow.core.framework import graph_pb2 -from tensorflow.python.framework import ops - - -FLAGS = tf.flags.FLAGS - -tf.flags.DEFINE_string("graph", "", """TensorFlow 'GraphDef' file to load.""") -tf.flags.DEFINE_bool("input_binary", True, - """Whether the input files are in binary format.""") -tf.flags.DEFINE_string("input_layer", "Mul:0", - """The name of the input node.""") -tf.flags.DEFINE_integer("batch_size", 1, - """The batch size to use for the calculations.""") -tf.flags.DEFINE_string("statistics", "weight_parameters,flops", - """Which statistic types to examine.""") -tf.flags.DEFINE_string("input_shape_override", "", - """If this is set, the comma-separated values will be""" - """ used to set the shape of the input layer.""") -tf.flags.DEFINE_boolean("print_nodes", False, - """Whether to show statistics for each op.""") - - -def print_stat(prefix, statistic_type, value): - if value is None: - friendly_value = "None" - else: - friendly_value = locale.format("%d", value, grouping=True) - print("%s%s=%s" % (prefix, statistic_type, friendly_value)) - - -def main(unused_args): - if not tf.gfile.Exists(FLAGS.graph): - print("Input graph file '" + FLAGS.graph + "' does not exist!") - return -1 - graph_def = graph_pb2.GraphDef() - with open(FLAGS.graph, "rb") as f: - if FLAGS.input_binary: - graph_def.ParseFromString(f.read()) - else: - text_format.Merge(f.read(), graph_def) - statistic_types = FLAGS.statistics.split(",") - if FLAGS.input_shape_override: - input_shape_override = map(int, FLAGS.input_shape_override.split(",")) - else: - input_shape_override = None - total_stats, node_stats = calculate_graph_metrics( - graph_def, statistic_types, FLAGS.input_layer, input_shape_override, - FLAGS.batch_size) - if FLAGS.print_nodes: - for node in graph_def.node: - for statistic_type in statistic_types: - current_stats = node_stats[statistic_type][node.name] - print_stat(node.name + "(" + node.op + "): ", statistic_type, - current_stats.value) - for statistic_type in statistic_types: - value = total_stats[statistic_type].value - print_stat("Total: ", statistic_type, value) - - -def calculate_graph_metrics(graph_def, statistic_types, input_layer, - input_shape_override, batch_size): - """Looks at the performance statistics of all nodes in the graph.""" - _ = tf.import_graph_def(graph_def, name="") - total_stats = {} - node_stats = {} - for statistic_type in statistic_types: - total_stats[statistic_type] = ops.OpStats(statistic_type) - node_stats[statistic_type] = {} - # Make sure we get pretty-printed numbers with separators. 
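The pretty-printing that print_stat above and the setlocale call below relied on comes from the C locale machinery: setlocale with an empty string adopts the user's environment, after which grouped integer formatting inserts thousands separators. A minimal sketch, written with locale.format_string (the equivalent spelling of the locale.format call above that survives its later deprecation); the exact output depends on the active locale:

import locale

locale.setlocale(locale.LC_ALL, '')  # adopt the user's default locale
# Under an en_US-style locale this prints '1,234,567'; other locales differ.
print(locale.format_string('%d', 1234567, grouping=True))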
- locale.setlocale(locale.LC_ALL, "") - with tf.Session() as sess: - input_tensor = sess.graph.get_tensor_by_name(input_layer) - input_shape_tensor = input_tensor.get_shape() - if input_shape_tensor: - input_shape = input_shape_tensor.as_list() - else: - input_shape = None - if input_shape_override: - input_shape = input_shape_override - if input_shape is None: - raise ValueError("""No input shape was provided on the command line,""" - """ and the input op itself had no default shape, so""" - """ shape inference couldn't be performed. This is""" - """ required for metrics calculations.""") - input_shape[0] = batch_size - input_tensor.set_shape(input_shape) - for node in graph_def.node: - # Ensure that the updated input shape has been fully-propagated before we - # ask for the statistics, since they may depend on the output size. - op = sess.graph.get_operation_by_name(node.name) - ops.set_shapes_for_outputs(op) - for statistic_type in statistic_types: - current_stats = ops.get_stats_for_node_def(sess.graph, node, - statistic_type) - node_stats[statistic_type][node.name] = current_stats - total_stats[statistic_type] += current_stats - return total_stats, node_stats - -if __name__ == "__main__": - tf.app.run() diff --git a/tensorflow/python/tools/graph_metrics_test.py b/tensorflow/python/tools/graph_metrics_test.py deleted file mode 100644 index 827856291e9..00000000000 --- a/tensorflow/python/tools/graph_metrics_test.py +++ /dev/null @@ -1,50 +0,0 @@ -# Copyright 2015 The TensorFlow Authors. All Rights Reserved. -# -# Licensed under the Apache License, Version 2.0 (the "License"); -# you may not use this file except in compliance with the License. -# You may obtain a copy of the License at -# -# http://www.apache.org/licenses/LICENSE-2.0 -# -# Unless required by applicable law or agreed to in writing, software -# distributed under the License is distributed on an "AS IS" BASIS, -# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. -# See the License for the specific language governing permissions and -# limitations under the License. 
-# ============================================================================== -"""Tests the graph metrics tool.""" -from __future__ import absolute_import -from __future__ import division -from __future__ import print_function - -import tensorflow as tf - -from tensorflow.python.tools import graph_metrics - - -class GraphMetricsTest(tf.test.TestCase): - - def testGraphMetrics(self): - with tf.Graph().as_default(): - input_node = tf.placeholder(tf.float32, shape=[10, 20], name="input_node") - weights_node = tf.constant(0.0, - dtype=tf.float32, - shape=[20, 5], - name="weights_node") - tf.matmul(input_node, weights_node, name="matmul_node") - sess = tf.Session() - graph_def = sess.graph.as_graph_def() - statistic_types = ["weight_parameters", "flops"] - total_stats, node_stats = graph_metrics.calculate_graph_metrics( - graph_def, statistic_types, "input_node:0", None, 10) - expected = {"weight_parameters": 100, "flops": 2000} - for statistic_type in statistic_types: - current_stats = node_stats[statistic_type]["matmul_node"] - self.assertEqual(expected[statistic_type], current_stats.value) - for statistic_type in statistic_types: - current_stats = total_stats[statistic_type] - self.assertEqual(expected[statistic_type], current_stats.value) - - -if __name__ == "__main__": - tf.test.main() diff --git a/tensorflow/python/training/input.py b/tensorflow/python/training/input.py index c976f19775a..3031a907fef 100644 --- a/tensorflow/python/training/input.py +++ b/tensorflow/python/training/input.py @@ -31,6 +31,7 @@ from tensorflow.python import summary from tensorflow.python.framework import constant_op from tensorflow.python.framework import dtypes from tensorflow.python.framework import ops +from tensorflow.python.framework import sparse_tensor from tensorflow.python.framework import tensor_shape from tensorflow.python.ops import array_ops from tensorflow.python.ops import control_flow_ops @@ -407,7 +408,7 @@ def _store_sparse_tensors(tensor_list, enqueue_many, shared_map_ops=None): maybe_shared_map_ops = shared_map_ops or [None] * len(tensor_list) def _sparse_meta_data(t, storing_op, map_op): - if not isinstance(t, ops.SparseTensor): + if not isinstance(t, sparse_tensor.SparseTensor): return _SparseMetaData(False, None, None) rank = t.shape.get_shape().with_rank(1)[0] if enqueue_many: @@ -418,7 +419,7 @@ def _store_sparse_tensors(tensor_list, enqueue_many, shared_map_ops=None): sparse=True, map_op=map_op or storing_op, rank=rank) def _maybe_store(t, shared_map_op): - if not isinstance(t, ops.SparseTensor): + if not isinstance(t, sparse_tensor.SparseTensor): return t map_op_name = shared_map_op.name if shared_map_op else None return (_store_many_sparse(t, shared_name=map_op_name) if enqueue_many diff --git a/tensorflow/python/training/queue_runner.py b/tensorflow/python/training/queue_runner.py index fa8964f69fe..91999fa37db 100644 --- a/tensorflow/python/training/queue_runner.py +++ b/tensorflow/python/training/queue_runner.py @@ -225,8 +225,6 @@ class QueueRunner(object): coord: Optional Coordinator object for reporting errors and checking for stop conditions. """ - if coord: - coord.register_thread(threading.current_thread()) decremented = False try: while True: @@ -269,7 +267,6 @@ class QueueRunner(object): cancel_op: The Operation to run. coord: Coordinator. 
""" - coord.register_thread(threading.current_thread()) coord.wait_for_stop() try: sess.run(cancel_op) @@ -321,6 +318,8 @@ class QueueRunner(object): ret_threads.append(threading.Thread(target=self._close_on_stop, args=(sess, self._cancel_op, coord))) for t in ret_threads: + if coord: + coord.register_thread(t) if daemon: t.daemon = True if start: diff --git a/tensorflow/python/training/queue_runner_test.py b/tensorflow/python/training/queue_runner_test.py index 852935f7984..d21114bf479 100644 --- a/tensorflow/python/training/queue_runner_test.py +++ b/tensorflow/python/training/queue_runner_test.py @@ -25,19 +25,6 @@ import tensorflow as tf class QueueRunnerTest(tf.test.TestCase): - def _wait_for_thread_registration(self, coord, N): - """Wait for N threads to register with the coordinator. - - This is necessary in some tests that launch threads and - then want to join() them in the coordinator. - - Args: - coord: A Coordinator object. - N: Number of threads to wait for. - """ - while len(coord._registered_threads) < N: - time.sleep(0.001) - def testBasic(self): with self.test_session() as sess: # CountUpTo will raise OUT_OF_RANGE when it reaches the count. @@ -135,7 +122,6 @@ class QueueRunnerTest(tf.test.TestCase): threads = qr.create_threads(sess, coord) for t in threads: t.start() - self._wait_for_thread_registration(coord, len(threads)) coord.join() self.assertEqual(0, len(qr.exceptions_raised)) # The variable should be 0. @@ -149,7 +135,6 @@ class QueueRunnerTest(tf.test.TestCase): threads = qr.create_threads(sess, coord) for t in threads: t.start() - self._wait_for_thread_registration(coord, len(threads)) # The exception should be re-raised when joining. with self.assertRaisesRegexp(ValueError, "Operation not in the graph"): coord.join() @@ -162,9 +147,7 @@ class QueueRunnerTest(tf.test.TestCase): dequeue = queue.dequeue() qr = tf.train.QueueRunner(queue, [enqueue]) coord = tf.train.Coordinator() - threads = qr.create_threads(sess, coord, start=True) - # Wait for the threads to have registered with the coordinator. - self._wait_for_thread_registration(coord, len(threads)) + qr.create_threads(sess, coord, start=True) # Dequeue one element and then request stop. dequeue.op.run() time.sleep(0.02) diff --git a/tensorflow/python/training/training.py b/tensorflow/python/training/training.py index 1a11eb86f8d..a0f72e2d23e 100644 --- a/tensorflow/python/training/training.py +++ b/tensorflow/python/training/training.py @@ -51,6 +51,8 @@ functions below. @@stop_gradient +@@hessians + ## Gradient Clipping diff --git a/tensorflow/contrib/framework/python/framework/decorator_utils.py b/tensorflow/python/util/decorator_utils.py similarity index 84% rename from tensorflow/contrib/framework/python/framework/decorator_utils.py rename to tensorflow/python/util/decorator_utils.py index 155003498ce..c4b033d59ae 100644 --- a/tensorflow/contrib/framework/python/framework/decorator_utils.py +++ b/tensorflow/python/util/decorator_utils.py @@ -60,3 +60,25 @@ def validate_callable(func, decorator_name): ' @property appears before @%s in your source code:' '\n\n@property\n@%s\ndef method(...)' % ( func, decorator_name, decorator_name)) + + +class classproperty(object): # pylint: disable=invalid-name + """Class property decorator. 
+ + Example usage: + + class MyClass(object): + + @classproperty + def value(cls): + return '123' + + > print MyClass.value + 123 + """ + + def __init__(self, func): + self._func = func + + def __get__(self, owner_self, owner_cls): + return self._func(owner_cls) diff --git a/tensorflow/contrib/framework/python/framework/decorator_utils_test.py b/tensorflow/python/util/decorator_utils_test.py similarity index 97% rename from tensorflow/contrib/framework/python/framework/decorator_utils_test.py rename to tensorflow/python/util/decorator_utils_test.py index de24adcca65..7a72239ad03 100644 --- a/tensorflow/contrib/framework/python/framework/decorator_utils_test.py +++ b/tensorflow/python/util/decorator_utils_test.py @@ -22,8 +22,8 @@ from __future__ import print_function import functools import tensorflow as tf -from tensorflow.contrib.framework.python.framework import decorator_utils from tensorflow.python.platform import tf_logging as logging +from tensorflow.python.util import decorator_utils def _test_function(unused_arg=0): diff --git a/tensorflow/contrib/framework/python/framework/deprecation.py b/tensorflow/python/util/deprecation.py similarity index 99% rename from tensorflow/contrib/framework/python/framework/deprecation.py rename to tensorflow/python/util/deprecation.py index a93e23110fa..f92a9b77bc8 100644 --- a/tensorflow/contrib/framework/python/framework/deprecation.py +++ b/tensorflow/python/util/deprecation.py @@ -22,8 +22,8 @@ import functools import inspect import re -from tensorflow.contrib.framework.python.framework import decorator_utils from tensorflow.python.platform import tf_logging as logging +from tensorflow.python.util import decorator_utils def _add_deprecated_function_notice_to_docstring(doc, date, instructions): diff --git a/tensorflow/contrib/framework/python/framework/deprecation_test.py b/tensorflow/python/util/deprecation_test.py similarity index 99% rename from tensorflow/contrib/framework/python/framework/deprecation_test.py rename to tensorflow/python/util/deprecation_test.py index c5422f47316..791593189fe 100644 --- a/tensorflow/contrib/framework/python/framework/deprecation_test.py +++ b/tensorflow/python/util/deprecation_test.py @@ -20,8 +20,8 @@ from __future__ import division from __future__ import print_function import tensorflow as tf -from tensorflow.contrib.framework.python.framework import deprecation from tensorflow.python.platform import tf_logging as logging +from tensorflow.python.util import deprecation class DeprecationTest(tf.test.TestCase): diff --git a/tensorflow/stream_executor/device_memory.h b/tensorflow/stream_executor/device_memory.h index eb73133d313..bcb0664b043 100644 --- a/tensorflow/stream_executor/device_memory.h +++ b/tensorflow/stream_executor/device_memory.h @@ -145,23 +145,6 @@ class DeviceMemory final : public DeviceMemoryBase { } // ------------------------------------------------------------ - // DO NOT USE - FASTR TEAM-INTERNAL FUNCTIONS - // Used internally by gcudacc. -#ifdef __GCUDACC__ - // Implicit conversion operators needed to support mixed mode. Since buffer - // sizes aren't used in the CUDA launching process, and since the constructed - // objects are all temporary, this is safe. - // Linter warning disabled as we require an implicit conversion. 
- DeviceMemory(const ElemT *opaque) : // NOLINT - DeviceMemoryBase(reinterpret_cast<void *>(const_cast<ElemT *>(opaque)), - 0) {} - - operator ElemT *() { return reinterpret_cast<ElemT *>(opaque()); } - operator const ElemT *() { - return const_cast<const ElemT *>(reinterpret_cast<ElemT *>(opaque())); - } -#endif - - // ------------------------------------------------------------ protected: // This constructor is solely used from derived classes; it is made protected diff --git a/tensorflow/tensorboard/TAG b/tensorflow/tensorboard/TAG index a7873645902..8f92bfdd497 100644 --- a/tensorflow/tensorboard/TAG +++ b/tensorflow/tensorboard/TAG @@ -1 +1 @@ -34 +35 diff --git a/tensorflow/tensorboard/backend/server_test.py b/tensorflow/tensorboard/backend/server_test.py index dba0bbfd0eb..dc7c28e9e1c 100644 --- a/tensorflow/tensorboard/backend/server_test.py +++ b/tensorflow/tensorboard/backend/server_test.py @@ -27,6 +27,7 @@ import json import numbers import os import shutil +import tempfile import threading import zlib @@ -51,10 +52,10 @@ class TensorboardServerTest(tf.test.TestCase): _SCALAR_COUNT = 99 def setUp(self): - self._GenerateTestData() + temp_dir = self._GenerateTestData() self._multiplexer = event_multiplexer.EventMultiplexer( size_guidance=server.TENSORBOARD_SIZE_GUIDANCE) - server.ReloadMultiplexer(self._multiplexer, {self.get_temp_dir(): None}) + server.ReloadMultiplexer(self._multiplexer, {temp_dir: None}) # 0 to pick an unused port. self._server = server.BuildServer( self._multiplexer, 'localhost', 0, '/foo/logdir/argument') @@ -322,8 +323,11 @@ class TensorboardServerTest(tf.test.TestCase): - scalar events containing the value i at step 10 * i and wall time 100 * i, for i in [1, _SCALAR_COUNT). - a graph definition + + Returns: + temp_dir: The directory the test data is generated under. """ - temp_dir = self.get_temp_dir() + temp_dir = tempfile.mkdtemp(prefix=self.get_temp_dir()) self.addCleanup(shutil.rmtree, temp_dir) run1_path = os.path.join(temp_dir, 'run1') os.makedirs(run1_path) @@ -396,6 +400,8 @@ class TensorboardServerTest(tf.test.TestCase): if 'projector' in REGISTERED_PLUGINS: self._GenerateProjectorTestData(run1_path) + return temp_dir + def _GenerateProjectorTestData(self, run_path): # Write a projector config file in run1.
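One subtlety in the _GenerateTestData change above: tempfile.mkdtemp with an absolute prefix creates a uniquely named sibling whose path merely starts with get_temp_dir(), rather than a directory nested inside it, so every test run hands the multiplexer a directory containing only its own freshly written events. A minimal sketch of those semantics, using throwaway directories:

import shutil
import tempfile

base = tempfile.mkdtemp()               # e.g. '/tmp/tmpa1b2c3'
unique = tempfile.mkdtemp(prefix=base)  # e.g. '/tmp/tmpa1b2c3k5w8x1' -- a sibling, not a child
assert unique.startswith(base) and unique != base
shutil.rmtree(unique)
shutil.rmtree(base)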
config_path = os.path.join(run_path, 'projector_config.pbtxt') diff --git a/tensorflow/tensorboard/bower.json b/tensorflow/tensorboard/bower.json index 34eb3a28229..74ec32b16ec 100644 --- a/tensorflow/tensorboard/bower.json +++ b/tensorflow/tensorboard/bower.json @@ -17,6 +17,7 @@ "iron-overlay-behavior", "iron-range-behavior", "iron-resizable-behavior", + "iron-scroll-target-behavior", "iron-validatable-behavior", "neon-animation", "paper-dialog-behavior", @@ -49,14 +50,15 @@ "iron-form-element-behavior": "PolymerElements/iron-form-element-behavior#1.0.6", "iron-icon": "PolymerElements/iron-icon#1.0.11", "iron-icons": "PolymerElements/iron-icons#1.1.3", - "iron-iconset-svg": "PolymerElements/iron-iconset-svg#1.0.10", + "iron-iconset-svg": "PolymerElements/iron-iconset-svg#1.1.0", "iron-input": "PolymerElements/iron-input#1.0.10", "iron-list": "PolymerElements/iron-list#1.3.9", "iron-menu-behavior": "PolymerElements/iron-menu-behavior#1.1.10", "iron-meta": "PolymerElements/iron-meta#1.1.1", - "iron-overlay-behavior": "PolymerElements/iron-overlay-behavior#1.9.0", + "iron-overlay-behavior": "PolymerElements/iron-overlay-behavior#1.10.1", "iron-range-behavior": "PolymerElements/iron-range-behavior#1.0.4", "iron-resizable-behavior": "PolymerElements/iron-resizable-behavior#1.0.3", + "iron-scroll-target-behavior": "PolymerElements/iron-scroll-target-behavior#1.0.3", "iron-selector": "PolymerElements/iron-selector#1.5.2", "iron-validatable-behavior": "PolymerElements/iron-validatable-behavior#1.1.1", "lodash": "3.8.0", @@ -69,7 +71,7 @@ "paper-dialog-behavior": "PolymerElements/paper-dialog-behavior#1.2.5", "paper-dropdown-menu": "PolymerElements/paper-dropdown-menu#1.4.0", "paper-header-panel": "PolymerElements/paper-header-panel#1.1.4", - "paper-icon-button": "PolymerElements/paper-icon-button#1.1.2", + "paper-icon-button": "PolymerElements/paper-icon-button#1.1.3", "paper-input": "PolymerElements/paper-input#1.1.18", "paper-item": "PolymerElements/paper-item#1.1.4", "paper-listbox": "PolymerElements/paper-listbox#1.1.2", @@ -129,14 +131,15 @@ "iron-form-element-behavior": "1.0.6", "iron-icon": "1.0.11", "iron-icons": "1.1.3", - "iron-iconset-svg": "1.0.10", + "iron-iconset-svg": "1.1.0", "iron-input": "1.0.10", "iron-list": "1.3.9", "iron-menu-behavior": "1.1.10", "iron-meta": "1.1.1", - "iron-overlay-behavior": "1.9.0", + "iron-overlay-behavior": "1.10.1", "iron-range-behavior": "1.0.4", "iron-resizable-behavior": "1.0.3", + "iron-scroll-target-behavior": "1.0.3", "iron-selector": "1.5.2", "iron-validatable-behavior": "1.1.1", "lodash": "3.8.0", @@ -149,7 +152,7 @@ "paper-dialog-behavior": "1.2.5", "paper-dropdown-menu": "1.4.0", "paper-header-panel": "1.1.4", - "paper-icon-button": "1.1.2", + "paper-icon-button": "1.1.3", "paper-input": "1.1.18", "paper-item": "1.1.4", "paper-listbox": "1.1.2", diff --git a/tensorflow/tensorboard/bower/BUILD b/tensorflow/tensorboard/bower/BUILD index f5445750971..69abaedb12d 100644 --- a/tensorflow/tensorboard/bower/BUILD +++ b/tensorflow/tensorboard/bower/BUILD @@ -31,6 +31,7 @@ filegroup( "@iron_overlay_behavior//:iron_overlay_behavior", "@iron_range_behavior//:iron_range_behavior", "@iron_resizable_behavior//:iron_resizable_behavior", + "@iron_scroll_target_behavior//:iron_scroll_target_behavior", "@iron_selector//:iron_selector", "@iron_validatable_behavior//:iron_validatable_behavior", "@lodash//:lodash", diff --git a/tensorflow/tensorboard/components/tf_dashboard_common/tf-multi-checkbox.html 
b/tensorflow/tensorboard/components/tf_dashboard_common/tf-multi-checkbox.html index dadad81a343..8dfcb3153db 100644 --- a/tensorflow/tensorboard/components/tf_dashboard_common/tf-multi-checkbox.html +++ b/tensorflow/tensorboard/components/tf_dashboard_common/tf-multi-checkbox.html @@ -58,7 +58,7 @@ handle these situations gracefully. @@ -161,7 +161,10 @@ handle these situations gracefully. Polymer({ is: "tf-multi-checkbox", properties: { - names: Array, // All the runs in consideration + names: { + type: Array, + value: function() {return [];}, + }, // All the runs in consideration regexInput: { type: String, value: TF.URIStorage.getStringInitializer("regexInput", ""), @@ -175,15 +178,15 @@ handle these situations gracefully. type: Array, computed: "computeNamesMatchingRegex(names.*, regex)" }, // Runs that match the regex - runToIsCheckedMapping: { + runsDisabled: { type: Object, - value: TF.URIStorage.getObjectInitializer('runToIsCheckedMapping', {}), - }, // run name -> Boolean (if its enabled) + value: TF.URIStorage.getObjectInitializer('runsDisabled', {}), + }, // Every run that is disabled is stored in the map (with value true) // (Allows state to persist across regex filtering) outSelected: { type: Array, notify: true, - computed: 'computeOutSelected(namesMatchingRegex.*, runToIsCheckedMapping.*)' + computed: 'computeOutSelected(namesMatchingRegex.*, runsDisabled.*)' }, colorScale: { type: Object, @@ -219,11 +222,10 @@ handle these situations gracefully. 'dom-change': 'synchronizeColors', }, observers: [ - "_initializeRunToIsCheckedMapping(names.*)", - "_setIsolatorIcon(runToIsCheckedMapping)", - "_storeRunToIsCheckedMapping(runToIsCheckedMapping)", + "_setIsolatorIcon(runsDisabled, names)", + "_storeRunToIsCheckedMapping(runsDisabled)", ], - _storeRunToIsCheckedMapping: TF.URIStorage.getObjectObserver('runToIsCheckedMapping', {}), + _storeRunToIsCheckedMapping: TF.URIStorage.getObjectObserver('runsDisabled', {}), _makeRegex: function(regex) { try { return new RegExp(regex) @@ -232,29 +234,18 @@ handle these situations gracefully. } }, _setIsolatorIcon: function() { - var runMap = this.runToIsCheckedMapping; - var numChecked = _.filter(_.values(runMap)).length; + var runMap = this.runsDisabled; + var numChecked = this.names.length - _.filter(_.values(runMap)).length; var buttons = Array.prototype.slice.call(this.querySelectorAll(".isolator")); buttons.forEach(function(b) { - if (numChecked === 1 && runMap[b.name]) { + if (numChecked === 1 && !runMap[b.name]) { b.icon = "radio-button-checked"; } else { b.icon = "radio-button-unchecked"; } }); }, - _initializeRunToIsCheckedMapping: function(change) { - var runToIsCheckedMapping = _.clone(this.runToIsCheckedMapping); - - this.names.forEach(function(n) { - if (runToIsCheckedMapping[n] == null) { - // runs default to on - runToIsCheckedMapping[n] = true; - } - }); - this.runToIsCheckedMapping = runToIsCheckedMapping; - }, computeNamesMatchingRegex: function(__, ___) { var regex = this.regex; return this.names.filter(function(n) { @@ -262,9 +253,9 @@ handle these situations gracefully. }); }, computeOutSelected: function(__, ___) { - var runToIsCheckedMapping = this.runToIsCheckedMapping; + var runsDisabled = this.runsDisabled; return this.namesMatchingRegex.filter(function(n) { - return runToIsCheckedMapping[n]; + return !runsDisabled[n]; }); }, synchronizeColors: function(e) { @@ -296,24 +287,25 @@ handle these situations gracefully. // If user clicks on the label for one run, enable it and disable all other runs. 
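The inverted bookkeeping keys on absence: runsDisabled records only switched-off runs, so a run the map has never seen (including one that appears after the page loads) is enabled by default, the removed _initializeRunToIsCheckedMapping backfill becomes unnecessary, and the state persisted in the URI stays small. A minimal sketch of the idea in Python, with hypothetical run names:

# Only disabled runs are recorded; unknown runs therefore default to enabled.
runs_disabled = {}  # run name -> True, present only while the run is off

def is_checked(run):
    return run not in runs_disabled

def isolate(run, all_runs):
    # Label click: keep this run enabled and disable every other known run.
    return {r: True for r in all_runs if r != run}

runs = ['run1', 'run2', 'run3']
runs_disabled = isolate('run2', runs)
assert [r for r in runs if is_checked(r)] == ['run2']
assert is_checked('run4')  # a run that shows up later starts enabled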
var name = Polymer.dom(e).localTarget.name; - var _this = this; - _.keys(this.runToIsCheckedMapping).forEach(function(k) { - _this.runToIsCheckedMapping[k] = false; - }); - this.runToIsCheckedMapping[name] = true; - // we can't use notifyPath because the run names may have periods - this.runToIsCheckedMapping = _.clone(this.runToIsCheckedMapping); + var newDisabled = {}; + this.names.forEach(function(n) { + newDisabled[n] = true; + }) + delete newDisabled[name]; + this.runsDisabled = newDisabled; }, _checkboxChange: function(e) { var target = Polymer.dom(e).localTarget; - var name = target.name; - var checked = target.checked; - this.runToIsCheckedMapping[name] = checked; + if (target.checked) { + delete this.runsDisabled[target.name]; + } else { + this.runsDisabled[target.name] = true; + } // n.b. notifyPath won't work because run names may have periods. - this.runToIsCheckedMapping = _.clone(this.runToIsCheckedMapping); + this.runsDisabled = _.clone(this.runsDisabled); }, _isChecked: function(item, outSelectedChange) { - return this.runToIsCheckedMapping[item]; + return this.runsDisabled[item] == undefined; }, _initializeRuns: function(change) { this.outSelected = change.base.slice(); @@ -322,10 +314,15 @@ handle these situations gracefully. toggleAll: function() { var _this = this; var allOn = this.namesMatchingRegex - .filter(function(n) {return !_this.runToIsCheckedMapping[n]}) + .filter(function(n) {return _this.runsDisabled[n]}) .length === 0; - this.namesMatchingRegex.forEach(function(n) {_this.runToIsCheckedMapping[n] = !allOn}); - this.runToIsCheckedMapping = _.clone(this.runToIsCheckedMapping); + let newRunsDisabled = {} + if (allOn) { + this.names.forEach(function(n) { + newRunsDisabled[n] = true; + }) + } + this.runsDisabled = newRunsDisabled; }, }); diff --git a/tensorflow/tensorboard/components/tf_globals/globals.ts b/tensorflow/tensorboard/components/tf_globals/globals.ts index e985941d9cc..33feb26d238 100644 --- a/tensorflow/tensorboard/components/tf_globals/globals.ts +++ b/tensorflow/tensorboard/components/tf_globals/globals.ts @@ -15,15 +15,12 @@ limitations under the License. /* tslint:disable:no-namespace */ module TF.Globals { - const PROJECTOR_LAUNCHED = false; // The names of TensorBoard tabs. - export var TABS = - ['scalars', 'images', 'audio', 'graphs', 'distributions', 'histograms']; - - if (PROJECTOR_LAUNCHED) { - TABS.push('projections'); - } + export var TABS = [ + 'scalars', 'images', 'audio', 'graphs', 'distributions', 'histograms', + 'embeddings' + ]; // If true, TensorBoard stores its hash in the URI state. // If false, tab switching in TensorBoard will not update location hash, diff --git a/tensorflow/tensorboard/components/tf_image_dashboard/tf-image-dashboard.html b/tensorflow/tensorboard/components/tf_image_dashboard/tf-image-dashboard.html index 83945032bd1..0274a1f3391 100644 --- a/tensorflow/tensorboard/components/tf_image_dashboard/tf-image-dashboard.html +++ b/tensorflow/tensorboard/components/tf_image_dashboard/tf-image-dashboard.html @@ -16,6 +16,8 @@ limitations under the License. --> + + @@ -28,6 +30,7 @@ tf-image-dashboard displays a dashboard that loads images from a TensorFlow run. 
--> diff --git a/tensorflow/tensorboard/components/tf_image_dashboard/tf-image-loader.html b/tensorflow/tensorboard/components/tf_image_dashboard/tf-image-loader.html index b2e86bc6727..fc3e383f3c7 100644 --- a/tensorflow/tensorboard/components/tf_image_dashboard/tf-image-loader.html +++ b/tensorflow/tensorboard/components/tf_image_dashboard/tf-image-loader.html @@ -40,6 +40,7 @@ future for loading older images. } img { + image-rendering: -moz-crisp-edges; image-rendering: pixelated; display: block; width: 100%; diff --git a/tensorflow/tensorboard/components/tf_tensorboard/tf-tensorboard.html b/tensorflow/tensorboard/components/tf_tensorboard/tf-tensorboard.html index bdbb915a7a0..3d1f2ecf0bb 100644 --- a/tensorflow/tensorboard/components/tf_tensorboard/tf-tensorboard.html +++ b/tensorflow/tensorboard/components/tf_tensorboard/tf-tensorboard.html @@ -125,7 +125,7 @@ allows the user to toggle between various dashboards. > -