From 6f4a1bfbf2c2077d7c26112d8862737c1190f186 Mon Sep 17 00:00:00 2001 From: Eugene Zhulenev Date: Fri, 19 Apr 2019 10:23:31 -0700 Subject: [PATCH] Merge non-build changes from #26722 PiperOrigin-RevId: 244379269 --- tensorflow/core/kernels/batchtospace_op.cc | 4 ++-- tensorflow/core/kernels/fill_functor.cu.cc | 4 ++-- third_party/eigen3/gpu_packet_math.patch | 4 ++-- 3 files changed, 6 insertions(+), 6 deletions(-) diff --git a/tensorflow/core/kernels/batchtospace_op.cc b/tensorflow/core/kernels/batchtospace_op.cc index e099dcfb0a0..b07c5fd718d 100644 --- a/tensorflow/core/kernels/batchtospace_op.cc +++ b/tensorflow/core/kernels/batchtospace_op.cc @@ -266,7 +266,7 @@ class BatchToSpaceOp : public OpKernel { TF_CALL_REAL_NUMBER_TYPES(REGISTER); #undef REGISTER -#if GOOGLE_CUDA || TENSORFLOW_USE_ROCM +#if GOOGLE_CUDA #define REGISTER(T) \ REGISTER_KERNEL_BUILDER(Name("BatchToSpaceND") \ .Device(DEVICE_GPU) \ @@ -282,6 +282,6 @@ TF_CALL_REAL_NUMBER_TYPES(REGISTER); TF_CALL_GPU_NUMBER_TYPES(REGISTER); #undef REGISTER -#endif // GOOGLE_CUDA || TENSORFLOW_USE_ROCM +#endif // GOOGLE_CUDA } // end namespace tensorflow diff --git a/tensorflow/core/kernels/fill_functor.cu.cc b/tensorflow/core/kernels/fill_functor.cu.cc index d4c92586897..c759be12d0f 100644 --- a/tensorflow/core/kernels/fill_functor.cu.cc +++ b/tensorflow/core/kernels/fill_functor.cu.cc @@ -13,7 +13,7 @@ See the License for the specific language governing permissions and limitations under the License. ==============================================================================*/ -#if GOOGLE_CUDA +#if GOOGLE_CUDA || TENSORFLOW_USE_ROCM #define EIGEN_USE_GPU @@ -116,4 +116,4 @@ TF_CALL_bool(DEFINE_SETONE_GPU); } // end namespace functor } // end namespace tensorflow -#endif // GOOGLE_CUDA +#endif // GOOGLE_CUDA || TENSORFLOW_USE_ROCM diff --git a/third_party/eigen3/gpu_packet_math.patch b/third_party/eigen3/gpu_packet_math.patch index 3d58cafd035..b8afb1b48f7 100644 --- a/third_party/eigen3/gpu_packet_math.patch +++ b/third_party/eigen3/gpu_packet_math.patch @@ -4,7 +4,7 @@ return make_double2(from, from); } -+#if defined(EIGEN_CUDA_ARCH) ++#if defined(EIGEN_CUDA_ARCH) || defined(EIGEN_HIP_DEVICE_COMPILE) namespace { EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE float bitwise_and(const float& a, @@ -12,7 +12,7 @@ pcmp_eq(const double2& a, const double2& b) { return make_double2(eq_mask(a.x, b.x), eq_mask(a.y, b.y)); } -+#endif // EIGEN_CUDA_ARCH ++#endif // EIGEN_CUDA_ARCH || defined(EIGEN_HIP_DEVICE_COMPILE) template<> EIGEN_DEVICE_FUNC EIGEN_STRONG_INLINE float4 plset(const float& a) { return make_float4(a, a+1, a+2, a+3);