Disable SparseFillEmptyRows[Grad] on GPU.

It breaks an internal workload with the error message "segment ids are not increasing", which probably means that the output indices are not sorted in some cases.

PiperOrigin-RevId: 371980850
Change-Id: Ie7eb322de5917fe55ee6318d262236e8db8da26d

commit: 6ec5f4a03e1181fbfcfdffa10a82cd52d9724ae9 [log] [tgz]
author: Sanjoy Das <sanjoy@google.com> Tue May 04 13:16:07 2021 -0700
committer: TensorFlower Gardener <gardener@tensorflow.org> Tue May 04 13:21:02 2021 -0700
tree: 9454fd13698405f86d7aa84485a99ad3e988e5fe
parent: 55338bb43c76edad2557be1cd62dc315c4106314 [diff]
diff --git a/tensorflow/core/kernels/sparse_fill_empty_rows_op.cc b/tensorflow/core/kernels/sparse_fill_empty_rows_op.cc
index de97e63..a2b8b07 100644
--- a/tensorflow/core/kernels/sparse_fill_empty_rows_op.cc
+++ b/tensorflow/core/kernels/sparse_fill_empty_rows_op.cc

@@ -263,7 +263,7 @@
 
 #undef REGISTER_KERNELS
 
-#if GOOGLE_CUDA || TENSORFLOW_USE_ROCM
+#if 0 && (GOOGLE_CUDA || TENSORFLOW_USE_ROCM)
 
 // The GPU implementation is async because it requires waiting for a
 // host->device memcpy before the output is allocated (similar to
@@ -411,7 +411,7 @@
 TF_CALL_NUMBER_TYPES(REGISTER_CPU_KERNELS);
 #undef REGISTER_CPU_KERNELS
 
-#if GOOGLE_CUDA || TENSORFLOW_USE_ROCM
+#if 0 && (GOOGLE_CUDA || TENSORFLOW_USE_ROCM)
 
 // Forward declarations of the functor specializations for GPU.
 namespace functor {
commit	6ec5f4a03e1181fbfcfdffa10a82cd52d9724ae9	[log] [tgz]
author	Sanjoy Das <sanjoy@google.com>	Tue May 04 13:16:07 2021 -0700
committer	TensorFlower Gardener <gardener@tensorflow.org>	Tue May 04 13:21:02 2021 -0700
tree	9454fd13698405f86d7aa84485a99ad3e988e5fe
parent	55338bb43c76edad2557be1cd62dc315c4106314 [diff]