# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================

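"""Tests for XLA compilation of tf.function (experimental_compile=True)."""
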
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

from tensorflow.compiler.tests import xla_test
from tensorflow.python.eager import backprop
from tensorflow.python.eager import context
from tensorflow.python.eager import def_function
from tensorflow.python.framework import constant_op
from tensorflow.python.framework import dtypes
from tensorflow.python.framework import errors
from tensorflow.python.framework import ops
from tensorflow.python.framework import test_util
from tensorflow.python.ops import array_ops
from tensorflow.python.ops import control_flow_ops
from tensorflow.python.ops import control_flow_util
from tensorflow.python.ops import math_ops
from tensorflow.python.ops import random_ops
from tensorflow.python.ops import resource_variable_ops
from tensorflow.python.ops import tensor_array_ops
from tensorflow.python.ops import variables
from tensorflow.python.platform import test


class DefFunctionTest(xla_test.XLATestCase):

  def testAutoclusteringWithTfFunction(self):
    if 'tpu' in self.device.lower():
      self.skipTest('Autoclustering does not run on TPU')

    with ops.device('device:{}:0'.format(self.device)):

      @def_function.function(experimental_compile=False)
      def outer(a, b, c):
        return a * inner(b, c) + c

      @def_function.function(experimental_compile=True)
      def inner(b, c):
        return b + c * b

      i1 = constant_op.constant([1.0, 2.0, 3.0, 4.0, 5.0])
      i2 = constant_op.constant([1.0, 2.0, 3.0, 4.0, 5.0])
      i3 = constant_op.constant([1.0, 2.0, 3.0, 4.0, 5.0])

      with context.collect_graphs(optimized=True) as graphs:
        outer(i1, i2, i3)

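      # With auto-clustering enabled, the optimized graph should contain an
      # _XlaRun op, showing that a compiled cluster was actually executed.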
      if test_util.is_xla_enabled():
        self.assertIn('_XlaRun', [n.op for n in graphs[0].node])
      else:
        self.assertNotIn('_XlaRun', [n.op for n in graphs[0].node])

  def testBasic(self):
    with ops.device('device:{}:0'.format(self.device)):

      def fn(x, a):
        return x + a

      func = def_function.function(fn, experimental_compile=False)
      xla_func = def_function.function(fn, experimental_compile=True)

      inputs = constant_op.constant([1, 2, 2, 3, 3])
      self.assertAllClose([2, 3, 3, 4, 4], func(inputs, 1))
      self.assertAllClose([2, 3, 3, 4, 4], xla_func(inputs, 1))

  def testBasicInt32(self):
    with ops.device('device:{}:0'.format(self.device)):

      @def_function.function(experimental_compile=True)
      def fn(x, a):
        return x + a

      inputs = constant_op.constant([1, 2, 2, 3, 3], dtype=dtypes.int32)
      self.assertAllClose([2, 3, 3, 4, 4], fn(inputs, 1))

  def testDerivative(self):
    with ops.device('device:{}:0'.format(self.device)):

      def fn(x, a):
        return 2 * x + a

      xla_func = def_function.function(fn, experimental_compile=True)

      with backprop.GradientTape() as tape:
        inputs = constant_op.constant([1., 2., 2., 3., 3.])
        tape.watch(inputs)
        outputs = xla_func(inputs, 1)

      self.assertAllClose([2, 2, 2, 2, 2], tape.gradient(outputs, inputs))

      # pylint: disable=protected-access
      (forward, backward) = xla_func.get_concrete_function(
          inputs, 1)._delayed_rewrite_functions.forward_backward()

      # Check that the must-compile attribute gets correctly propagated to the
      # created derivatives.
      self.assertTrue(backward.function_def.attr['_XlaMustCompile'])
      self.assertTrue(forward.definition.attr['_XlaMustCompile'])

  # Calling a function compiled with experimental_compile=True from a
  # function with experimental_compile=False should compile the inner
  # function.
  def testNestedCall(self):
    if 'tpu' in self.device.lower():
      self.skipTest('b/162800687: Inner function runs on host')

    with ops.device('device:{}:0'.format(self.device)):

      @def_function.function(experimental_compile=True)
      def fn(x, a):
        return x + a

      @def_function.function(experimental_compile=False)
      def fn2(x, a):
        return fn(x, a)

      inputs = constant_op.constant([1, 2, 2, 3, 3])
      self.assertAllClose([2, 3, 3, 4, 4], fn2(inputs, 1))

  @test_util.disable_mlir_bridge('TODO(b/162272821): MLIR bridge returns'
                                 ' wrong status type')
  def testNestedCallUnsupportedOps(self):
    with ops.device('device:{}:0'.format(self.device)):

      def fn(x):
        return array_ops.unique(x).y

      xla_func = def_function.function(fn, experimental_compile=True)

      def fn2(x):
        return xla_func(x)

      func = def_function.function(fn2, experimental_compile=False)
      inputs = constant_op.constant([1, 2, 2, 3, 3])
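      # Even though the outer function is not compiled, the compiled inner
      # function must still reject ops that XLA cannot compile.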
      with self.assertRaisesRegex(errors.InvalidArgumentError,
                                  'not compilable'):
        func(inputs)

  @test_util.disable_mlir_bridge('TODO(b/162272821): MLIR bridge returns'
                                 ' wrong status type')
  def testUnsupportedOps(self):
    with ops.device('device:{}:0'.format(self.device)):

      def fn(x):
        return array_ops.unique(x).y  # Unique is not supported by XLA

      func = def_function.function(fn, experimental_compile=False)
      xla_func = def_function.function(fn, experimental_compile=True)

      inputs = constant_op.constant([1, 2, 2, 3, 3])
      self.assertAllClose([1, 2, 3], func(inputs))
      with self.assertRaisesRegex(errors.InvalidArgumentError,
                                  'not compilable'):
        xla_func(inputs)

  def testFunctionGradient(self):
    with ops.device('device:{}:0'.format(self.device)):
      v = resource_variable_ops.ResourceVariable(2.0)

      def fn(x):
        return v * x

      func = def_function.function(fn, experimental_compile=False)
      xla_func = def_function.function(fn, experimental_compile=True)

      def run_and_check(test_func):
        x = constant_op.constant(3.0)
        with backprop.GradientTape() as tape:
          y = test_func(x)
        dy = tape.gradient(y, v)

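        # y = v * x = 2.0 * 3.0 = 6.0 and dy/dv = x = 3.0.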
        self.assertAllClose(6.0, y)
        self.assertAllClose(3.0, dy)

      run_and_check(func)
      run_and_check(xla_func)

  @test_util.disable_mlir_bridge('TODO(b/162521846): MLIR bridge fails'
                                 ' under msan, function library not found')
  def testControlFlow(self):

    with ops.device('device:{}:0'.format(self.device)):

      @def_function.function(experimental_compile=True)
      def f(x):
        assert control_flow_util.GraphOrParentsInXlaContext(
            ops.get_default_graph())
        x = ops.convert_to_tensor(x)

        def body(i, a):
          return i + 1, control_flow_ops.cond(i > 2, lambda: a + (x**2),
                                              lambda: a + 3)

        return control_flow_ops.while_loop(
            lambda i, *_: i < 10,
            body, (constant_op.constant(0), constant_op.constant(3.)),
            maximum_iterations=10)[1]

      @def_function.function(experimental_compile=True)
      def g(x):
        x = ops.convert_to_tensor(x)
        with backprop.GradientTape() as tape:
          tape.watch(x)
          y = f(x)
        return y, tape.gradient(y, x)

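      # For x = 2: iterations i = 0, 1, 2 add 3 each and i = 3..9 add
      # x**2 = 4 each, so f(2) = 3 + 3*3 + 7*4 = 40 and df/dx = 7*2x = 28.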
      self.assertAllClose(40.0, f(2.0))
      self.assertAllClose([40.0, 28.0], g(2.0))
      self.assertAllClose(40.0, f.get_concrete_function(2.0)(2.0))
      self.assertAllClose([40.0, 28.0], g.get_concrete_function(2.0)(2.0))

  def testMethodCompilation(self):

    with ops.device('device:{}:0'.format(self.device)):

      class C(object):

        @def_function.function(experimental_compile=True)
        def f1(self, x, a):
          return x + a

      inputs = constant_op.constant([1, 2, 2, 3, 3])
      c = C()
      self.assertAllClose([2, 3, 3, 4, 4], c.f1(inputs, 1))

  @test_util.disable_mlir_bridge('TODO(b/162272821): MLIR bridge returns'
                                 ' wrong status type')
  def testMethodCompilationUnsupportedFunc(self):

    with ops.device('device:{}:0'.format(self.device)):

      class C(object):

        @def_function.function(experimental_compile=True)
        def f1(self, x):
          return array_ops.unique(x).y

      inputs = constant_op.constant([1, 2, 2, 3, 3])
      c = C()
      with self.assertRaisesRegex(errors.InvalidArgumentError,
                                  'not compilable'):
        c.f1(inputs)

  def testMustBeConstantPropagation(self):
    if 'tpu' in self.device.lower():
      self.skipTest('b/162799319: Cannot resolve constant on TPU')

    with ops.device('device:{}:0'.format(self.device)):

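      # The permutation argument of transpose must be a compile-time constant
      # in XLA, so the compiler has to constant-fold the output of f().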
      @def_function.function(experimental_compile=True)
      def f():
        return constant_op.constant([0, 2, 1], dtype=dtypes.int32)

      @def_function.function(experimental_compile=True)
      def g(a, b):
        return array_ops.transpose(a, b)

      @def_function.function
      def z():
        return g(array_ops.ones([3, 4, 3], dtype=dtypes.float32), f())

      z()

  @test_util.disable_mlir_bridge('TODO(b/162271237): argmax gives different'
                                 ' results in MLIR-based bridge')
  def testArgMinMax(self):
    with ops.device('device:{}:0'.format(self.device)):

      @def_function.function(experimental_compile=True)
      def argmax(x):
        return math_ops.argmax(x)

      @def_function.function(experimental_compile=True)
      def argmin(x):
        return math_ops.argmin(x)

      self.assertAllClose(0, argmax(array_ops.ones([10], dtype=dtypes.float32)))
      self.assertAllClose(0, argmax(array_ops.ones([10])))
      self.assertAllClose(0, argmin(array_ops.ones([10], dtype=dtypes.float32)))
      self.assertAllClose(0, argmin(array_ops.ones([10])))

  @test_util.disable_mlir_bridge('TensorArray support not implemented')
  def testErrorMessagePassingTensorArray(self):
    with ops.device('device:{}:0'.format(self.device)):

      @def_function.function(experimental_compile=True)
      def f(x):
        ta = tensor_array_ops.TensorArray(
            dtype=dtypes.float32, size=1, element_shape=[])
        ta = ta.write(0, 2 * x)
        y = ta.read(0)
        return y

      x = constant_op.constant(3.14)
      with backprop.GradientTape() as tape:
        tape.watch(x)
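        # Under the tape, the compiled forward pass has to emit its
        # intermediate TensorList for the backward pass; that list would cross
        # the XLA/TF boundary, which should fail with a descriptive error.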
        with self.assertRaisesRegex(errors.UnimplementedError,
                                    'TensorList crossing the XLA/TF boundary'):
          y = f(x)
          tape.gradient(y, x)

  @test_util.disable_mlir_bridge('TODO(b/162281863): MLIR bridge errors out'
                                 ' lowering TensorListConcatV2')
  def testTensorListConcatV2(self):
    with ops.device('device:{}:0'.format(self.device)):

      def f(x):
        ta = tensor_array_ops.TensorArray(
            dtype=dtypes.float32, size=2, element_shape=[3])
        ta = ta.write(0, 2 * x)
        ta = ta.write(1, 3 * x)
        return ta.concat()

      compiled_f = def_function.function(experimental_compile=True)(f)

      inputs = constant_op.constant([3.14, 2.68, 7.69])

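      # ta.concat() returns 2 * inputs followed by 3 * inputs.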
      self.assertAllClose([6.28, 5.36, 15.38, 9.42, 8.04, 23.07], f(inputs))

      self.assertAllClose(compiled_f(inputs), f(inputs))

  @test_util.disable_mlir_bridge('TODO(b/162281863): MLIR bridge errors out'
                                 ' lowering TensorListConcatV2')
  def testTensorListConcatV2Multidim(self):
    with ops.device('device:{}:0'.format(self.device)):

      def f(x):
        ta = tensor_array_ops.TensorArray(
            dtype=dtypes.float32, size=2, element_shape=[3, 2])
        ta = ta.write(0, 2 * x)
        ta = ta.write(1, 3 * x)
        return ta.concat()

      compiled_f = def_function.function(experimental_compile=True)(f)

      inputs = constant_op.constant([[3.14, 21.1], [2.68, 22.2], [7.69, 23.3]])
      self.assertAllClose(f(inputs), compiled_f(inputs))

  @test_util.disable_mlir_bridge('TODO(b/162281863): MLIR bridge errors out'
                                 ' lowering TensorListConcatV2')
  def testTensorListConcatV2Scalars(self):
    with ops.device('device:{}:0'.format(self.device)):

      def f(x):
        ta = tensor_array_ops.TensorArray(
            dtype=dtypes.float32, size=2, element_shape=[1])
        ta = ta.write(0, 2 * x)
        ta = ta.write(1, 3 * x)
        return ta.concat()

      compiled_f = def_function.function(experimental_compile=True)(f)
      inputs = constant_op.constant([3.14])
      self.assertAllClose(f(inputs), compiled_f(inputs))

  @test_util.disable_mlir_bridge('TODO(b/162281863): MLIR bridge errors out'
                                 ' lowering TensorListConcatV2')
  def testTensorListConcatGrad(self):
    with ops.device('device:{}:0'.format(self.device)):

      def f(x):
        ta = tensor_array_ops.TensorArray(
            dtype=dtypes.float32, size=2, element_shape=[3])
        ta = ta.write(0, 2 * x)
        ta = ta.write(1, 3 * x)
        return ta.concat()

      def g():
        x = constant_op.constant([3.14, 2.68, 7.69])
        with backprop.GradientTape() as tape:
          tape.watch(x)
          y = f(x)
        return tape.gradient(y, x)

      compiled_g = def_function.function(experimental_compile=True)(g)

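      # y concatenates 2*x and 3*x, so each element of x receives gradient
      # 2 + 3 = 5.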
      self.assertAllClose([5.0, 5.0, 5.0], g())
      self.assertAllClose(compiled_g(), g())

  @test_util.disable_mlir_bridge('TODO(b/162281863): MLIR bridge errors out'
                                 ' lowering TensorListConcatV2')
  def testTensorListConcatGradNestedCompile(self):
    with ops.device('device:{}:0'.format(self.device)):

      @def_function.function(experimental_compile=True)
      def f(x):
        ta = tensor_array_ops.TensorArray(
            dtype=dtypes.float32, size=2, element_shape=[3])
        ta = ta.write(0, 2 * x)
        ta = ta.write(1, 3 * x)
        return ta.concat()

      @def_function.function(experimental_compile=True)
      def g():
        x = constant_op.constant([3.14, 2.68, 7.69])
        with backprop.GradientTape() as tape:
          tape.watch(x)
          y = f(x)
        out = tape.gradient(y, x)
        return out

      self.assertAllClose([5.0, 5.0, 5.0], g())

  def testCumsum(self):
    if 'tpu' in self.device.lower():
      self.skipTest('b/162771302: 64bit rewrite of cumsum not supported')

    with ops.device('device:{}:0'.format(self.device)):

      @def_function.function(experimental_compile=True)
      def f(x):
        return math_ops.cumsum(x)

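      # A float64 input exercises the 64-bit path mentioned in the skip above.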
      f64_input = constant_op.constant([1.1, 2.2, 3.3], dtype=dtypes.float64)
      self.assertAllClose([1.1, 3.3, 6.6], f(f64_input))

  def testNoExcessiveRetracing(self):
    with ops.device('device:{}:0'.format(self.device)):
      inner_retracings = 0

      @def_function.function(experimental_compile=True)
      def inner(a, b):
        nonlocal inner_retracings
        inner_retracings += 1
        return a * b + a

      def outer(a, b):
        return inner(a, b)

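      # Wrapping outer in a fresh tf.function on each call should still reuse
      # the cached concrete function for inner, so inner traces exactly once.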
      func_input = random_ops.random_normal([10, 10])
      for _ in range(2):
        def_function.function(outer)(func_input, func_input)

      self.assertEqual(inner_retracings, 1)

  def testUpdateVariable(self):
    with ops.device('device:{}:0'.format(self.device)):

      on_gpu = 'gpu' in self.device.lower()
      v = variables.Variable([3.1, 3.2])

      @def_function.function(experimental_compile=True)
      def update_var(a, b):
        v.assign_add(a * b)

      arg1 = random_ops.random_normal([2])
      arg2 = random_ops.random_normal([2])

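      # On GPU, compare total device memory usage before and after the call:
      # the compiled assign_add should update the variable in place without
      # leaving extra allocations behind.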
      initial_usage = context.context().get_total_memory_usage(
          v.device) if on_gpu else 0
      update_var(arg1, arg2)
      final_usage = context.context().get_total_memory_usage(
          v.device) if on_gpu else 0
      self.assertEqual(initial_usage, final_usage)

  @test_util.disable_mlir_bridge('TODO(b/162381930): MLIR bridge renames'
                                 ' functions')
  def testUpdateVariableInClass(self):
    with ops.device('device:{}:0'.format(self.device)):

      class C(object):

        @def_function.function(experimental_compile=True)
        def update_var(self, a, b):
          if not hasattr(self, 'v'):
            self.v = variables.Variable(3.1)
          self.v.assign_add(a * b)

      c = C()

      @def_function.function
      def outer():
        c.update_var(constant_op.constant(0.7), constant_op.constant(0.6))

      outer()
      self.assertAllClose(c.v, 3.52)

  @test_util.disable_mlir_bridge('TODO(b/162801728): MLIR bridge causes'
                                 ' invalid free on TPUs')
  def testUpdateVariableMultipleOutputs(self):
    with ops.device('device:{}:0'.format(self.device)):
      v = variables.Variable(3.1)

      @def_function.function(experimental_compile=True)
      def update_var(a, b):
        v.assign_add(a * b)
        return a * b + v

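      # v becomes 3.1 + 0.7 * 0.6 = 3.52 and out is 0.7 * 0.6 + 3.52 = 3.94.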
      out = update_var(constant_op.constant(0.7), constant_op.constant(0.6))
      self.assertAllClose(v, 3.52)
      self.assertAllClose(out, 3.94)

  def testReturnIdentity(self):
    with ops.device('device:{}:0'.format(self.device)):

      @def_function.function(experimental_compile=True)
      def f(a, b):
        return (a, b)

      a = random_ops.random_normal([10, 10])
      b = random_ops.random_normal([10, 10])

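      # Returning the inputs unchanged should not copy them: device memory
      # usage must be the same before and after the call.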
      on_gpu = 'gpu' in self.device.lower()
      initial_usage = context.context().get_total_memory_usage(
          b.backing_device) if on_gpu else 0

      f(a, b)

      final_usage = context.context().get_total_memory_usage(
          b.backing_device) if on_gpu else 0
      self.assertEqual(initial_usage, final_usage)


if __name__ == '__main__':
  ops.enable_eager_execution()
  test.main()