# Copyright 2019 The TensorFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ==============================================================================
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
from tensorflow.compiler.tests import xla_test
from tensorflow.python.eager import backprop
from tensorflow.python.eager import context
from tensorflow.python.eager import def_function
from tensorflow.python.framework import constant_op
from tensorflow.python.framework import dtypes
from tensorflow.python.framework import errors
from tensorflow.python.framework import ops
from tensorflow.python.framework import tensor_spec
from tensorflow.python.framework import test_util
from tensorflow.python.ops import array_ops
from tensorflow.python.ops import control_flow_ops
from tensorflow.python.ops import control_flow_util
from tensorflow.python.ops import math_ops
from tensorflow.python.ops import random_ops
from tensorflow.python.ops import resource_variable_ops
from tensorflow.python.ops import tensor_array_ops
from tensorflow.python.ops import variables
from tensorflow.python.platform import test
class DefFunctionTest(xla_test.XLATestCase):
def testAutoclusteringWithTfFunction(self):
if 'tpu' in self.device.lower():
self.skipTest('Autoclustering does not run on TPU')
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=False)
def outer(a, b, c):
return a * inner(b, c) + c
@def_function.function(jit_compile=True)
def inner(b, c):
return b + c * b
i1 = constant_op.constant([1.0, 2.0, 3.0, 4.0, 5.0])
i2 = constant_op.constant([1.0, 2.0, 3.0, 4.0, 5.0])
i3 = constant_op.constant([1.0, 2.0, 3.0, 4.0, 5.0])
with context.collect_graphs(optimized=True) as graphs:
outer(i1, i2, i3)
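# With XLA enabled, autoclustering is expected to compile even the
# jit_compile=False outer function, so the optimized graph should contain
# an _XlaRun node; without XLA it should not.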
if test_util.is_xla_enabled():
self.assertIn('_XlaRun', [n.op for n in graphs[0].node])
else:
self.assertNotIn('_XlaRun', [n.op for n in graphs[0].node])
def testBasic(self):
with ops.device('device:{}:0'.format(self.device)):
def fn(x, a):
return x + a
func = def_function.function(fn, jit_compile=False)
xla_func = def_function.function(fn, jit_compile=True)
inputs = constant_op.constant([1, 2, 2, 3, 3])
self.assertAllClose([2, 3, 3, 4, 4], func(inputs, 1))
self.assertAllClose([2, 3, 3, 4, 4], xla_func(inputs, 1))
def testBasicInt32(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def fn(x, a):
return x + a
inputs = constant_op.constant([1, 2, 2, 3, 3], dtype=dtypes.int32)
self.assertAllClose([2, 3, 3, 4, 4], fn(inputs, 1))
def testDerivative(self):
with ops.device('device:{}:0'.format(self.device)):
def fn(x, a):
return 2 * x + a
xla_func = def_function.function(fn, jit_compile=True)
with backprop.GradientTape() as tape:
inputs = constant_op.constant([1., 2., 2., 3., 3.])
tape.watch(inputs)
outputs = xla_func(inputs, 1)
self.assertAllClose([2, 2, 2, 2, 2], tape.gradient(outputs, inputs))
# pylint: disable=protected-access
(forward, backward) = xla_func.get_concrete_function(
inputs, 1)._delayed_rewrite_functions.forward_backward()
# Check that the must-compile attribute gets correctly propagated to the
# created derivatives.
self.assertTrue(backward.function_def.attr['_XlaMustCompile'])
self.assertTrue(forward.definition.attr['_XlaMustCompile'])
# Calling a jit_compile=True function from a jit_compile=False function
# should compile the inner function.
def testNestedCall(self):
if 'tpu' in self.device.lower():
self.skipTest('b/162800687: Inner function runs on host')
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def fn(x, a):
return x + a
@def_function.function(jit_compile=False)
def fn2(x, a):
return fn(x, a)
inputs = constant_op.constant([1, 2, 2, 3, 3])
self.assertAllClose([2, 3, 3, 4, 4], fn2(inputs, 1))
def testNestedCallUnsupportedOps(self):
if 'tpu' in self.device.lower():
self.skipTest('XLA TPU supports tf.unique')
with ops.device('device:{}:0'.format(self.device)):
def fn(x):
return array_ops.unique(x).y
xla_func = def_function.function(fn, jit_compile=True)
def fn2(x):
return xla_func(x)
func = def_function.function(fn2, jit_compile=False)
inputs = constant_op.constant([1, 2, 2, 3, 3])
with self.assertRaisesRegex(
errors.InvalidArgumentError, 'legalization failed'
if test_util.is_mlir_bridge_enabled() else 'unsupported operations'):
func(inputs)
def testUnsupportedOps(self):
if 'tpu' in self.device.lower():
self.skipTest('XLA TPU supports tf.unique')
with ops.device('device:{}:0'.format(self.device)):
def fn(x):
return array_ops.unique(x).y # Unique is not supported by XLA
func = def_function.function(fn, jit_compile=False)
xla_func = def_function.function(fn, jit_compile=True)
inputs = constant_op.constant([1, 2, 2, 3, 3])
self.assertAllClose([1, 2, 3], func(inputs))
with self.assertRaisesRegex(
errors.InvalidArgumentError, 'legalization failed'
if test_util.is_mlir_bridge_enabled() else 'unsupported operations'):
xla_func(inputs)
@test_util.disable_mlir_bridge('TODO(b/155782411): MLIR bridge does not '
'support stack traces')
def testPythonLocationInMetadata(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def fn(x, y):
return x + y
inputs = constant_op.constant([1, 2, 2, 3, 3])
self.assertIn('def_function_xla_jit_test',
fn.experimental_get_compiler_ir(inputs, inputs)())
@test_util.disable_mlir_bridge('TODO(b/155782411): MLIR bridge does not '
'support stack traces')
def testPythonLocationNestedInMetadata(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f(x, y):
return x + y
@def_function.function(jit_compile=True)
def g(x, y):
return f(x, y)
inputs = constant_op.constant([1, 2, 2, 3, 3])
self.assertIn('def_function_xla_jit_test',
g.experimental_get_compiler_ir(inputs, inputs)())
def testPythonStackTrace(self):
if 'tpu' in self.device.lower():
self.skipTest('XLA TPU supports tf.unique')
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def fn(x):
return array_ops.unique(x).y # COMMENT2
inputs = constant_op.constant([1, 2, 2, 3, 3])
with self.assertRaisesRegex(errors.InvalidArgumentError, 'COMMENT2'):
fn(inputs)
@test_util.disable_mlir_bridge('TODO(b/181176476): Wrong stack trace for '
'failed legalization in MLIR bridge')
def testPythonStackTraceControlFlow(self):
if 'tpu' in self.device.lower():
self.skipTest('XLA TPU supports tf.unique')
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f(x):
x = ops.convert_to_tensor(x)
def body(i, a):
return i + 1 + array_ops.unique([i]).y[0], \
control_flow_ops.cond(i > 2, lambda: a + (x**2), lambda: a + 3)
return control_flow_ops.while_loop(
lambda i, *_: i < 10,
body, (constant_op.constant(0), constant_op.constant(3.)),
maximum_iterations=10)[1]
with self.assertRaisesRegex(errors.InvalidArgumentError, r'\.y\[0\]'):
f(constant_op.constant(100.0))
def testPythonStackTraceUncompiledWithinCompiled(self):
if 'tpu' in self.device.lower():
self.skipTest('XLA TPU supports tf.unique')
with ops.device('device:{}:0'.format(self.device)):
@def_function.function
def fn(x):
return array_ops.unique(x).y # COMMENT3
@def_function.function(jit_compile=True)
def outer(x):
return fn(x)
inputs = constant_op.constant([1, 2, 2, 3, 3])
with self.assertRaisesRegex(errors.InvalidArgumentError, 'COMMENT3'):
outer(inputs)
@test_util.disable_mlir_bridge('TODO(b/155782411): MLIR bridge does not '
'support stack traces')
def testPythonStackTraceCompiledWithinUncompiled(self):
if 'tpu' in self.device.lower():
self.skipTest('XLA TPU supports tf.unique')
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def fn(x):
return array_ops.unique(x).y # COMMENT1
@def_function.function
def outer(x):
return fn(x)
inputs = constant_op.constant([1, 2, 2, 3, 3])
with self.assertRaisesRegex(errors.InvalidArgumentError, 'COMMENT1'):
outer(inputs)
@test_util.disable_mlir_bridge('TODO(b/155782411): MLIR bridge does not '
'support stack traces')
def testPythonStackTraceCompiledWithinCompiled(self):
if 'tpu' in self.device.lower():
self.skipTest('XLA TPU supports tf.unique')
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def fn(x):
return array_ops.unique(x).y # COMMENT4
@def_function.function(jit_compile=True)
def outer(x):
return fn(x)
inputs = constant_op.constant([1, 2, 2, 3, 3])
with self.assertRaisesRegex(errors.InvalidArgumentError, 'COMMENT4'):
outer(inputs)
def testFunctionGradient(self):
with ops.device('device:{}:0'.format(self.device)):
v = resource_variable_ops.ResourceVariable(2.0)
def fn(x):
return v * x
func = def_function.function(fn, jit_compile=False)
xla_func = def_function.function(fn, jit_compile=True)
def run_and_check(test_func):
x = constant_op.constant(3.0)
with backprop.GradientTape() as tape:
y = test_func(x)
dy = tape.gradient(y, v)
self.assertAllClose(6.0, y)
self.assertAllClose(3.0, dy)
run_and_check(func)
run_and_check(xla_func)
@test_util.disable_mlir_bridge('TODO(b/162521846): MLIR bridge fails'
' msan, function library not found')
def testControlFlow(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f(x):
assert control_flow_util.GraphOrParentsInXlaContext(
ops.get_default_graph())
x = ops.convert_to_tensor(x)
def body(i, a):
return i + 1, control_flow_ops.cond(i > 2, lambda: a + (x**2),
lambda: a + 3)
return control_flow_ops.while_loop(
lambda i, *_: i < 10,
body, (constant_op.constant(0), constant_op.constant(3.)),
maximum_iterations=10)[1]
@def_function.function(jit_compile=True)
def g(x):
x = ops.convert_to_tensor(x)
with backprop.GradientTape() as tape:
tape.watch(x)
y = f(x)
return y, tape.gradient(y, x)
# Test that XLA context gets correctly propagated.
g._get_concrete_function_garbage_collected(2.0)(2.0)
self.assertAllClose(40.0, f(2.0))
self.assertAllClose([40.0, 28.0], g(2.0))
self.assertAllClose(40.0, f.get_concrete_function(2.0)(2.0))
self.assertAllClose([40.0, 28.0], g.get_concrete_function(2.0)(2.0))
def testWhileLoopWithUnmodifiedCarriedShape(self):
with ops.device('device:{}:0'.format(self.device)):
signature = [tensor_spec.TensorSpec(shape=[None], dtype=dtypes.float32)]
# The signature specifies an unknown vector shape; test that the
# constness of tf.shape gets properly propagated into the while_loop
# even when the shape is carried as part of the loop state.
@def_function.function(input_signature=signature, jit_compile=True)
def g(x):
return control_flow_ops.while_loop_v2(
lambda *_: True,
lambda y, shp: (y + random_ops.random_normal(shp)**2, shp),
(x, array_ops.shape(x)),
maximum_iterations=3)[0]
self.assertAllGreater(g(array_ops.zeros([7])), 0.)
def testNestedWhileLoopWithUnmodifiedCarriedShape(self):
with ops.device('device:{}:0'.format(self.device)):
signature = [tensor_spec.TensorSpec(shape=[None], dtype=dtypes.float32)]
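# As above, but the constness of the captured shape should also survive
# being carried through nested while loops and through identity_n.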
@def_function.function(input_signature=signature, jit_compile=True)
def g(x):
def inner(z, shp):
return z + random_ops.random_normal(shp)**2, shp
def outer(y, shp):
y, shp = control_flow_ops.while_loop_v2(
lambda *_: True, inner, (y, shp), maximum_iterations=3)
y, shp = array_ops.identity_n([y, shp])
return control_flow_ops.while_loop_v2(
lambda *_: True, inner, (y, shp), maximum_iterations=5)
shp = array_ops.shape(x, name='x_shp')
return control_flow_ops.while_loop_v2(
lambda *_: True, outer, (x, shp), maximum_iterations=4)[0]
self.assertAllGreater(g(array_ops.zeros([7])), 0.)
def testNestedWhileLoopWithUnmodifiedCarriedShapeSlice(self):
with ops.device('device:{}:0'.format(self.device)):
signature = [
tensor_spec.TensorSpec(shape=[None, None], dtype=dtypes.float32)
]
@def_function.function(input_signature=signature, jit_compile=True)
def g(x):
def inner(z, shp):
return z + random_ops.random_normal(shp)**2, shp
def outer(y, shp):
y, shp = control_flow_ops.while_loop_v2(
lambda *_: True, inner, (y, shp), maximum_iterations=3)
return control_flow_ops.while_loop_v2(
lambda *_: True, inner, (y, shp), maximum_iterations=4)
shp = array_ops.shape(x, name='x_shp')
x = control_flow_ops.while_loop_v2(
lambda *_: True, outer, (x, shp), maximum_iterations=5)[0]
shp2 = array_ops.shape(x, name='x_shp_after')[1:]
w = control_flow_ops.while_loop_v2(
lambda *_: True,
outer, (array_ops.zeros_like(x[0]), shp2),
maximum_iterations=6)[0]
return x + w
self.assertAllGreater(g(array_ops.zeros([7, 13])), 0.)
def testMethodCompilation(self):
with ops.device('device:{}:0'.format(self.device)):
class C(object):
@def_function.function(jit_compile=True)
def f1(self, x, a):
return x + a
inputs = constant_op.constant([1, 2, 2, 3, 3])
c = C()
self.assertAllClose([2, 3, 3, 4, 4], c.f1(inputs, 1))
def testMethodCompilationUnsupportedFunc(self):
if 'tpu' in self.device.lower():
self.skipTest('XLA TPU supports tf.unique')
with ops.device('device:{}:0'.format(self.device)):
class C(object):
@def_function.function(jit_compile=True)
def f1(self, x):
return array_ops.unique(x).y
inputs = constant_op.constant([1, 2, 2, 3, 3])
c = C()
with self.assertRaisesRegex(
errors.InvalidArgumentError, 'legalization failed'
if test_util.is_mlir_bridge_enabled() else 'unsupported operations'):
c.f1(inputs)
def testMustBeConstantPropagation(self):
if 'tpu' in self.device.lower():
self.skipTest('b/162799319: Cannot resolve constant on TPU')
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f():
return constant_op.constant([0, 2, 1], dtype=dtypes.int32)
@def_function.function(jit_compile=True)
def g(a, b):
return array_ops.transpose(a, b)
@def_function.function
def z():
return g(array_ops.ones([3, 4, 3], dtype=dtypes.float32), f())
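# transpose's permutation must be a compile-time constant; the compiler
# should be able to resolve it from the output of the jit-compiled f().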
z()
def testArgMinMax(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def argmax(x):
return math_ops.argmax(x)
@def_function.function(jit_compile=True)
def argmin(x):
return math_ops.argmin(x)
self.assertAllClose(0, argmax(array_ops.ones([10], dtype=dtypes.float32)))
self.assertAllClose(0, argmax(array_ops.ones([10])))
self.assertAllClose(0, argmin(array_ops.ones([10], dtype=dtypes.float32)))
self.assertAllClose(0, argmin(array_ops.ones([10])))
@test_util.disable_mlir_bridge('TensorArray support not implemented')
def testErrorMessagePassingTensorArray(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f(x):
ta = tensor_array_ops.TensorArray(
dtype=dtypes.float32, size=1, element_shape=[])
ta = ta.write(0, 2 * x)
y = ta.read(0)
return y
x = constant_op.constant(3.14)
with backprop.GradientTape() as tape:
tape.watch(x)
with self.assertRaisesRegex(errors.UnimplementedError,
'TensorList crossing the XLA/TF boundary'):
y = f(x)
tape.gradient(y, x)
@test_util.disable_mlir_bridge('TODO(b/162281863): MLIR bridge errors out'
' lowering TensorListConcatV2')
def testTensorListConcatV2(self):
with ops.device('device:{}:0'.format(self.device)):
def f(x):
ta = tensor_array_ops.TensorArray(
dtype=dtypes.float32, size=2, element_shape=[3])
ta = ta.write(0, 2 * x)
ta = ta.write(1, 3 * x)
return ta.concat()
compiled_f = def_function.function(jit_compile=True)(f)
inputs = constant_op.constant([3.14, 2.68, 7.69])
self.assertAllClose([6.28, 5.36, 15.38, 9.42, 8.04, 23.07], f(inputs))
self.assertAllClose(compiled_f(inputs), f(inputs))
@test_util.disable_mlir_bridge('TODO(b/162281863): MLIR bridge errors out'
' lowering TensorListConcatV2')
def testTensorListConcatV2Multidim(self):
with ops.device('device:{}:0'.format(self.device)):
def f(x):
ta = tensor_array_ops.TensorArray(
dtype=dtypes.float32, size=2, element_shape=[3, 2])
ta = ta.write(0, 2 * x)
ta = ta.write(1, 3 * x)
return ta.concat()
compiled_f = def_function.function(jit_compile=True)(f)
inputs = constant_op.constant([[3.14, 21.1], [2.68, 22.2], [7.69, 23.3]])
self.assertAllClose(f(inputs), compiled_f(inputs))
@test_util.disable_mlir_bridge('TODO(b/162281863): MLIR bridge errors out'
' lowering TensorListConcatV2')
def testTensorListConcatV2Scalars(self):
with ops.device('device:{}:0'.format(self.device)):
def f(x):
ta = tensor_array_ops.TensorArray(
dtype=dtypes.float32, size=2, element_shape=[1])
ta = ta.write(0, 2 * x)
ta = ta.write(1, 3 * x)
return ta.concat()
compiled_f = def_function.function(jit_compile=True)(f)
inputs = constant_op.constant([3.14])
self.assertAllClose(f(inputs), compiled_f(inputs))
@test_util.disable_mlir_bridge('TODO(b/162281863): MLIR bridge errors out'
' lowering TensorListConcatV2')
def testTensorListConcatGrad(self):
with ops.device('device:{}:0'.format(self.device)):
def f(x):
ta = tensor_array_ops.TensorArray(
dtype=dtypes.float32, size=2, element_shape=[3])
ta = ta.write(0, 2 * x)
ta = ta.write(1, 3 * x)
return ta.concat()
def g():
x = constant_op.constant([3.14, 2.68, 7.69])
with backprop.GradientTape() as tape:
tape.watch(x)
y = f(x)
return tape.gradient(y, x)
compiled_g = def_function.function(jit_compile=True)(g)
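# Each element of x contributes 2 + 3 = 5 to the gradient of the
# concatenated output, both with and without compilation.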
self.assertAllClose([5.0, 5.0, 5.0], g())
self.assertAllClose(compiled_g(), g())
@test_util.disable_mlir_bridge('TODO(b/162281863): MLIR bridge errors out'
' lowering TensorListConcatV2')
def testTensorListConcatGradNestedCompile(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f(x):
ta = tensor_array_ops.TensorArray(
dtype=dtypes.float32, size=2, element_shape=[3])
ta = ta.write(0, 2 * x)
ta = ta.write(1, 3 * x)
return ta.concat()
@def_function.function(jit_compile=True)
def g():
x = constant_op.constant([3.14, 2.68, 7.69])
with backprop.GradientTape() as tape:
tape.watch(x)
y = f(x)
out = tape.gradient(y, x)
return out
self.assertAllClose([5.0, 5.0, 5.0], g())
def testCumsum(self):
if 'tpu' in self.device.lower():
self.skipTest('b/162771302: 64bit rewrite of cumsum not supported')
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f(x):
return math_ops.cumsum(x)
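# A float64 input exercises the 64-bit cumsum lowering that is skipped
# on TPU above.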
f64_input = constant_op.constant([1.1, 2.2, 3.3], dtype=dtypes.float64)
self.assertAllClose([1.1, 3.3, 6.6], f(f64_input))
def testNoExcessiveRetracing(self):
with ops.device('device:{}:0'.format(self.device)):
inner_retracings = 0
@def_function.function(jit_compile=True)
def inner(a, b):
nonlocal inner_retracings
inner_retracings += 1
return a * b + a
def outer(a, b):
return inner(a, b)
func_input = random_ops.random_normal([10, 10])
for _ in range(2):
def_function.function(outer)(func_input, func_input)
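# Even though `outer` is wrapped and called twice, the jit-compiled
# inner function should have been traced exactly once.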
self.assertEqual(inner_retracings, 1)
def testUpdateVariable(self):
with ops.device('device:{}:0'.format(self.device)):
on_gpu = 'gpu' in self.device.lower()
v = variables.Variable([3.1, 3.2])
@def_function.function(jit_compile=True)
def update_var(a, b):
v.assign_add(a * b)
arg1 = random_ops.random_normal([2])
arg2 = random_ops.random_normal([2])
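# On GPU, total memory usage before and after the in-place variable
# update should match, i.e. the compiled assign_add is expected to leave
# no extra allocations behind.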
initial_usage = context.context().get_total_memory_usage(
v.device) if on_gpu else 0
update_var(arg1, arg2)
final_usage = context.context().get_total_memory_usage(
v.device) if on_gpu else 0
self.assertEqual(initial_usage, final_usage)
@test_util.disable_mlir_bridge('TODO(b/162381930): MLIR bridge renames '
'functions')
def testUpdateVariableInClass(self):
with ops.device('device:{}:0'.format(self.device)):
class C(object):
@def_function.function(jit_compile=True)
def update_var(self, a, b):
if not hasattr(self, 'v'):
self.v = variables.Variable(3.1)
self.v.assign_add(a * b)
c = C()
@def_function.function
def outer():
c.update_var(constant_op.constant(0.7), constant_op.constant(0.6))
outer()
self.assertAllClose(c.v, 3.52)
def testUpdateVariableMultipleOutputs(self):
with ops.device('device:{}:0'.format(self.device)):
v = variables.Variable(3.1)
@def_function.function(jit_compile=True)
def update_var(a, b):
v.assign_add(a * b)
return a * b + v
out = update_var(constant_op.constant(0.7), constant_op.constant(0.6))
self.assertAllClose(v, 3.52)
self.assertAllClose(out, 3.94)
def testReturnIdentity(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f(a, b):
return (a, b)
a = random_ops.random_normal([10, 10])
b = random_ops.random_normal([10, 10])
on_gpu = 'gpu' in self.device.lower()
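# Returning the inputs untouched should not allocate new output buffers,
# so GPU memory usage is expected to be unchanged by the call.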
initial_usage = context.context().get_total_memory_usage(
b.backing_device) if on_gpu else 0
f(a, b)
final_usage = context.context().get_total_memory_usage(
b.backing_device) if on_gpu else 0
self.assertEqual(initial_usage, final_usage)
def testGetCompilerIrConstants(self):
if 'tpu' in self.device.lower():
self.skipTest('TPU generates different HLO')
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f(a, b):
return array_ops.transpose(a, b)
a = array_ops.ones([3, 4, 3], dtype=dtypes.float32)
b = constant_op.constant([0, 2, 1], dtype=dtypes.int32)
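# The permutation `b` is a compile-time constant, so the optimized HLO
# should contain the transposed layout {1,2,0}.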
self.assertIn('{1,2,0}',
f.experimental_get_compiler_ir(a, b)(stage='optimized_hlo'))
@test_util.disable_mlir_bridge('TODO(b/168732524): MLIR bridge does not '
'optimize single-element tuples to scalars')
def testGetCompilerIrResourceVars(self):
with ops.device('device:{}:0'.format(self.device)):
v = variables.Variable([3.1, 3.2])
@def_function.function(jit_compile=True)
def f(a, b):
v.assign_add(a * b)
a = random_ops.random_normal([2])
b = random_ops.random_normal([2])
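# The updated resource variable (parameter 2) should be input/output
# aliased in the optimized HLO, avoiding a copy of the variable buffer.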
self.assertIn('input_output_alias={ {}: (2, {}, may-alias) }',
f.experimental_get_compiler_ir(a, b)('optimized_hlo'))
def testGetCompilerIrNotCompiled(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function
def f(x):
return x + 1
a = random_ops.random_normal([10, 10])
with self.assertRaisesRegex(ValueError,
'marked with \'jit_compile'):
f.experimental_get_compiler_ir(a)()
def testGetCompilerIrNested(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def fn(x, a):
return x + a
@def_function.function(jit_compile=False)
def fn2(x, a):
fn.experimental_get_compiler_ir(x, a)()
return fn(x, a)
inputs = constant_op.constant([1, 2, 2, 3, 3])
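# Inside the traced fn2 the arguments are symbolic "Graph" tensors, so
# requesting compiler IR there is expected to fail.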
with self.assertRaisesRegex(TypeError, '"Graph" tensor'):
fn2(inputs, 1)
def testGetCompilerIrKwargs(self):
with ops.device('device:{}:0'.format(self.device)):
v = variables.Variable([0.1, 0.1])
@def_function.function(jit_compile=True)
def f(a, b):
return (a + b) * v
a = constant_op.constant([1.1, 1.1])
b = constant_op.constant([2.2, 2.2])
self.assertIn('multiply',
f.experimental_get_compiler_ir(b=a, a=b)(stage='hlo'))
def testGetCompilerIrDot(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f(a, b):
return a + b
a = constant_op.constant([1.1, 1.1])
b = constant_op.constant([2.2, 2.2])
self.assertIn(
'label',
f.experimental_get_compiler_ir(a, b)(stage='optimized_hlo_dot'))
def testGetCompilerIrNoDevicePlacement(self):
if 'gpu' not in self.device.lower():
self.skipTest('Tests get_compiler_ir on GPU without explicit device placement')
@def_function.function(jit_compile=True)
def f(a, b):
return a + b
a = constant_op.constant([1.1, 1.1])
b = constant_op.constant([2.2, 2.2])
self.assertIn(
'label',
f.experimental_get_compiler_ir(a, b)(stage='optimized_hlo_dot'))
def testGetCompilerIrNonTensors(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f(l):
return l[0] + l[1]
l = [constant_op.constant(1.1), constant_op.constant(2.2)]
self.assertIn('tuple',
f.experimental_get_compiler_ir(l)())
def testGetCompilerIrSerialized(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def fn(x):
return x - x
inputs = constant_op.constant([1, 2, 2, 3, 3])
for stage in ('hlo_serialized', 'optimized_hlo_serialized'):
hlo = fn.experimental_get_compiler_ir(inputs)(
stage=stage, device_name=f'/device:{self.device}:0')
self.assertIsInstance(hlo, bytes)
def testConstantOnWrongDevice(self):
with ops.device('device:{}:0'.format(self.device)):
s = random_ops.random_uniform([2], 1, 10, dtypes.int32)
l = random_ops.random_normal([s[0] * s[1]])
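# The captured shape `s` must still be resolved to a compile-time
# constant for the reshape, regardless of which device produced it.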
@def_function.function(jit_compile=True)
def f(l):
return array_ops.reshape(l, s)
self.assertIn('tuple',
f.experimental_get_compiler_ir(l)())
@test_util.disable_mlir_bridge('TODO(b/172845417): MLIR bridge does not '
'support getting constants out of resources')
def testGetConstantOutOfResourceVariable(self):
with ops.device('device:{}:0'.format(self.device)):
# Use floats to force device placement.
a = variables.Variable(50.0)
b = variables.Variable(2.0)
@def_function.function(jit_compile=True)
def f(x):
return array_ops.reshape(
x, [math_ops.cast(a, dtypes.int32),
math_ops.cast(b, dtypes.int32)])
# OK since the value is known at compile time.
out = f(random_ops.random_normal([10, 10]))
self.assertEqual(out.shape[0], 50)
self.assertEqual(out.shape[1], 2)
@test_util.disable_mlir_bridge('TODO(b/172845417): MLIR bridge does not '
'support getting constants out of resources')
def testGetConstantOutOfResourceVariableAfterWrite(self):
with ops.device('device:{}:0'.format(self.device)):
# Use floats to force device placement.
a = variables.Variable(50.0)
b = variables.Variable(2.0)
@def_function.function(jit_compile=True)
def f(x, val1, val2):
a.assign(math_ops.cast(val1, dtypes.float32))
b.assign(math_ops.cast(val2, dtypes.float32))
return array_ops.reshape(
x, [math_ops.cast(a, dtypes.int32),
math_ops.cast(b, dtypes.int32)])
val1 = constant_op.constant(2)
val2 = constant_op.constant(50)
# Raises an error, since the value known at compile time was overridden.
with self.assertRaisesRegex(errors.InvalidArgumentError,
'concrete values at compile time'):
f(random_ops.random_normal([10, 10]), val1, val2)
@test_util.disable_mlir_bridge('TODO(b/172845417): MLIR bridge does not '
'support getting constants out of resources')
def testGetConstantOutOfResourceVariableBeforeWrite(self):
with ops.device('device:{}:0'.format(self.device)):
# Use floats to force device placement.
a = variables.Variable(50.0)
b = variables.Variable(2.0)
@def_function.function(jit_compile=True)
def f(x, val1, val2):
out = array_ops.reshape(
x, [math_ops.cast(a, dtypes.int32),
math_ops.cast(b, dtypes.int32)])
a.assign(math_ops.cast(val1, dtypes.float32))
b.assign(math_ops.cast(val2, dtypes.float32))
return out
val1 = constant_op.constant(2)
val2 = constant_op.constant(50)
# OK since the write happens after the reshape.
out = f(random_ops.random_normal([10, 10]), val1, val2)
self.assertEqual(out.shape[0], 50)
self.assertEqual(out.shape[1], 2)
def testTfAssert(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f(x):
control_flow_ops.Assert(x == 1, ['Wrong value'])
f(constant_op.constant(1))
def testTensorArrayErrorMessage(self):
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f():
# The old and new bridges differ in which op they flag in the error
# message: one points to the creation of the uninitialized tensor array,
# the other to its use.
ta = tensor_array_ops.TensorArray( # EXPECTED_MESSAGE_NEW
dtype=dtypes.float32,
size=2,
dynamic_size=True,
element_shape=(None,))
return ta.concat() # EXPECTED_MESSAGE_OLD
if test_util.is_mlir_bridge_enabled():
with self.assertRaisesRegex(errors.InvalidArgumentError,
'EXPECTED_MESSAGE_NEW'):
f()
else:
with self.assertRaisesRegex(errors.InvalidArgumentError,
'EXPECTED_MESSAGE_OLD'):
f()
def testCounter(self):
cell_nojit = def_function._tf_function_counter.get_cell('0')
cell_jit = def_function._tf_function_counter.get_cell('1')
orig_nojit = cell_nojit.value()
orig_jit = cell_jit.value()
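# Cell '0' counts tracings of non-jit-compiled tf.functions and cell '1'
# counts tracings of jit-compiled ones.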
with ops.device('device:{}:0'.format(self.device)):
@def_function.function
def f(a):
return a + a
f(constant_op.constant(1))
self.assertEqual(cell_nojit.value(), orig_nojit + 1)
self.assertEqual(cell_jit.value(), orig_jit)
f(constant_op.constant(1.)) # Calling again does not increment
self.assertEqual(cell_nojit.value(), orig_nojit + 1)
@def_function.function(jit_compile=True)
def f1(a):
return a + a
f1(constant_op.constant(1))
self.assertEqual(cell_nojit.value(), orig_nojit + 1)
self.assertEqual(cell_jit.value(), orig_jit + 1)
@def_function.function
def f2(a):
@def_function.function
def g(a):
return a + a
@def_function.function(jit_compile=True)
def h(a):
return a + a
return g(a) + h(a)
f2(constant_op.constant(1))
self.assertEqual(cell_nojit.value(), orig_nojit + 2)
self.assertEqual(cell_jit.value(), orig_jit + 2)
@def_function.function(jit_compile=True)
def f3(a):
@def_function.function
def g(a):
return a + a
@def_function.function(jit_compile=True)
def h(a):
return a + a
return g(a) + h(a)
f3(constant_op.constant(1))
self.assertEqual(cell_nojit.value(), orig_nojit + 2)
self.assertEqual(cell_jit.value(), orig_jit + 3)
@test_util.disable_mlir_bridge('TODO(b/162272821): MLIR bridge returns '
'wrong status type')
def testResourceWrongDevice(self):
if 'gpu' not in self.device.lower():
self.skipTest('Need a GPU to have non-trivial device placement')
with ops.device('device:CPU:0'):
v = variables.Variable([3.1, 3.2])
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def update_var(a):
v.assign_add(a)
arg = random_ops.random_normal([2])
with self.assertRaisesRegex(errors.InvalidArgumentError,
'def_function_xla_jit_test.py'):
update_var(arg)
def testMustBeConstantInsideCondition(self):
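# The reshape target must resolve to a compile-time constant even when
# the reshape sits inside a cond branch and the shape is a function
# argument.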
with ops.device('device:{}:0'.format(self.device)):
@def_function.function(jit_compile=True)
def f(x, d):
if math_ops.reduce_all(
math_ops.greater(x, random_ops.random_normal([10, 10]))):
return array_ops.reshape(x * 2, constant_op.constant([100]))
else:
return array_ops.reshape(x * 3, d)
f(random_ops.random_normal([10, 10]), constant_op.constant([100]))
def testConditionalGradientTapeMathRegression(self):
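# Regression test: building the jit-compiled cond while a GradientTape
# is active should still compute 1 / x correctly.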
with ops.device('device:{}:0'.format(self.device)):
with backprop.GradientTape():
@def_function.function(jit_compile=True, autograph=False)
def f(x):
return control_flow_ops.cond(
math_ops.reduce_all(x > 1), lambda: 1. / x, lambda: x)
v = variables.Variable([[2.]])
self.assertAllClose(f(v), constant_op.constant([[0.5]]))
if __name__ == '__main__':
ops.enable_eager_execution()
test.main()