import math
from itertools import product, chain
from numbers import Number

import unittest

import torch

from torch.testing._internal.common_utils import \
    (TestCase, run_tests, torch_to_numpy_dtype_dict, suppress_warnings,
     IS_WINDOWS, TEST_NUMPY)
from torch.testing._internal.common_methods_invocations import \
    (unary_ufuncs)
from torch.testing._internal.common_device_type import \
    (instantiate_device_type_tests, ops, onlyOnCPUAndCUDA, skipCUDAIfRocm,
     dtypes)
from torch.testing import \
    (floating_types_and, integral_types, complex_types)

if TEST_NUMPY:
    import numpy as np

# Tensor generators and helpers

# Interesting values and extremal values for different dtypes
_unsigned_int_vals = (0, 1, 55, 127)
_int_vals = (0, -1, 1, -55, 55, -127, 127, -128, 128)
_large_int_vals = (-1113, 1113, -10701, 10701)
_float_vals = (0.,
               -.001, .001,
               -.25, .25,
               -1., 1.,
               -math.pi / 2, math.pi / 2,
               -math.pi + .00001, math.pi - .00001,
               -math.pi, math.pi,
               -math.pi - .00001, math.pi + .00001)
_large_float_vals = (-501, 501,
                     -1001.2, 1001.2,
                     -13437.7, 13437.7,
                     -4988429.2, 4988429.2,
                     -1e20, 1e20)
_float_extremals = (float('inf'), float('-inf'), float('nan'))

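# Constructs a random tensor of the given size, device and dtype. Values are
# drawn (roughly) from [-9, 9] ([0, 9] for uint8, {False, True} for bool);
# for non-bool dtypes they are then clamped to the intersection of that range
# with [low, high] when either bound is given.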
def _make_tensor(size, device: torch.device, dtype: torch.dtype, *, low, high) -> torch.Tensor:
    if dtype is torch.bool:
        return torch.randint(0, 2, size, device=device, dtype=dtype)

    def _maybe_clamp(t, low_default, low, high_default, high):
        low = low_default if low is None else max(low_default, low)
        high = high_default if high is None else min(high_default, high)
        if low != low_default or high != high_default:
            return torch.clamp(t, low, high)
        return t

    if dtype is torch.uint8:
        t = torch.randint(0, 10, size, device=device, dtype=dtype)
        return _maybe_clamp(t, 0, low, 9, high)
    elif dtype in integral_types():
        t = torch.randint(-9, 10, size, device=device, dtype=dtype)
        return _maybe_clamp(t, -9, low, 9, high)
    elif dtype in floating_types_and(torch.half, torch.bfloat16):
        # Windows doesn't support torch.rand(bfloat16) on CUDA
        if IS_WINDOWS and torch.device(device).type == 'cuda' and dtype is torch.bfloat16:
            t = (torch.rand(size, device=device, dtype=torch.float32) * 18 - 9).to(torch.bfloat16)
        else:
            t = torch.rand(size, device=device, dtype=dtype) * 18 - 9
        return _maybe_clamp(t, -9, low, 9, high)
    else:
        assert dtype in complex_types()
        float_dtype = torch.float if dtype is torch.cfloat else torch.double
        real = torch.rand(size, device=device, dtype=float_dtype) * 18 - 9
        real = _maybe_clamp(real, -9, low, 9, high)
        imag = torch.rand(size, device=device, dtype=float_dtype) * 18 - 9
        imag = _maybe_clamp(imag, -9, low, 9, high)
        return torch.complex(real, imag)

# Returns an iterable of contiguous tensors with the same storage on the requested
# device and with the requested dtype.
#
# This function is intended to test the non-vectorized and vectorized code
# paths of unary functions, as well as their handling of odd tensor
# sizes (like zero-dim tensors and tensors with zero elements).
#
# The iterable will include an empty tensor, tensors with no elements,
# zero dim (scalar) tensors, small 1D tensors, a medium 1D tensor, and
# a large 2D tensor.
#
# These tensors will include interesting values. If include_large_values
# is true they will include larger values (>500), too, and if
# include_extremal_values is true they will include extremal values
# like -inf, inf, and nan.
#
# The randomly generated values can be constrained by the domain
# argument.
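#
# Example (illustrative only): generating float tensors restricted to the
# domain of sqrt, [0, inf):
#
#   for t in generate_numeric_tensors('cpu', torch.float32, domain=(0, None)):
#       torch.sqrt(t)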
def generate_numeric_tensors(device, dtype, *,
                             domain=(None, None),
                             include_large_values=True,
                             include_extremal_values=True):
    medium_length = 812
    large_size = (1029, 917)
    offset = 63

    assert large_size[1] > (medium_length + offset)
    assert medium_length % 4 == 0

    # Special-cases bool
    if dtype is torch.bool:
        tensors = (torch.empty(0, device=device, dtype=torch.bool),
                   torch.tensor(True, device=device),
                   torch.tensor(False, device=device),
                   torch.tensor((True, False), device=device),
                   _make_tensor((medium_length,), device=device, dtype=dtype, low=None, high=None),
                   _make_tensor(large_size, device=device, dtype=dtype, low=None, high=None))
        return tensors

    # Acquires dtype-specific vals
    if dtype.is_floating_point or dtype.is_complex:
        large_vals = _large_float_vals if include_large_values else tuple()
        extremals = _float_extremals if include_extremal_values else tuple()
        vals = _float_vals + large_vals + extremals

        # Converts float -> complex vals if dtype is complex
        if dtype.is_complex:
            vals = tuple(complex(x, y) for x, y in product(vals, vals))
    elif dtype is torch.uint8:
        vals = _unsigned_int_vals
    else:  # dtype is a signed integer type
        assert dtype in (torch.int8, torch.int16, torch.int32, torch.int64)
        large_vals = _large_int_vals if include_large_values else tuple()
        vals = _int_vals + large_vals

    assert len(vals) < medium_length

    # Constructs the large tensor containing vals
    large_tensor = _make_tensor(large_size, device=device, dtype=dtype, low=domain[0], high=domain[1])

    # Inserts the vals at an odd place
    large_tensor[57][offset:offset + len(vals)] = torch.tensor(vals, device=device, dtype=dtype)

    # Takes a medium sized copy of the large tensor containing vals
    medium_tensor = large_tensor[57][offset:offset + medium_length]

    # Constructs small tensors (4 elements)
    small_tensors = (t for t in torch.split(medium_tensor, 4))

    # Constructs scalar tensors
    scalar_tensors = (t.squeeze() for t in torch.split(medium_tensor, 1))

    # Tensors with no elements
    empty_sizes = ((0,), (0, 3, 3), (1, 0, 5), (6, 0, 0, 0), (3, 0, 1, 0))
    empty_tensors = (torch.empty(size, device=device, dtype=dtype) for size in empty_sizes)

    return chain(empty_tensors, scalar_tensors, small_tensors, (medium_tensor,), (large_tensor,))

# Tests for unary "universal functions (ufuncs)" that accept a single
# tensor and have common properties like:
#   - they are elementwise functions
#   - the input shape is the output shape
#   - they typically have method and inplace variants
#   - they typically support the out kwarg
#   - they typically have NumPy or SciPy references

# See NumPy's universal function documentation
# (https://numpy.org/doc/1.18/reference/ufuncs.html) for more details
# about the concept of ufuncs.
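#
# For example, torch.neg is a unary ufunc: it can be called as the function
# torch.neg(t), as the method t.neg(), inplace as t.neg_(), or with an out
# tensor as torch.neg(t, out=result), and np.negative is its NumPy reference.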

# TODO: port test_unary_out_op_mem_overlap
# TODO: add out= tests (different devices, dtypes, mismatched sizes,
#   correct sizes, 0 size, broadcasted out)
# TODO: add test for inplace variants erroring on broadcasted inputs
class TestUnaryUfuncs(TestCase):
    exact_dtype = True

    # Helper for comparing torch tensors and numpy arrays
    # TODO: should this or assertEqual also validate that strides are equal?
    def assertEqualHelper(self, actual, expected, *, dtype, exact_dtype=True, **kwargs):
        assert isinstance(actual, torch.Tensor)

        # Some NumPy functions return scalars, not arrays
        if isinstance(expected, Number):
            self.assertEqual(actual.item(), expected)
        elif isinstance(expected, np.ndarray):
            # Handles exact dtype comparisons between arrays and tensors
            if exact_dtype:
                # Allows array dtype to be float32 when comparing with bfloat16 tensors
                # since NumPy doesn't support the bfloat16 dtype
                if expected.dtype == np.float32:
                    assert actual.dtype in (torch.bfloat16, torch.float32)
                else:
                    assert expected.dtype == torch_to_numpy_dtype_dict[actual.dtype]

            self.assertEqual(actual,
                             torch.from_numpy(expected).to(actual.dtype),
                             exact_device=False,
                             **kwargs)
        else:
            self.assertEqual(actual, expected, exact_device=False, **kwargs)

    # Verifies that the unary ufuncs have their supported dtypes
    # registered correctly by testing that each unlisted dtype
    # throws a runtime error
    @skipCUDAIfRocm
    @onlyOnCPUAndCUDA
    @ops(unary_ufuncs, unsupported_dtypes_only=True)
    def test_unsupported_dtypes(self, device, dtype, op):
        t = torch.empty(1, device=device, dtype=dtype)
        with self.assertRaises(RuntimeError):
            op(t)

    # Tests bool tensor negation raises the correct error
    def test_neg_error_message(self, device):
        msg = ("Negation, the `\\-` operator, on a bool tensor is not supported."
               " If you are trying to invert a mask, use the `\\~` or"
               " `logical_not\\(\\)` operator instead.")

        t = torch.tensor((False, True), device=device)

        with self.assertRaisesRegex(RuntimeError, msg):
            torch.neg(t)

    @dtypes(*floating_types_and(torch.bfloat16, torch.half))
    @ops((_fn for _fn in unary_ufuncs if _fn.domain != (None, None)))
    def test_float_domains(self, device, dtype, op):
        if not op.supports_dtype(dtype, torch.device(device).type):
            raise unittest.SkipTest('unsupported dtype')

        eps = (1e-5, 1e-3, 1e-1, 1, 2, 10, 20, 50, 100)

        low, high = op.domain
        # NOTE: the following two loops are separated for readability
        if low is not None:
            low_tensor = torch.tensor(low, device=device, dtype=dtype)
            for epsilon in eps:
                lower_tensor = low_tensor - epsilon

                # Skips the test if the difference is not representable,
                # which can occur if, for example, the difference is small
                # and the dtype is imprecise (like bfloat16 is)
                if lower_tensor.item() == low_tensor.item():
                    continue

                result = op(lower_tensor)
                self.assertEqual(result.item(), float('nan'),
                                 msg=("input of {0} outside lower domain boundary"
                                      " {1} produced {2}, not nan!").format(lower_tensor.item(),
                                                                            low,
                                                                            result.item()))

        if high is not None:
            high_tensor = torch.tensor(high, device=device, dtype=dtype)
            for epsilon in eps:
                higher_tensor = high_tensor + epsilon

                # See above comment
                if higher_tensor.item() == high_tensor.item():
                    continue

                result = op(higher_tensor)
                self.assertEqual(result.item(), float('nan'),
                                 msg=("input of {0} outside upper domain boundary"
                                      " {1} produced {2}, not nan!").format(higher_tensor.item(),
                                                                            high,
                                                                            result.item()))

    # Tests that fn == method == inplace == jit on a simple single tensor input
    # TODO: should this also test jitting the method and inplace variants?
    @ops(unary_ufuncs)
    def test_variant_consistency(self, device, dtype, op):
        def _fn(t):
            return op(t)

        t = _make_tensor((5, 5), device, dtype, low=op.domain[0], high=op.domain[1])
        expected = op(t)

        for alt in (op.get_method(), op.get_inplace(), torch.jit.script(_fn)):
            # Skips variants the op does not define (e.g. no method or inplace variant)
            if alt is None:
                continue

            actual = alt(t.clone())
            self.assertEqual(actual, expected, rtol=0, atol=0)

    # Tests that the function and its (array-accepting) reference produce the same
    # values on a range of tensors, including empty tensors, scalar tensors,
    # 1D tensors and a large 2D tensor with interesting and extremal values
    # and discontiguities.
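    # Note: op.ref is the op's array-accepting reference implementation
    # (typically the corresponding NumPy function); bfloat16 tensors are
    # upcast to float32 below because NumPy does not support bfloat16.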
    @unittest.skipIf(not TEST_NUMPY, "NumPy not found")
    @suppress_warnings
    @ops(unary_ufuncs)
    def test_reference_numerics(self, device, dtype, op):
        include_extremals = (op.handles_complex_extremals if
                             dtype in (torch.cfloat, torch.cdouble) else op.handles_extremals)

        tensors = generate_numeric_tensors(device, dtype,
                                           domain=op.domain,
                                           include_large_values=op.handles_large_floats,
                                           include_extremal_values=include_extremals)
        for t in tensors:
            if dtype is torch.bfloat16:
                a = t.cpu().to(torch.float32).numpy()
            else:
                a = t.cpu().numpy()

            actual = op(t)
            expected = op.ref(a)

            # Crafts a custom error message for smaller, printable tensors
            if t.numel() < 10:
                msg = ("Failed to produce expected results! Input tensor was"
                       " {0}, torch result is {1}, and reference result is"
                       " {2}.").format(t, actual, expected)
            else:
                msg = None

            self.assertEqualHelper(actual, expected, dtype=dtype, msg=msg)

    # Tests for (dis)contiguity consistency

    @ops(unary_ufuncs)
    def test_contig_vs_every_other(self, device, dtype, op):
        contig = _make_tensor((1026,), device=device, dtype=dtype,
                              low=op.domain[0], high=op.domain[1])
        non_contig = contig[::2]

        self.assertTrue(contig.is_contiguous())
        self.assertFalse(non_contig.is_contiguous())

        self.assertEqual(op(contig)[::2], op(non_contig))

    @ops(unary_ufuncs)
    def test_contig_vs_transposed(self, device, dtype, op):
        contig = _make_tensor((789, 357), device=device, dtype=dtype,
                              low=op.domain[0], high=op.domain[1])
        non_contig = contig.T

        self.assertTrue(contig.is_contiguous())
        self.assertFalse(non_contig.is_contiguous())

        self.assertEqual(op(contig).T, op(non_contig))

    @ops(unary_ufuncs)
    def test_non_contig(self, device, dtype, op):
        shapes = [(5, 7), (1024,)]
        for shape in shapes:
            contig = _make_tensor(shape, device, dtype,
                                  low=op.domain[0], high=op.domain[1])
            non_contig = torch.empty(shape + (2,), device=device, dtype=dtype)[..., 0]
            non_contig.copy_(contig)

            self.assertTrue(contig.is_contiguous())
            self.assertFalse(non_contig.is_contiguous())

            self.assertEqual(op(contig), op(non_contig))

    @ops(unary_ufuncs)
    def test_non_contig_index(self, device, dtype, op):
        contig = _make_tensor((2, 2, 1, 2), device, dtype,
                              low=op.domain[0], high=op.domain[1])
        non_contig = contig[:, 1, ...]
        contig = non_contig.contiguous()

        self.assertTrue(contig.is_contiguous())
        self.assertFalse(non_contig.is_contiguous())

        self.assertEqual(op(contig), op(non_contig))

    @ops(unary_ufuncs)
    def test_non_contig_expand(self, device, dtype, op):
        shapes = [(1, 3), (1, 7), (5, 7)]
        for shape in shapes:
            contig = _make_tensor(shape, device, dtype,
                                  low=op.domain[0], high=op.domain[1])
            non_contig = contig.clone().expand(3, -1, -1)

            self.assertTrue(contig.is_contiguous())
            self.assertFalse(non_contig.is_contiguous())

            contig = op(contig)
            non_contig = op(non_contig)
            for i in range(3):
                self.assertEqual(contig, non_contig[i],
                                 msg='non-contiguous expand[' + str(i) + ']')

    @ops(unary_ufuncs)
    def test_contig_size1(self, device, dtype, op):
        contig = _make_tensor((5, 100), device, dtype,
                              low=op.domain[0], high=op.domain[1])
        contig = contig[:1, :50]
        contig2 = torch.empty(contig.size(), device=device, dtype=dtype)
        contig2.copy_(contig)

        self.assertTrue(contig.is_contiguous())
        self.assertTrue(contig2.is_contiguous())

        self.assertEqual(op(contig), op(contig2))

    @ops(unary_ufuncs)
    def test_contig_size1_large_dim(self, device, dtype, op):
        contig = _make_tensor((5, 2, 3, 1, 4, 5, 3, 2, 1, 2, 3, 4), device, dtype,
                              low=op.domain[0], high=op.domain[1])
        contig = contig[:1, :, :, :, :, :, :, :, :, :, :, :]
        contig2 = torch.empty(contig.size(), device=device, dtype=dtype)
        contig2.copy_(contig)

        self.assertTrue(contig.is_contiguous())
        self.assertTrue(contig2.is_contiguous())

        self.assertEqual(op(contig), op(contig2))

    # Tests that computation on multiple batches is the same as
    # per-batch computation.
    @ops(unary_ufuncs)
    def test_batch_vs_slicing(self, device, dtype, op):
        input = _make_tensor((1024, 512), dtype=dtype, device=device,
                             low=op.domain[0], high=op.domain[1])

        actual = op(input)
        expected = torch.stack([op(slice) for slice in input])

        self.assertEqual(actual, expected)


instantiate_device_type_tests(TestUnaryUfuncs, globals())

if __name__ == '__main__':
    run_tests()