torch/testing/_internal/expecttest.py - platform/external/pytorch - Git at Google

 import re
 import unittest
 import traceback
 import os
 import string
 import sys
 from typing import Tuple


 # This file implements expect tests (also known as "golden" tests).
 # Expect tests are a method of writing tests where instead of
 # hard-coding the expected output of a test, you instead run the test to
 # get the output, and the test framework automatically populates the
 # expected output.  If the output of the test changes, you can rerun the
 # test with EXPECTTEST_ACCEPT=1 environment variable to automatically
 # update the expected output.
 #
 # Somewhat unusually, this file implements *inline* expect tests: that
 # is to say, the expected output isn't save to an external file, it is
 # saved directly in the Python file (and we modify your Python the file
 # when updating the expect test.)
 #
 # The general recipe for how to use this is as follows:
 #
 #   1. Write your test and use assertExpectedInline() instead of
 #      a normal assertEqual.  Leave the expected argument blank
 #      with an empty string:
 #
 #       self.assertExpectedInline(some_func(), "")
 #
 #   2. Run your test.  It should fail, and you get an error message
 #      about accepting the output with EXPECTTEST_ACCEPT=1
 #
 #   3. Rerun the test with EXPECTTEST_ACCEPT=1.  Now the previously
 #      blank string literal will now contain the expected value of
 #      the test.
 #
 #       self.assertExpectedInline(some_func(), "my_value")
 #
 # Some tips and tricks:
 #
 #   - Often, you will want to expect test on a multiline string.  This
 #     framework understands triple-quoted strings, so you can just
 #     write """my_value""" and it will turn into triple-quoted
 #     strings.
 #
 #   - Take some time thinking about how exactly you want to design
 #     the output format of the expect test.  It is often profitable
 #     to design an output representation specifically for expect tests.
 #


 ACCEPT = os.getenv('EXPECTTEST_ACCEPT')

 LINENO_AT_START = sys.version_info >= (3, 8)


 def nth_line(src, lineno):
     """
     Compute the starting index of the n-th line (where n is 1-indexed)

     >>> nth_line("aaa\\nbb\\nc", 2)
     4
     """
     assert lineno >= 1
     pos = 0
     for _ in range(lineno - 1):
         pos = src.find('\n', pos) + 1
     return pos


 def nth_eol(src, lineno):
     """
     Compute the ending index of the n-th line (before the newline,
     where n is 1-indexed)

     >>> nth_eol("aaa\\nbb\\nc", 2)
     6
     """
     assert lineno >= 1
     pos = -1
     for _ in range(lineno):
         pos = src.find('\n', pos + 1)
         if pos == -1:
             return len(src)
     return pos


 def normalize_nl(t):
     return t.replace('\r\n', '\n').replace('\r', '\n')


 def escape_trailing_quote(s, quote):
     if s and s[-1] == quote:
         return s[:-1] + '\\' + quote
     else:
         return s


 class EditHistory(object):
     def __init__(self):
         self.state = {}

     def adjust_lineno(self, fn, lineno):
         if fn not in self.state:
             return lineno
         for edit_loc, edit_diff in self.state[fn]:
             if lineno > edit_loc:
                 lineno += edit_diff
         return lineno

     def seen_file(self, fn):
         return fn in self.state

     def record_edit(self, fn, lineno, delta):
         self.state.setdefault(fn, []).append((lineno, delta))


 EDIT_HISTORY = EditHistory()


 def ok_for_raw_triple_quoted_string(s, quote):
     """
     Is this string representable inside a raw triple-quoted string?
     Due to the fact that backslashes are always treated literally,
     some strings are not representable.

     >>> ok_for_raw_triple_quoted_string("blah", quote="'")
     True
     >>> ok_for_raw_triple_quoted_string("'", quote="'")
     False
     >>> ok_for_raw_triple_quoted_string("a ''' b", quote="'")
     False
     """
     return quote * 3 not in s and (not s or s[-1] not in [quote, '\\'])


 RE_EXPECT = re.compile(
     (
         r"^(?P<prefix>[^\n]*?)"
         r"(?P<raw>r?)"
         r"(?P<quote>'''|" r'""")'
         r"(?P<body>.*?)"
         r"(?P=quote)"
     ),
     re.DOTALL
 )


 # This operates on the REVERSED string (that's why suffix is first)
 RE_REVERSED_EXPECT = \
     re.compile(r"^(?P<suffix>[^\n]*?)"
                r"(?P<quote>'''|" r'""")'
                r"(?P<body>.*?)"
                r"(?P=quote)"
                r"(?P<raw>r?)", re.DOTALL)


 def replace_string_literal(src : str, lineno : int,
                            new_string : str, *, lineno_at_start: bool) -> Tuple[str, int]:
     r"""
     Replace a triple quoted string literal with new contents.
     Only handles printable ASCII correctly at the moment.  This
     will preserve the quote style of the original string, and
     makes a best effort to preserve raw-ness (unless it is impossible
     to do so.)

     Returns a tuple of the replaced string, as well as a delta of
     number of lines added/removed.

     >>> replace_string_literal("'''arf'''", 1, "barf", lineno_at_start=False)
     ("'''barf'''", 0)
     >>> r = replace_string_literal("  moo = '''arf'''", 1, "'a'\n\\b\n", lineno_at_start=False)
     >>> print(r[0])
       moo = '''\
     'a'
     \\b
     '''
     >>> r[1]
     3
     >>> replace_string_literal("  moo = '''\\\narf'''", 2, "'a'\n\\b\n", lineno_at_start=False)[1]
     2
     >>> print(replace_string_literal("    f('''\"\"\"''')", 1, "a ''' b", lineno_at_start=False)[0])
         f('''a \'\'\' b''')
     """
     # Haven't implemented correct escaping for non-printable characters
     assert all(c in string.printable for c in new_string)

     new_string = normalize_nl(new_string)

     delta = [new_string.count("\n")]
     if delta[0] > 0:
         delta[0] += 1  # handle the extra \\\n

     def compute_raw_new_body_and_adjust_delta(m):
         s = new_string
         raw = m.group('raw') == 'r'
         if not raw or not ok_for_raw_triple_quoted_string(s, quote=m.group('quote')[0]):
             raw = False
             s = s.replace('\\', '\\\\')
             if m.group('quote') == "'''":
                 s = escape_trailing_quote(s, "'").replace("'''", r"\'\'\'")
             else:
                 s = escape_trailing_quote(s, '"').replace('"""', r'\"\"\"')

         new_body = "\\\n" + s if "\n" in s and not raw else s
         delta[0] -= m.group('body').count("\n")
         return raw, new_body

     if lineno_at_start:
         i = nth_line(src, lineno)

         # i points to the start of the string
         def replace(m):
             raw, new_body = compute_raw_new_body_and_adjust_delta(m)
             return ''.join([m.group('prefix'),
                             'r' if raw else '',
                             m.group('quote'),
                             new_body,
                             m.group('quote'),
                             ])

         return (src[:i] + RE_EXPECT.sub(replace, src[i:], count=1), delta[0])
     else:
         i = nth_eol(src, lineno)

         # i points to the END of the string.  Do some funny
         # business with reversing the string to do the replace
         def replace(m):
             raw, new_body = compute_raw_new_body_and_adjust_delta(m)
             return ''.join([m.group('suffix'),
                             m.group('quote'),
                             new_body[::-1],
                             m.group('quote'),
                             'r' if raw else '',
                             ])

         # Having to do this in reverse is very irritating, but it's the
         # only way to make the non-greedy matches work correctly.
         return (RE_REVERSED_EXPECT.sub(replace, src[:i][::-1], count=1)[::-1] + src[i:], delta[0])


 class TestCase(unittest.TestCase):
     longMessage = True

     def assertExpectedInline(self, actual, expect, skip=0):
         """
         Assert that actual is equal to expect.  The expect argument
         MUST be a string literal (triple-quoted strings OK), and will
         get updated directly in source when you run the test suite
         with EXPECTTEST_ACCEPT=1.

         If you want to write a helper function that makes use of
         assertExpectedInline (e.g., expect is not a string literal),
         set the skip argument to how many function calls we should
         skip to find the string literal to update.
         """
         if ACCEPT:
             if actual != expect:
                 # current frame and parent frame, plus any requested skip
                 tb = traceback.extract_stack(limit=2 + skip)
                 fn, lineno, _, _ = tb[0]
                 print("Accepting new output for {} at {}:{}".format(self.id(), fn, lineno))
                 with open(fn, 'r+') as f:
                     old = f.read()

                     # compute the change in lineno
                     lineno = EDIT_HISTORY.adjust_lineno(fn, lineno)
                     new, delta = replace_string_literal(
                         old, lineno, actual,
                         lineno_at_start=LINENO_AT_START
                     )

                     assert old != new, f"Failed to substitute string at {fn}:{lineno}; did you use triple quotes?"

                     # Only write the backup file the first time we hit the
                     # file
                     if not EDIT_HISTORY.seen_file(fn):
                         with open(fn + ".bak", 'w') as f_bak:
                             f_bak.write(old)
                     f.seek(0)
                     f.truncate(0)

                     f.write(new)

                 EDIT_HISTORY.record_edit(fn, lineno, delta)
         else:
             help_text = ("To accept the new output, re-run test with "
                          "envvar EXPECTTEST_ACCEPT=1 (we recommend "
                          "staging/committing your changes before doing this)")
             self.assertMultiLineEqualMaybeCppStack(expect, actual, msg=help_text)

     def assertExpectedRaisesInline(self, exc_type, callable, expect, *args, **kwargs):
         """
         Like assertExpectedInline, but tests the str() representation of
         the raised exception from callable.  The raised exeption must
         be exc_type.
         """
         try:
             callable(*args, **kwargs)
         except exc_type as e:
             self.assertExpectedInline(str(e), expect, skip=1)
             return
         # Don't put this in the try block; the AssertionError will catch it
         self.fail(msg="Did not raise when expected to")

     def assertMultiLineEqualMaybeCppStack(self, expect, actual, *args, **kwargs):
         self.assertGreaterEqual(len(actual), len(expect), *args, **kwargs)
         if hasattr(self, "assertMultiLineEqual"):
             self.assertMultiLineEqual(expect, actual[:len(expect)], *args, **kwargs)
         else:
             self.assertEqual(expect, actual[:len(expect)], *args, **kwargs)
         if len(actual) > len(expect):
             cpp_stacktrace_header = "\nException raised from"
             end_header = len(expect) + len(cpp_stacktrace_header)
             self.assertEqual(actual[len(expect): end_header], cpp_stacktrace_header)


 if __name__ == "__main__":
     import doctest
     doctest.testmod()
	import re
	import unittest
	import traceback
	import os
	import string
	import sys
	from typing import Tuple


	# This file implements expect tests (also known as "golden" tests).
	# Expect tests are a method of writing tests where instead of
	# hard-coding the expected output of a test, you instead run the test to
	# get the output, and the test framework automatically populates the
	# expected output. If the output of the test changes, you can rerun the
	# test with EXPECTTEST_ACCEPT=1 environment variable to automatically
	# update the expected output.
	#
	# Somewhat unusually, this file implements inline expect tests: that
	# is to say, the expected output isn't save to an external file, it is
	# saved directly in the Python file (and we modify your Python the file
	# when updating the expect test.)
	#
	# The general recipe for how to use this is as follows:
	#
	# 1. Write your test and use assertExpectedInline() instead of
	# a normal assertEqual. Leave the expected argument blank
	# with an empty string:
	#
	# self.assertExpectedInline(some_func(), "")
	#
	# 2. Run your test. It should fail, and you get an error message
	# about accepting the output with EXPECTTEST_ACCEPT=1
	#
	# 3. Rerun the test with EXPECTTEST_ACCEPT=1. Now the previously
	# blank string literal will now contain the expected value of
	# the test.
	#
	# self.assertExpectedInline(some_func(), "my_value")
	#
	# Some tips and tricks:
	#
	# - Often, you will want to expect test on a multiline string. This
	# framework understands triple-quoted strings, so you can just
	# write """my_value""" and it will turn into triple-quoted
	# strings.
	#
	# - Take some time thinking about how exactly you want to design
	# the output format of the expect test. It is often profitable
	# to design an output representation specifically for expect tests.
	#


	ACCEPT = os.getenv('EXPECTTEST_ACCEPT')

	LINENO_AT_START = sys.version_info >= (3, 8)


	def nth_line(src, lineno):
	"""
	Compute the starting index of the n-th line (where n is 1-indexed)

	>>> nth_line("aaa\\nbb\\nc", 2)
	4
	"""
	assert lineno >= 1
	pos = 0
	for _ in range(lineno - 1):
	pos = src.find('\n', pos) + 1
	return pos


	def nth_eol(src, lineno):
	"""
	Compute the ending index of the n-th line (before the newline,
	where n is 1-indexed)

	>>> nth_eol("aaa\\nbb\\nc", 2)
	6
	"""
	assert lineno >= 1
	pos = -1
	for _ in range(lineno):
	pos = src.find('\n', pos + 1)
	if pos == -1:
	return len(src)
	return pos


	def normalize_nl(t):
	return t.replace('\r\n', '\n').replace('\r', '\n')


	def escape_trailing_quote(s, quote):
	if s and s[-1] == quote:
	return s[:-1] + '\\' + quote
	else:
	return s


	class EditHistory(object):
	def __init__(self):
	self.state = {}

	def adjust_lineno(self, fn, lineno):
	if fn not in self.state:
	return lineno
	for edit_loc, edit_diff in self.state[fn]:
	if lineno > edit_loc:
	lineno += edit_diff
	return lineno

	def seen_file(self, fn):
	return fn in self.state

	def record_edit(self, fn, lineno, delta):
	self.state.setdefault(fn, []).append((lineno, delta))


	EDIT_HISTORY = EditHistory()


	def ok_for_raw_triple_quoted_string(s, quote):
	"""
	Is this string representable inside a raw triple-quoted string?
	Due to the fact that backslashes are always treated literally,
	some strings are not representable.

	>>> ok_for_raw_triple_quoted_string("blah", quote="'")
	True
	>>> ok_for_raw_triple_quoted_string("'", quote="'")
	False
	>>> ok_for_raw_triple_quoted_string("a ''' b", quote="'")
	False
	"""
	return quote * 3 not in s and (not s or s[-1] not in [quote, '\\'])


	RE_EXPECT = re.compile(
	(
	r"^(?P<prefix>[^\n]*?)"
	r"(?P<raw>r?)"
	r"(?P<quote>'''\|" r'""")'
	r"(?P<body>.*?)"
	r"(?P=quote)"
	),
	re.DOTALL
	)


	# This operates on the REVERSED string (that's why suffix is first)
	RE_REVERSED_EXPECT = \
	re.compile(r"^(?P<suffix>[^\n]*?)"
	r"(?P<quote>'''\|" r'""")'
	r"(?P<body>.*?)"
	r"(?P=quote)"
	r"(?P<raw>r?)", re.DOTALL)


	def replace_string_literal(src : str, lineno : int,
	new_string : str, *, lineno_at_start: bool) -> Tuple[str, int]:
	r"""
	Replace a triple quoted string literal with new contents.
	Only handles printable ASCII correctly at the moment. This
	will preserve the quote style of the original string, and
	makes a best effort to preserve raw-ness (unless it is impossible
	to do so.)

	Returns a tuple of the replaced string, as well as a delta of
	number of lines added/removed.

	>>> replace_string_literal("'''arf'''", 1, "barf", lineno_at_start=False)
	("'''barf'''", 0)
	>>> r = replace_string_literal(" moo = '''arf'''", 1, "'a'\n\\b\n", lineno_at_start=False)
	>>> print(r[0])
	moo = '''\
	'a'
	\\b
	'''
	>>> r[1]
	3
	>>> replace_string_literal(" moo = '''\\\narf'''", 2, "'a'\n\\b\n", lineno_at_start=False)[1]
	2
	>>> print(replace_string_literal(" f('''\"\"\"''')", 1, "a ''' b", lineno_at_start=False)[0])
	f('''a \'\'\' b''')
	"""
	# Haven't implemented correct escaping for non-printable characters
	assert all(c in string.printable for c in new_string)

	new_string = normalize_nl(new_string)

	delta = [new_string.count("\n")]
	if delta[0] > 0:
	delta[0] += 1 # handle the extra \\\n

	def compute_raw_new_body_and_adjust_delta(m):
	s = new_string
	raw = m.group('raw') == 'r'
	if not raw or not ok_for_raw_triple_quoted_string(s, quote=m.group('quote')[0]):
	raw = False
	s = s.replace('\\', '\\\\')
	if m.group('quote') == "'''":
	s = escape_trailing_quote(s, "'").replace("'''", r"\'\'\'")
	else:
	s = escape_trailing_quote(s, '"').replace('"""', r'\"\"\"')

	new_body = "\\\n" + s if "\n" in s and not raw else s
	delta[0] -= m.group('body').count("\n")
	return raw, new_body

	if lineno_at_start:
	i = nth_line(src, lineno)

	# i points to the start of the string
	def replace(m):
	raw, new_body = compute_raw_new_body_and_adjust_delta(m)
	return ''.join([m.group('prefix'),
	'r' if raw else '',
	m.group('quote'),
	new_body,
	m.group('quote'),
	])

	return (src[:i] + RE_EXPECT.sub(replace, src[i:], count=1), delta[0])
	else:
	i = nth_eol(src, lineno)

	# i points to the END of the string. Do some funny
	# business with reversing the string to do the replace
	def replace(m):
	raw, new_body = compute_raw_new_body_and_adjust_delta(m)
	return ''.join([m.group('suffix'),
	m.group('quote'),
	new_body[::-1],
	m.group('quote'),
	'r' if raw else '',
	])

	# Having to do this in reverse is very irritating, but it's the
	# only way to make the non-greedy matches work correctly.
	return (RE_REVERSED_EXPECT.sub(replace, src[:i][::-1], count=1)[::-1] + src[i:], delta[0])


	class TestCase(unittest.TestCase):
	longMessage = True

	def assertExpectedInline(self, actual, expect, skip=0):
	"""
	Assert that actual is equal to expect. The expect argument
	MUST be a string literal (triple-quoted strings OK), and will
	get updated directly in source when you run the test suite
	with EXPECTTEST_ACCEPT=1.

	If you want to write a helper function that makes use of
	assertExpectedInline (e.g., expect is not a string literal),
	set the skip argument to how many function calls we should
	skip to find the string literal to update.
	"""
	if ACCEPT:
	if actual != expect:
	# current frame and parent frame, plus any requested skip
	tb = traceback.extract_stack(limit=2 + skip)
	fn, lineno, _, _ = tb[0]
	print("Accepting new output for {} at {}:{}".format(self.id(), fn, lineno))
	with open(fn, 'r+') as f:
	old = f.read()

	# compute the change in lineno
	lineno = EDIT_HISTORY.adjust_lineno(fn, lineno)
	new, delta = replace_string_literal(
	old, lineno, actual,
	lineno_at_start=LINENO_AT_START
	)

	assert old != new, f"Failed to substitute string at {fn}:{lineno}; did you use triple quotes?"

	# Only write the backup file the first time we hit the
	# file
	if not EDIT_HISTORY.seen_file(fn):
	with open(fn + ".bak", 'w') as f_bak:
	f_bak.write(old)
	f.seek(0)
	f.truncate(0)

	f.write(new)

	EDIT_HISTORY.record_edit(fn, lineno, delta)
	else:
	help_text = ("To accept the new output, re-run test with "
	"envvar EXPECTTEST_ACCEPT=1 (we recommend "
	"staging/committing your changes before doing this)")
	self.assertMultiLineEqualMaybeCppStack(expect, actual, msg=help_text)

	def assertExpectedRaisesInline(self, exc_type, callable, expect, args, *kwargs):
	"""
	Like assertExpectedInline, but tests the str() representation of
	the raised exception from callable. The raised exeption must
	be exc_type.
	"""
	try:
	callable(args, *kwargs)
	except exc_type as e:
	self.assertExpectedInline(str(e), expect, skip=1)
	return
	# Don't put this in the try block; the AssertionError will catch it
	self.fail(msg="Did not raise when expected to")

	def assertMultiLineEqualMaybeCppStack(self, expect, actual, args, *kwargs):
	self.assertGreaterEqual(len(actual), len(expect), args, *kwargs)
	if hasattr(self, "assertMultiLineEqual"):
	self.assertMultiLineEqual(expect, actual[:len(expect)], args, *kwargs)
	else:
	self.assertEqual(expect, actual[:len(expect)], args, *kwargs)
	if len(actual) > len(expect):
	cpp_stacktrace_header = "\nException raised from"
	end_header = len(expect) + len(cpp_stacktrace_header)
	self.assertEqual(actual[len(expect): end_header], cpp_stacktrace_header)


	if __name__ == "__main__":
	import doctest
	doctest.testmod()