yapf/yapflib/format_token.py - platform/external/yapf - Git at Google

 # Copyright 2015 Google Inc. All Rights Reserved.
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 """Pytree nodes with extra formatting information.

 This is a thin wrapper around a pytree.Leaf node.
 """

 import keyword
 import re

 from lib2to3.pgen2 import token

 from yapf.yapflib import py3compat
 from yapf.yapflib import pytree_utils
 from yapf.yapflib import style
 from yapf.yapflib import subtypes

 CONTINUATION = token.N_TOKENS


 def _TabbedContinuationAlignPadding(spaces, align_style, tab_width):
   """Build padding string for continuation alignment in tabbed indentation.

   The 'FIXED' and 'VALIGN-RIGHT' styles pad with tab characters only: the
   requested number of spaces is rounded up to a whole number of tabs. Every
   other style pads with exactly `spaces` space characters.

   Arguments:
     spaces: (int) The number of spaces to place before the token for alignment.
     align_style: (str) The alignment style for continuation lines.
     tab_width: (int) Number of columns of each tab character.

   Returns:
     A padding string for alignment with style specified by align_style option.
     It is empty when a tab-only style is requested with no positive amount of
     spaces.
   """
   if align_style in ('FIXED', 'VALIGN-RIGHT'):
     if spaces > 0:
       # Ceiling division carried out entirely on integers; this avoids the
       # float round-trip of int(a / b).
       return '\t' * ((spaces + tab_width - 1) // tab_width)
     return ''
   return ' ' * spaces


 class FormatToken(object):
   """A wrapper around pytree Leaf nodes.

   This represents the token plus additional information useful for reformatting
   the code.

   Attributes:
     node: The PyTree node this token represents.
     next_token: The token in the unwrapped line after this token or None if this
       is the last token in the unwrapped line.
     previous_token: The token in the unwrapped line before this token or None if
       this is the first token in the unwrapped line.
     matching_bracket: If a bracket token ('[', '{', or '(') the matching
       bracket.
     parameters: If this and its following tokens make up a parameter list, then
       this is a list of those parameters.
     container_opening: If the object is in a container, this points to its
       opening bracket.
     container_elements: If this is the start of a container, a list of the
       elements in the container.
     whitespace_prefix: The prefix for the whitespace.
     spaces_required_before: The number of spaces required before a token. This
       is a lower-bound for the formatter and not a hard requirement. For
       instance, a comment may have n required spaces before it. But the
       formatter won't place n spaces before all comments. Only those that are
       moved to the end of a line of code. The formatter may use different
       spacing when appropriate.
     total_length: The total length of the unwrapped line up to and including
       whitespace and this token. However, this doesn't include the initial
       indentation amount.
     split_penalty: The penalty for splitting the line before this token.
     can_break_before: True if we're allowed to break before this token.
     must_break_before: True if we're required to break before this token.
     newlines: The number of newlines needed before this token.
     type: The type of the wrapped node (copied from node.type).
     column: The column of the wrapped node (copied from node.column).
     lineno: The line number of the wrapped node (copied from node.lineno).
     name: The node name as reported by pytree_utils.NodeName.
     value: The token text. Continuation tokens have trailing whitespace
       stripped; comment tokens are re-indented by AddWhitespacePrefix.
     subtypes: The subtypes annotated on the node, or [subtypes.NONE].
     is_pseudo: True if the wrapped node is flagged as a pseudo token.
   """

   # Operators recognized by is_arithmetic_op. Built once for the class rather
   # than on every property access.
   _ARITHMETIC_OPERATORS = frozenset({
       '+',  # Add
       '-',  # Subtract
       '*',  # Multiply
       '@',  # Matrix Multiply
       '/',  # Divide
       '//',  # Floor Divide
       '%',  # Modulo
       '<<',  # Left Shift
       '>>',  # Right Shift
       '|',  # Bitwise Or
       '&',  # Bitwise And
       '^',  # Bitwise Xor
       '**',  # Power
   })

   def __init__(self, node):
     """Constructor.

     Arguments:
       node: (pytree.Leaf) The node that's being wrapped.
     """
     self.node = node
     self.next_token = None
     self.previous_token = None
     self.matching_bracket = None
     self.parameters = []
     self.container_opening = None
     self.container_elements = []
     self.whitespace_prefix = ''
     self.total_length = 0
     self.split_penalty = 0
     self.can_break_before = False
     self.must_break_before = pytree_utils.GetNodeAnnotation(
         node, pytree_utils.Annotation.MUST_SPLIT, default=False)
     self.newlines = pytree_utils.GetNodeAnnotation(
         node, pytree_utils.Annotation.NEWLINES)

     # The type must be set before is_comment / is_continuation are consulted
     # below, since both properties read self.type.
     self.type = node.type
     self.column = node.column
     self.lineno = node.lineno
     self.name = pytree_utils.NodeName(node)

     self.spaces_required_before = 0
     if self.is_comment:
       self.spaces_required_before = style.Get('SPACES_BEFORE_COMMENT')

     self.value = node.value
     if self.is_continuation:
       self.value = node.value.rstrip()

     stypes = pytree_utils.GetNodeAnnotation(node,
                                             pytree_utils.Annotation.SUBTYPE)
     self.subtypes = [subtypes.NONE] if stypes is None else stypes
     self.is_pseudo = getattr(node, 'is_pseudo', False)

   @property
   def formatted_whitespace_prefix(self):
     """The whitespace prefix as it should be emitted.

     When the INDENT_BLANK_LINES style option is set and the prefix starts with
     newlines, the text following those newlines is repeated after each of
     them. Otherwise the prefix is returned unchanged.
     """
     if style.Get('INDENT_BLANK_LINES'):
       without_newlines = self.whitespace_prefix.lstrip('\n')
       height = len(self.whitespace_prefix) - len(without_newlines)
       if height:
         return ('\n' + without_newlines) * height
     return self.whitespace_prefix

   def AddWhitespacePrefix(self, newlines_before, spaces=0, indent_level=0):
     """Register a token's whitespace prefix.

     This is the whitespace that will be output before a token's string. For
     comment tokens, every line of the comment is also left-stripped and the
     lines are re-joined using the computed indentation.

     Arguments:
       newlines_before: (int) The number of newlines to place before the token.
       spaces: (int) The number of spaces to place before the token.
       indent_level: (int) The indentation level.
     """
     if style.Get('USE_TABS'):
       if newlines_before > 0:
         indent_before = '\t' * indent_level + _TabbedContinuationAlignPadding(
             spaces, style.Get('CONTINUATION_ALIGN_STYLE'),
             style.Get('INDENT_WIDTH'))
       else:
         indent_before = '\t' * indent_level + ' ' * spaces
     else:
       indent_before = (' ' * indent_level * style.Get('INDENT_WIDTH') +
                        ' ' * spaces)

     if self.is_comment:
       comment_lines = [s.lstrip() for s in self.value.splitlines()]
       self.value = ('\n' + indent_before).join(comment_lines)

     if not self.whitespace_prefix:
       # The node's own NEWLINES annotation, when set, wins over the caller's
       # newline count.
       self.whitespace_prefix = ('\n' * (self.newlines or newlines_before) +
                                 indent_before)
     else:
       self.whitespace_prefix += indent_before

   def AdjustNewlinesBefore(self, newlines_before):
     """Change the number of newlines before this token."""
     self.whitespace_prefix = ('\n' * newlines_before +
                               self.whitespace_prefix.lstrip('\n'))

   def RetainHorizontalSpacing(self, first_column, depth):
     """Retains a token's horizontal spacing.

     Sets spaces_required_before from the original column positions of this
     token and the preceding one. Nothing is changed when there is no preceding
     token.

     Arguments:
       first_column: (int) Column subtracted from this token's column when the
         token is not on the same line as the preceding token.
       depth: (int) Multiplied by the INDENT_WIDTH style option and added to the
         result in that same case.
     """
     previous = self.previous_token
     if not previous:
       return

     if previous.is_pseudo:
       previous = previous.previous_token
       if not previous:
         return

     cur_lineno = self.lineno
     prev_lineno = previous.lineno
     if previous.is_multiline_string:
       # Compare against the line on which the multiline string ends.
       prev_lineno += previous.value.count('\n')

     if (cur_lineno != prev_lineno or
         (previous.is_pseudo and previous.value != ')' and
          cur_lineno != previous.previous_token.lineno)):
       self.spaces_required_before = (
           self.column - first_column + depth * style.Get('INDENT_WIDTH'))
       return

     cur_column = self.column
     prev_column = previous.node.column
     prev_len = len(previous.value)

     if previous.is_pseudo and previous.value == ')':
       prev_column -= 1
       prev_len = 0

     if previous.is_multiline_string:
       prev_len = len(previous.value.split('\n')[-1])
       if '\n' in previous.value:
         prev_column = 0  # Last line starts in column 0.

     self.spaces_required_before = cur_column - (prev_column + prev_len)

   def OpensScope(self):
     """Returns True if the token's value is an opening bracket."""
     return self.value in pytree_utils.OPENING_BRACKETS

   def ClosesScope(self):
     """Returns True if the token's value is a closing bracket."""
     return self.value in pytree_utils.CLOSING_BRACKETS

   def __repr__(self):
     msg = ('FormatToken(name={0}, value={1}, column={2}, lineno={3}, '
            'splitpenalty={4}'.format(
                'DOCSTRING' if self.is_docstring else self.name, self.value,
                self.column, self.lineno, self.split_penalty))
     msg += ', pseudo)' if self.is_pseudo else ')'
     return msg

   @property
   def node_split_penalty(self):
     """Split penalty attached to the pytree node of this token."""
     return pytree_utils.GetNodeAnnotation(
         self.node, pytree_utils.Annotation.SPLIT_PENALTY, default=0)

   @property
   def is_binary_op(self):
     """Token is a binary operator."""
     return subtypes.BINARY_OPERATOR in self.subtypes

   @property
   def is_arithmetic_op(self):
     """Token is an arithmetic operator."""
     # Deliberately not memoized: a cache keyed on the instance would go stale
     # if value changes and would keep token objects alive.
     return self.value in self._ARITHMETIC_OPERATORS

   @property
   def is_simple_expr(self):
     """Token is an operator in a simple expression."""
     return subtypes.SIMPLE_EXPRESSION in self.subtypes

   @property
   def is_subscript_colon(self):
     """Token is a subscript colon."""
     return subtypes.SUBSCRIPT_COLON in self.subtypes

   @property
   def is_comment(self):
     """Token is a comment."""
     return self.type == token.COMMENT

   @property
   def is_continuation(self):
     """Token has the CONTINUATION type."""
     return self.type == CONTINUATION

   @property
   def is_keyword(self):
     """Token's value is a Python keyword."""
     # keyword.iskeyword is a cheap membership test, so no caching is needed.
     return keyword.iskeyword(self.value)

   @property
   def is_name(self):
     """Token is a NAME token that is not a keyword."""
     return self.type == token.NAME and not self.is_keyword

   @property
   def is_number(self):
     """Token is a number."""
     return self.type == token.NUMBER

   @property
   def is_string(self):
     """Token is a string."""
     return self.type == token.STRING

   @property
   def is_multiline_string(self):
     """Test if this string is a multiline string.

     Returns:
       A multiline string always ends with triple quotes, so if it is a string
       token, inspect the last 3 characters and return True if it is a triple
       double or triple single quote mark.
     """
     return self.is_string and self.value.endswith(('"""', "'''"))

   @property
   def is_docstring(self):
     """Token is a string with no preceding token in the unwrapped line."""
     return self.is_string and self.previous_token is None

   @property
   def is_pylint_comment(self):
     """Truthy if the token is a comment with a pylint disable/enable directive.

     The result is the regex match object (or a falsy value), not a strict bool.
     """
     return self.is_comment and re.match(r'#.*\bpylint:\s*(disable|enable)=',
                                         self.value)

   @property
   def is_pytype_comment(self):
     """Truthy if the token is a comment with a pytype disable/enable directive.

     The result is the regex match object (or a falsy value), not a strict bool.
     """
     return self.is_comment and re.match(r'#.*\bpytype:\s*(disable|enable)=',
                                         self.value)

   @property
   def is_copybara_comment(self):
     """Truthy if the token is a comment with a copybara directive.

     The recognized directives are strip, insert and replace. The result is the
     regex match object (or a falsy value), not a strict bool.
     """
     return self.is_comment and re.match(
         r'#.*\bcopybara:\s*(strip|insert|replace)', self.value)
	# Copyright 2015 Google Inc. All Rights Reserved.
	#
	# Licensed under the Apache License, Version 2.0 (the "License");
	# you may not use this file except in compliance with the License.
	# You may obtain a copy of the License at
	#
	# http://www.apache.org/licenses/LICENSE-2.0
	#
	# Unless required by applicable law or agreed to in writing, software
	# distributed under the License is distributed on an "AS IS" BASIS,
	# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	# See the License for the specific language governing permissions and
	# limitations under the License.
	"""Pytree nodes with extra formatting information.

	This is a thin wrapper around a pytree.Leaf node.
	"""

	import keyword
	import re

	from lib2to3.pgen2 import token

	from yapf.yapflib import py3compat
	from yapf.yapflib import pytree_utils
	from yapf.yapflib import style
	from yapf.yapflib import subtypes

	CONTINUATION = token.N_TOKENS


	def _TabbedContinuationAlignPadding(spaces, align_style, tab_width):
	  """Build padding string for continuation alignment in tabbed indentation.

	  The 'FIXED' and 'VALIGN-RIGHT' styles pad with tab characters only: the
	  requested number of spaces is rounded up to a whole number of tabs. Every
	  other style pads with exactly `spaces` space characters.

	  Arguments:
	    spaces: (int) The number of spaces to place before the token for alignment.
	    align_style: (str) The alignment style for continuation lines.
	    tab_width: (int) Number of columns of each tab character.

	  Returns:
	    A padding string for alignment with style specified by align_style option.
	    It is empty when a tab-only style is requested with no positive amount of
	    spaces.
	  """
	  if align_style in ('FIXED', 'VALIGN-RIGHT'):
	    if spaces > 0:
	      # Ceiling division carried out entirely on integers; this avoids the
	      # float round-trip of int(a / b).
	      return '\t' * ((spaces + tab_width - 1) // tab_width)
	    return ''
	  return ' ' * spaces


	class FormatToken(object):
	  """A wrapper around pytree Leaf nodes.

	  This represents the token plus additional information useful for reformatting
	  the code.

	  Attributes:
	    node: The PyTree node this token represents.
	    next_token: The token in the unwrapped line after this token or None if this
	      is the last token in the unwrapped line.
	    previous_token: The token in the unwrapped line before this token or None if
	      this is the first token in the unwrapped line.
	    matching_bracket: If a bracket token ('[', '{', or '(') the matching
	      bracket.
	    parameters: If this and its following tokens make up a parameter list, then
	      this is a list of those parameters.
	    container_opening: If the object is in a container, this points to its
	      opening bracket.
	    container_elements: If this is the start of a container, a list of the
	      elements in the container.
	    whitespace_prefix: The prefix for the whitespace.
	    spaces_required_before: The number of spaces required before a token. This
	      is a lower-bound for the formatter and not a hard requirement. For
	      instance, a comment may have n required spaces before it. But the
	      formatter won't place n spaces before all comments. Only those that are
	      moved to the end of a line of code. The formatter may use different
	      spacing when appropriate.
	    total_length: The total length of the unwrapped line up to and including
	      whitespace and this token. However, this doesn't include the initial
	      indentation amount.
	    split_penalty: The penalty for splitting the line before this token.
	    can_break_before: True if we're allowed to break before this token.
	    must_break_before: True if we're required to break before this token.
	    newlines: The number of newlines needed before this token.
	    type: The type of the wrapped node (copied from node.type).
	    column: The column of the wrapped node (copied from node.column).
	    lineno: The line number of the wrapped node (copied from node.lineno).
	    name: The node name as reported by pytree_utils.NodeName.
	    value: The token text. Continuation tokens have trailing whitespace
	      stripped; comment tokens are re-indented by AddWhitespacePrefix.
	    subtypes: The subtypes annotated on the node, or [subtypes.NONE].
	    is_pseudo: True if the wrapped node is flagged as a pseudo token.
	  """

	  # Operators recognized by is_arithmetic_op. Built once for the class rather
	  # than on every property access.
	  _ARITHMETIC_OPERATORS = frozenset({
	      '+',  # Add
	      '-',  # Subtract
	      '*',  # Multiply
	      '@',  # Matrix Multiply
	      '/',  # Divide
	      '//',  # Floor Divide
	      '%',  # Modulo
	      '<<',  # Left Shift
	      '>>',  # Right Shift
	      '|',  # Bitwise Or
	      '&',  # Bitwise And
	      '^',  # Bitwise Xor
	      '**',  # Power
	  })

	  def __init__(self, node):
	    """Constructor.

	    Arguments:
	      node: (pytree.Leaf) The node that's being wrapped.
	    """
	    self.node = node
	    self.next_token = None
	    self.previous_token = None
	    self.matching_bracket = None
	    self.parameters = []
	    self.container_opening = None
	    self.container_elements = []
	    self.whitespace_prefix = ''
	    self.total_length = 0
	    self.split_penalty = 0
	    self.can_break_before = False
	    self.must_break_before = pytree_utils.GetNodeAnnotation(
	        node, pytree_utils.Annotation.MUST_SPLIT, default=False)
	    self.newlines = pytree_utils.GetNodeAnnotation(
	        node, pytree_utils.Annotation.NEWLINES)

	    # The type must be set before is_comment / is_continuation are consulted
	    # below, since both properties read self.type.
	    self.type = node.type
	    self.column = node.column
	    self.lineno = node.lineno
	    self.name = pytree_utils.NodeName(node)

	    self.spaces_required_before = 0
	    if self.is_comment:
	      self.spaces_required_before = style.Get('SPACES_BEFORE_COMMENT')

	    self.value = node.value
	    if self.is_continuation:
	      self.value = node.value.rstrip()

	    stypes = pytree_utils.GetNodeAnnotation(node,
	                                            pytree_utils.Annotation.SUBTYPE)
	    self.subtypes = [subtypes.NONE] if stypes is None else stypes
	    self.is_pseudo = getattr(node, 'is_pseudo', False)

	  @property
	  def formatted_whitespace_prefix(self):
	    """The whitespace prefix as it should be emitted.

	    When the INDENT_BLANK_LINES style option is set and the prefix starts with
	    newlines, the text following those newlines is repeated after each of
	    them. Otherwise the prefix is returned unchanged.
	    """
	    if style.Get('INDENT_BLANK_LINES'):
	      without_newlines = self.whitespace_prefix.lstrip('\n')
	      height = len(self.whitespace_prefix) - len(without_newlines)
	      if height:
	        return ('\n' + without_newlines) * height
	    return self.whitespace_prefix

	  def AddWhitespacePrefix(self, newlines_before, spaces=0, indent_level=0):
	    """Register a token's whitespace prefix.

	    This is the whitespace that will be output before a token's string. For
	    comment tokens, every line of the comment is also left-stripped and the
	    lines are re-joined using the computed indentation.

	    Arguments:
	      newlines_before: (int) The number of newlines to place before the token.
	      spaces: (int) The number of spaces to place before the token.
	      indent_level: (int) The indentation level.
	    """
	    if style.Get('USE_TABS'):
	      if newlines_before > 0:
	        indent_before = '\t' * indent_level + _TabbedContinuationAlignPadding(
	            spaces, style.Get('CONTINUATION_ALIGN_STYLE'),
	            style.Get('INDENT_WIDTH'))
	      else:
	        indent_before = '\t' * indent_level + ' ' * spaces
	    else:
	      indent_before = (' ' * indent_level * style.Get('INDENT_WIDTH') +
	                       ' ' * spaces)

	    if self.is_comment:
	      comment_lines = [s.lstrip() for s in self.value.splitlines()]
	      self.value = ('\n' + indent_before).join(comment_lines)

	    if not self.whitespace_prefix:
	      # The node's own NEWLINES annotation, when set, wins over the caller's
	      # newline count.
	      self.whitespace_prefix = ('\n' * (self.newlines or newlines_before) +
	                                indent_before)
	    else:
	      self.whitespace_prefix += indent_before

	  def AdjustNewlinesBefore(self, newlines_before):
	    """Change the number of newlines before this token."""
	    self.whitespace_prefix = ('\n' * newlines_before +
	                              self.whitespace_prefix.lstrip('\n'))

	  def RetainHorizontalSpacing(self, first_column, depth):
	    """Retains a token's horizontal spacing.

	    Sets spaces_required_before from the original column positions of this
	    token and the preceding one. Nothing is changed when there is no preceding
	    token.

	    Arguments:
	      first_column: (int) Column subtracted from this token's column when the
	        token is not on the same line as the preceding token.
	      depth: (int) Multiplied by the INDENT_WIDTH style option and added to the
	        result in that same case.
	    """
	    previous = self.previous_token
	    if not previous:
	      return

	    if previous.is_pseudo:
	      previous = previous.previous_token
	      if not previous:
	        return

	    cur_lineno = self.lineno
	    prev_lineno = previous.lineno
	    if previous.is_multiline_string:
	      # Compare against the line on which the multiline string ends.
	      prev_lineno += previous.value.count('\n')

	    if (cur_lineno != prev_lineno or
	        (previous.is_pseudo and previous.value != ')' and
	         cur_lineno != previous.previous_token.lineno)):
	      self.spaces_required_before = (
	          self.column - first_column + depth * style.Get('INDENT_WIDTH'))
	      return

	    cur_column = self.column
	    prev_column = previous.node.column
	    prev_len = len(previous.value)

	    if previous.is_pseudo and previous.value == ')':
	      prev_column -= 1
	      prev_len = 0

	    if previous.is_multiline_string:
	      prev_len = len(previous.value.split('\n')[-1])
	      if '\n' in previous.value:
	        prev_column = 0  # Last line starts in column 0.

	    self.spaces_required_before = cur_column - (prev_column + prev_len)

	  def OpensScope(self):
	    """Returns True if the token's value is an opening bracket."""
	    return self.value in pytree_utils.OPENING_BRACKETS

	  def ClosesScope(self):
	    """Returns True if the token's value is a closing bracket."""
	    return self.value in pytree_utils.CLOSING_BRACKETS

	  def __repr__(self):
	    msg = ('FormatToken(name={0}, value={1}, column={2}, lineno={3}, '
	           'splitpenalty={4}'.format(
	               'DOCSTRING' if self.is_docstring else self.name, self.value,
	               self.column, self.lineno, self.split_penalty))
	    msg += ', pseudo)' if self.is_pseudo else ')'
	    return msg

	  @property
	  def node_split_penalty(self):
	    """Split penalty attached to the pytree node of this token."""
	    return pytree_utils.GetNodeAnnotation(
	        self.node, pytree_utils.Annotation.SPLIT_PENALTY, default=0)

	  @property
	  def is_binary_op(self):
	    """Token is a binary operator."""
	    return subtypes.BINARY_OPERATOR in self.subtypes

	  @property
	  def is_arithmetic_op(self):
	    """Token is an arithmetic operator."""
	    # Deliberately not memoized: a cache keyed on the instance would go stale
	    # if value changes and would keep token objects alive.
	    return self.value in self._ARITHMETIC_OPERATORS

	  @property
	  def is_simple_expr(self):
	    """Token is an operator in a simple expression."""
	    return subtypes.SIMPLE_EXPRESSION in self.subtypes

	  @property
	  def is_subscript_colon(self):
	    """Token is a subscript colon."""
	    return subtypes.SUBSCRIPT_COLON in self.subtypes

	  @property
	  def is_comment(self):
	    """Token is a comment."""
	    return self.type == token.COMMENT

	  @property
	  def is_continuation(self):
	    """Token has the CONTINUATION type."""
	    return self.type == CONTINUATION

	  @property
	  def is_keyword(self):
	    """Token's value is a Python keyword."""
	    # keyword.iskeyword is a cheap membership test, so no caching is needed.
	    return keyword.iskeyword(self.value)

	  @property
	  def is_name(self):
	    """Token is a NAME token that is not a keyword."""
	    return self.type == token.NAME and not self.is_keyword

	  @property
	  def is_number(self):
	    """Token is a number."""
	    return self.type == token.NUMBER

	  @property
	  def is_string(self):
	    """Token is a string."""
	    return self.type == token.STRING

	  @property
	  def is_multiline_string(self):
	    """Test if this string is a multiline string.

	    Returns:
	      A multiline string always ends with triple quotes, so if it is a string
	      token, inspect the last 3 characters and return True if it is a triple
	      double or triple single quote mark.
	    """
	    return self.is_string and self.value.endswith(('"""', "'''"))

	  @property
	  def is_docstring(self):
	    """Token is a string with no preceding token in the unwrapped line."""
	    return self.is_string and self.previous_token is None

	  @property
	  def is_pylint_comment(self):
	    """Truthy if the token is a comment with a pylint disable/enable directive.

	    The result is the regex match object (or a falsy value), not a strict bool.
	    """
	    return self.is_comment and re.match(r'#.*\bpylint:\s*(disable|enable)=',
	                                        self.value)

	  @property
	  def is_pytype_comment(self):
	    """Truthy if the token is a comment with a pytype disable/enable directive.

	    The result is the regex match object (or a falsy value), not a strict bool.
	    """
	    return self.is_comment and re.match(r'#.*\bpytype:\s*(disable|enable)=',
	                                        self.value)

	  @property
	  def is_copybara_comment(self):
	    """Truthy if the token is a comment with a copybara directive.

	    The recognized directives are strip, insert and replace. The result is the
	    regex match object (or a falsy value), not a strict bool.
	    """
	    return self.is_comment and re.match(
	        r'#.*\bcopybara:\s*(strip|insert|replace)', self.value)