| # Copyright 2015 Google Inc. All Rights Reserved. |
| # |
| # Licensed under the Apache License, Version 2.0 (the "License"); |
| # you may not use this file except in compliance with the License. |
| # You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, software |
| # distributed under the License is distributed on an "AS IS" BASIS, |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| # See the License for the specific language governing permissions and |
| # limitations under the License. |
| """Pytree nodes with extra formatting information. |
| |
| This is a thin wrapper around a pytree.Leaf node. |
| """ |
| |
| import keyword |
| import re |
| |
| from lib2to3.pgen2 import token |
| |
| from yapf.yapflib import py3compat |
| from yapf.yapflib import pytree_utils |
| from yapf.yapflib import style |
| from yapf.yapflib import subtypes |
| |
| CONTINUATION = token.N_TOKENS |
| |
| |
| def _TabbedContinuationAlignPadding(spaces, align_style, tab_width): |
| """Build padding string for continuation alignment in tabbed indentation. |
| |
| Arguments: |
| spaces: (int) The number of spaces to place before the token for alignment. |
| align_style: (str) The alignment style for continuation lines. |
| tab_width: (int) Number of columns of each tab character. |
| |
| Returns: |
| A padding string for alignment with style specified by align_style option. |
| """ |
| if align_style in ('FIXED', 'VALIGN-RIGHT'): |
| if spaces > 0: |
| return '\t' * int((spaces + tab_width - 1) / tab_width) |
| return '' |
| return ' ' * spaces |
| |
| |
| class FormatToken(object): |
| """A wrapper around pytree Leaf nodes. |
| |
| This represents the token plus additional information useful for reformatting |
| the code. |
| |
| Attributes: |
| node: The PyTree node this token represents. |
| next_token: The token in the unwrapped line after this token or None if this |
| is the last token in the unwrapped line. |
| previous_token: The token in the unwrapped line before this token or None if |
| this is the first token in the unwrapped line. |
| matching_bracket: If a bracket token ('[', '{', or '(') the matching |
| bracket. |
| parameters: If this and its following tokens make up a parameter list, then |
| this is a list of those parameters. |
| container_opening: If the object is in a container, this points to its |
| opening bracket. |
| container_elements: If this is the start of a container, a list of the |
| elements in the container. |
| whitespace_prefix: The prefix for the whitespace. |
| spaces_required_before: The number of spaces required before a token. This |
| is a lower-bound for the formatter and not a hard requirement. For |
| instance, a comment may have n required spaces before it. But the |
| formatter won't place n spaces before all comments. Only those that are |
| moved to the end of a line of code. The formatter may use different |
| spacing when appropriate. |
| total_length: The total length of the unwrapped line up to and including |
| whitespace and this token. However, this doesn't include the initial |
| indentation amount. |
| split_penalty: The penalty for splitting the line before this token. |
| can_break_before: True if we're allowed to break before this token. |
| must_break_before: True if we're required to break before this token. |
| newlines: The number of newlines needed before this token. |
| """ |
| |
| def __init__(self, node): |
| """Constructor. |
| |
| Arguments: |
| node: (pytree.Leaf) The node that's being wrapped. |
| """ |
| self.node = node |
| self.next_token = None |
| self.previous_token = None |
| self.matching_bracket = None |
| self.parameters = [] |
| self.container_opening = None |
| self.container_elements = [] |
| self.whitespace_prefix = '' |
| self.total_length = 0 |
| self.split_penalty = 0 |
| self.can_break_before = False |
| self.must_break_before = pytree_utils.GetNodeAnnotation( |
| node, pytree_utils.Annotation.MUST_SPLIT, default=False) |
| self.newlines = pytree_utils.GetNodeAnnotation( |
| node, pytree_utils.Annotation.NEWLINES) |
| |
| self.type = node.type |
| self.column = node.column |
| self.lineno = node.lineno |
| self.name = pytree_utils.NodeName(node) |
| |
| self.spaces_required_before = 0 |
| if self.is_comment: |
| self.spaces_required_before = style.Get('SPACES_BEFORE_COMMENT') |
| |
| self.value = node.value |
| if self.is_continuation: |
| self.value = node.value.rstrip() |
| |
| stypes = pytree_utils.GetNodeAnnotation(node, |
| pytree_utils.Annotation.SUBTYPE) |
| self.subtypes = [subtypes.NONE] if stypes is None else stypes |
| self.is_pseudo = hasattr(node, 'is_pseudo') and node.is_pseudo |
| |
| @property |
| def formatted_whitespace_prefix(self): |
| if style.Get('INDENT_BLANK_LINES'): |
| without_newlines = self.whitespace_prefix.lstrip('\n') |
| height = len(self.whitespace_prefix) - len(without_newlines) |
| if height: |
| return ('\n' + without_newlines) * height |
| return self.whitespace_prefix |
| |
| def AddWhitespacePrefix(self, newlines_before, spaces=0, indent_level=0): |
| """Register a token's whitespace prefix. |
| |
| This is the whitespace that will be output before a token's string. |
| |
| Arguments: |
| newlines_before: (int) The number of newlines to place before the token. |
| spaces: (int) The number of spaces to place before the token. |
| indent_level: (int) The indentation level. |
| """ |
| if style.Get('USE_TABS'): |
| if newlines_before > 0: |
| indent_before = '\t' * indent_level + _TabbedContinuationAlignPadding( |
| spaces, style.Get('CONTINUATION_ALIGN_STYLE'), |
| style.Get('INDENT_WIDTH')) |
| else: |
| indent_before = '\t' * indent_level + ' ' * spaces |
| else: |
| indent_before = (' ' * indent_level * style.Get('INDENT_WIDTH') + |
| ' ' * spaces) |
| |
| if self.is_comment: |
| comment_lines = [s.lstrip() for s in self.value.splitlines()] |
| self.value = ('\n' + indent_before).join(comment_lines) |
| |
| # Update our own value since we are changing node value |
| self.value = self.value |
| |
| if not self.whitespace_prefix: |
| self.whitespace_prefix = ('\n' * (self.newlines or newlines_before) + |
| indent_before) |
| else: |
| self.whitespace_prefix += indent_before |
| |
| def AdjustNewlinesBefore(self, newlines_before): |
| """Change the number of newlines before this token.""" |
| self.whitespace_prefix = ('\n' * newlines_before + |
| self.whitespace_prefix.lstrip('\n')) |
| |
| def RetainHorizontalSpacing(self, first_column, depth): |
| """Retains a token's horizontal spacing.""" |
| previous = self.previous_token |
| if not previous: |
| return |
| |
| if previous.is_pseudo: |
| previous = previous.previous_token |
| if not previous: |
| return |
| |
| cur_lineno = self.lineno |
| prev_lineno = previous.lineno |
| if previous.is_multiline_string: |
| prev_lineno += previous.value.count('\n') |
| |
| if (cur_lineno != prev_lineno or |
| (previous.is_pseudo and previous.value != ')' and |
| cur_lineno != previous.previous_token.lineno)): |
| self.spaces_required_before = ( |
| self.column - first_column + depth * style.Get('INDENT_WIDTH')) |
| return |
| |
| cur_column = self.column |
| prev_column = previous.node.column |
| prev_len = len(previous.value) |
| |
| if previous.is_pseudo and previous.value == ')': |
| prev_column -= 1 |
| prev_len = 0 |
| |
| if previous.is_multiline_string: |
| prev_len = len(previous.value.split('\n')[-1]) |
| if '\n' in previous.value: |
| prev_column = 0 # Last line starts in column 0. |
| |
| self.spaces_required_before = cur_column - (prev_column + prev_len) |
| |
| def OpensScope(self): |
| return self.value in pytree_utils.OPENING_BRACKETS |
| |
| def ClosesScope(self): |
| return self.value in pytree_utils.CLOSING_BRACKETS |
| |
| def __repr__(self): |
| msg = ('FormatToken(name={0}, value={1}, column={2}, lineno={3}, ' |
| 'splitpenalty={4}'.format( |
| 'DOCSTRING' if self.is_docstring else self.name, self.value, |
| self.column, self.lineno, self.split_penalty)) |
| msg += ', pseudo)' if self.is_pseudo else ')' |
| return msg |
| |
| @property |
| def node_split_penalty(self): |
| """Split penalty attached to the pytree node of this token.""" |
| return pytree_utils.GetNodeAnnotation( |
| self.node, pytree_utils.Annotation.SPLIT_PENALTY, default=0) |
| |
| @property |
| def is_binary_op(self): |
| """Token is a binary operator.""" |
| return subtypes.BINARY_OPERATOR in self.subtypes |
| |
| @property |
| @py3compat.lru_cache() |
| def is_arithmetic_op(self): |
| """Token is an arithmetic operator.""" |
| return self.value in frozenset({ |
| '+', # Add |
| '-', # Subtract |
| '*', # Multiply |
| '@', # Matrix Multiply |
| '/', # Divide |
| '//', # Floor Divide |
| '%', # Modulo |
| '<<', # Left Shift |
| '>>', # Right Shift |
| '|', # Bitwise Or |
| '&', # Bitwise Add |
| '^', # Bitwise Xor |
| '**', # Power |
| }) |
| |
| @property |
| def is_simple_expr(self): |
| """Token is an operator in a simple expression.""" |
| return subtypes.SIMPLE_EXPRESSION in self.subtypes |
| |
| @property |
| def is_subscript_colon(self): |
| """Token is a subscript colon.""" |
| return subtypes.SUBSCRIPT_COLON in self.subtypes |
| |
| @property |
| def is_comment(self): |
| return self.type == token.COMMENT |
| |
| @property |
| def is_continuation(self): |
| return self.type == CONTINUATION |
| |
| @property |
| @py3compat.lru_cache() |
| def is_keyword(self): |
| return keyword.iskeyword(self.value) |
| |
| @property |
| def is_name(self): |
| return self.type == token.NAME and not self.is_keyword |
| |
| @property |
| def is_number(self): |
| return self.type == token.NUMBER |
| |
| @property |
| def is_string(self): |
| return self.type == token.STRING |
| |
| @property |
| def is_multiline_string(self): |
| """Test if this string is a multiline string. |
| |
| Returns: |
| A multiline string always ends with triple quotes, so if it is a string |
| token, inspect the last 3 characters and return True if it is a triple |
| double or triple single quote mark. |
| """ |
| return self.is_string and self.value.endswith(('"""', "'''")) |
| |
| @property |
| def is_docstring(self): |
| return self.is_string and self.previous_token is None |
| |
| @property |
| def is_pylint_comment(self): |
| return self.is_comment and re.match(r'#.*\bpylint:\s*(disable|enable)=', |
| self.value) |
| |
| @property |
| def is_pytype_comment(self): |
| return self.is_comment and re.match(r'#.*\bpytype:\s*(disable|enable)=', |
| self.value) |
| |
| @property |
| def is_copybara_comment(self): |
| return self.is_comment and re.match( |
| r'#.*\bcopybara:\s*(strip|insert|replace)', self.value) |