Update docs for configuration

[third_party/pep8] / pep8.py
diff --git a/pep8.py b/pep8.py

index 1000a06e8bd5ea2eef36b33cc0b40eb6b9e40649..67b32d16d9320d436d813eedf9374664117df3bc 100755 (executable)
--- a/pep8.py
+++ b/pep8.py
@@ -47,8 +47,6 @@ W warnings
  """
  from __future__ import with_statement
  
-__version__ = '1.6.0a0'
-
  import os
  import sys
  import re
@@ -64,13 +62,19 @@ try:
  except ImportError:
      from ConfigParser import RawConfigParser
  
-DEFAULT_EXCLUDE = '.svn,CVS,.bzr,.hg,.git,__pycache__'
-DEFAULT_IGNORE = 'E123,E226,E24,E704'
-if sys.platform == 'win32':
-    DEFAULT_CONFIG = os.path.expanduser(r'~\.pep8')
-else:
-    DEFAULT_CONFIG = os.path.join(os.getenv('XDG_CONFIG_HOME') or
-                                  os.path.expanduser('~/.config'), 'pep8')
+__version__ = '1.6.0a0'
+
+# Comma-separated default lists.  DEFAULT_IGNORE is also echoed in the
+# help text of the --ignore option.
+DEFAULT_EXCLUDE = '.svn,CVS,.bzr,.hg,.git,__pycache__,.tox'
+DEFAULT_IGNORE = 'E121,E123,E126,E226,E24,E704'
+# Per-user configuration path: ~\.pep8 on win32, otherwise
+# $XDG_CONFIG_HOME/pep8 with ~/.config/pep8 as the fallback.
+# DEFAULT_CONFIG is None when computing the path raises ImportError.
+# NOTE(review): presumably this covers platforms where expanduser() cannot
+# import a module it depends on -- confirm.
+try:
+    if sys.platform == 'win32':
+        DEFAULT_CONFIG = os.path.expanduser(r'~\.pep8')
+    else:
+        DEFAULT_CONFIG = os.path.join(os.getenv('XDG_CONFIG_HOME') or
+                                      os.path.expanduser('~/.config'), 'pep8')
+except ImportError:
+    DEFAULT_CONFIG = None
+
  PROJECT_CONFIG = ('setup.cfg', 'tox.ini', '.pep8')
  TESTSUITE_PATH = os.path.join(os.path.dirname(__file__), 'testsuite')
  MAX_LINE_LENGTH = 79
@@ -102,8 +106,9 @@ ERRORCODE_REGEX = re.compile(r'\b[A-Z]\d{3}\b')
  DOCSTRING_REGEX = re.compile(r'u?r?["\']')
  EXTRANEOUS_WHITESPACE_REGEX = re.compile(r'[[({] | []}),;:]')
  WHITESPACE_AFTER_COMMA_REGEX = re.compile(r'[,;:]\s*(?:  |\t)')
-COMPARE_SINGLETON_REGEX = re.compile(r'([=!]=)\s*(None|False|True)')
-COMPARE_NEGATIVE_REGEX = re.compile(r'\b(not)\s+[^[({ ]+\s+(in|is)\s')
+COMPARE_SINGLETON_REGEX = re.compile(r'\b(None|False|True)?\s*([=!]=)'
+                                     r'\s*(?(1)|(None|False|True))\b')
+COMPARE_NEGATIVE_REGEX = re.compile(r'\b(not)\s+[^][)(}{ ]+\s+(in|is)\s')
  COMPARE_TYPE_REGEX = re.compile(r'(?:[=!]=|is(?:\s+not)?)\s*type(?:s.\w+Type'
                                  r'|\s*\(\s*([^)]*[^ )])\s*\))')
  KEYWORD_REGEX = re.compile(r'(\s*)\b(?:%s)\b(\s*)' % r'|'.join(KEYWORDS))
@@ -681,7 +686,7 @@ def missing_whitespace_around_operator(logical_line, tokens):
                  if need_space is True or need_space[1]:
                      # A needed trailing space was not found
                      yield prev_end, "E225 missing whitespace around operator"
-                else:
+                elif prev_text != '**':
                      code, optype = 'E226', 'arithmetic'
                      if prev_text == '%':
                          code, optype = 'E228', 'modulo'
@@ -749,6 +754,7 @@ def whitespace_around_named_parameter_equals(logical_line, tokens):
      Okay: boolean(a != b)
      Okay: boolean(a <= b)
      Okay: boolean(a >= b)
+    Okay: def foo(arg: int = 42):
  
      E251: def complex(real, imag = 0.0):
      E251: return magic(r = real, i = imag)
@@ -756,6 +762,8 @@ def whitespace_around_named_parameter_equals(logical_line, tokens):
      parens = 0
      no_space = False
      prev_end = None
+    annotated_func_arg = False
+    in_def = logical_line.startswith('def')
      message = "E251 unexpected spaces around keyword / parameter equals"
      for token_type, text, start, end, line in tokens:
          if token_type == tokenize.NL:
@@ -764,15 +772,22 @@ def whitespace_around_named_parameter_equals(logical_line, tokens):
              no_space = False
              if start != prev_end:
                  yield (prev_end, message)
-        elif token_type == tokenize.OP:
+        if token_type == tokenize.OP:
              if text == '(':
                  parens += 1
              elif text == ')':
                  parens -= 1
-            elif parens and text == '=':
+            elif in_def and text == ':' and parens == 1:
+                annotated_func_arg = True
+            elif parens and text == ',' and parens == 1:
+                annotated_func_arg = False
+            elif parens and text == '=' and not annotated_func_arg:
                  no_space = True
                  if start != prev_end:
                      yield (prev_end, message)
+            if not parens:
+                annotated_func_arg = False
+
          prev_end = end
  
  
@@ -836,6 +851,56 @@ def imports_on_separate_lines(logical_line):
              yield found, "E401 multiple imports on one line"
  
  
+def module_imports_on_top_of_file(
+        logical_line, indent_level, checker_state, noqa):
+    r"""Imports are always put at the top of the file, just after any module
+    comments and docstrings, and before module globals and constants.
+
+    Okay: import os
+    Okay: # this is a comment\nimport os
+    Okay: '''this is a module docstring'''\nimport os
+    Okay: r'''this is a module docstring'''\nimport os
+    Okay: try:\n    import x\nexcept:\n    pass\nelse:\n    pass\nimport y
+    Okay: try:\n    import x\nexcept:\n    pass\nfinally:\n    pass\nimport y
+    E402: a=1\nimport os
+    E402: 'One string'\n"Two string"\nimport os
+    E402: a=1\nfrom sys import x
+    E402: tryout=1\nimport os
+
+    Okay: if x:\n    import os
+    """
+    # Arguments:
+    #   logical_line   -- text of the line being checked
+    #   indent_level   -- non-zero for indented code, which is never flagged
+    #   checker_state  -- dict kept between calls; this check stores the
+    #                     'seen_docstring' and 'seen_non_imports' flags in it
+    #   noqa           -- true when the line opted out of checking
+    # Yields (offset, message) pairs; at most one E402 per line.
+
+    def is_string_literal(line):
+        # Skip an optional u/b prefix followed by an optional r prefix, then
+        # expect an opening quote.
+        if line[0] in 'uUbB':
+            line = line[1:]
+        if line and line[0] in 'rR':
+            line = line[1:]
+        return line and (line[0] == '"' or line[0] == "'")
+
+    def starts_with_keyword(line, keyword):
+        # A keyword must end at a word boundary: ``tryout = 1`` is an
+        # assignment, not a ``try`` clause, and must count as a non-import.
+        following = line[len(keyword):len(keyword) + 1]
+        return (line.startswith(keyword) and
+                not (following.isalnum() or following == '_'))
+
+    allowed_try_keywords = ('try', 'except', 'else', 'finally')
+
+    if indent_level:  # Allow imports in conditional statements or functions
+        return
+    if not logical_line:  # Allow empty lines or comments
+        return
+    if noqa:
+        return
+    line = logical_line
+    if line.startswith('import ') or line.startswith('from '):
+        if checker_state.get('seen_non_imports', False):
+            yield 0, "E402 module level import not at top of file"
+    elif any(starts_with_keyword(line, kw) for kw in allowed_try_keywords):
+        # Allow try, except, else, finally keywords intermixed with imports in
+        # order to support conditional importing
+        return
+    elif is_string_literal(line):
+        # The first literal is a docstring, allow it. Otherwise, report error.
+        if checker_state.get('seen_docstring', False):
+            checker_state['seen_non_imports'] = True
+        else:
+            checker_state['seen_docstring'] = True
+    else:
+        checker_state['seen_non_imports'] = True
+
+
  def compound_statements(logical_line):
      r"""Compound statements (on the same line) are generally discouraged.
  
@@ -872,8 +937,12 @@ def compound_statements(logical_line):
          if ((before.count('{') <= before.count('}') and   # {'a': 1} (dict)
               before.count('[') <= before.count(']') and   # [1:2] (slice)
               before.count('(') <= before.count(')'))):    # (annotation)
-            if LAMBDA_REGEX.search(before):
-                yield 0, "E731 do not assign a lambda expression, use a def"
+            lambda_kw = LAMBDA_REGEX.search(before)
+            if lambda_kw:
+                before = line[:lambda_kw.start()].rstrip()
+                if before[-1:] == '=' and isidentifier(before[:-1].strip()):
+                    yield 0, ("E731 do not assign a lambda expression, use a "
+                              "def")
                  break
              if before.startswith('def '):
                  yield 0, "E704 multiple statements on one line (def)"
@@ -931,7 +1000,9 @@ def comparison_to_singleton(logical_line, noqa):
  
      Okay: if arg is not None:
      E711: if arg != None:
+    E711: if None == arg:
      E712: if arg == True:
+    E712: if False == arg:
  
      Also, beware of writing if x when you really mean if x is not None --
      e.g. when testing whether a variable or argument that defaults to None was
@@ -940,8 +1011,9 @@ def comparison_to_singleton(logical_line, noqa):
      """
      match = not noqa and COMPARE_SINGLETON_REGEX.search(logical_line)
      if match:
-        same = (match.group(1) == '==')
-        singleton = match.group(2)
+        singleton = match.group(1) or match.group(3)
+        same = (match.group(2) == '==')
+
          msg = "'if cond is %s:'" % (('' if same else 'not ') + singleton)
          if singleton in ('None',):
              code = 'E711'
@@ -950,7 +1022,7 @@ def comparison_to_singleton(logical_line, noqa):
              nonzero = ((singleton == 'True' and same) or
                         (singleton == 'False' and not same))
              msg += " or 'if %scond:'" % ('' if nonzero else 'not ')
-        yield match.start(1), ("%s comparison to %s should be %s" %
+        yield match.start(2), ("%s comparison to %s should be %s" %
                                 (code, singleton, msg))
  
  
@@ -1057,7 +1129,7 @@ if '' == ''.encode():
          """Read the source code."""
          with open(filename, 'rU') as f:
              return f.readlines()
-    isidentifier = re.compile(r'[a-zA-Z_]\w*').match
+    isidentifier = re.compile(r'[a-zA-Z_]\w*$').match
      stdin_get_value = sys.stdin.read
  else:
      # Python 3
@@ -1156,10 +1228,13 @@ def normalize_paths(value, parent=os.curdir):
  
      Return a list of absolute paths.
      """
-    if not value or isinstance(value, list):
+    if not value:
+        return []
+    if isinstance(value, list):
          return value
      paths = []
      for path in value.split(','):
+        path = path.strip()
          if '/' in path:
              path = os.path.abspath(os.path.join(parent, path))
          paths.append(path.rstrip('/'))
@@ -1176,14 +1251,12 @@ def filename_match(filename, patterns, default=True):
      return any(fnmatch(filename, pattern) for pattern in patterns)
  
  
+# A token closes a line when its type is in NEWLINE, or when nothing but a
+# backslash continuation follows it on its line (token[4] is the line text
+# and token[3][1] the column where the token ends).
+def _is_eol_token(token):
+    return token[0] in NEWLINE or token[4][token[3][1]:].lstrip() == '\\\n'
if COMMENT_WITH_NL:
-    def _is_eol_token(token):
-        return (token[0] in NEWLINE or
-                (token[0] == tokenize.COMMENT and token[1] == token[4]))
-else:
-    def _is_eol_token(token):
-        return token[0] in NEWLINE
-
+    # Wrap the base predicate (captured as a default argument) so that a
+    # COMMENT token whose text is its entire line also counts as EOL.
+    def _is_eol_token(token, _eol_token=_is_eol_token):
+        return _eol_token(token) or (token[0] == tokenize.COMMENT and
+                                     token[1] == token[4])
  
  ##############################################################################
  # Framework to run all checks
@@ -1240,6 +1313,8 @@ class Checker(object):
          self.hang_closing = options.hang_closing
          self.verbose = options.verbose
          self.filename = filename
+        # Dictionary where a checker can store its custom state.
+        self._checker_states = {}
          if filename is None:
              self.filename = 'stdin'
              self.lines = lines or []
@@ -1295,10 +1370,16 @@ class Checker(object):
              arguments.append(getattr(self, name))
          return check(*arguments)
  
+    def init_checker_state(self, name, argument_names):
+        """Bind ``self.checker_state`` to the state dict kept for *name*.
+
+        Nothing happens unless 'checker_state' is listed in
+        *argument_names*.  Otherwise the dict stored under *name* in
+        ``self._checker_states`` is reused, or created empty on first use.
+        """
+        if 'checker_state' not in argument_names:
+            return
+        states = self._checker_states
+        if name not in states:
+            states[name] = {}
+        self.checker_state = states[name]
+
      def check_physical(self, line):
          """Run all physical checks on a raw input line."""
          self.physical_line = line
          for name, check, argument_names in self._physical_checks:
+            self.init_checker_state(name, argument_names)
              result = self.run_check(check, argument_names)
              if result is not None:
                  (offset, text) = result
@@ -1343,6 +1424,10 @@ class Checker(object):
          """Build a line from tokens and run all logical checks on it."""
          self.report.increment_logical_line()
          mapping = self.build_tokens_line()
+
+        if not mapping:
+            return
+
          (start_row, start_col) = mapping[0][1]
          start_line = self.lines[start_row - 1]
          self.indent_level = expand_indent(start_line[:start_col])
@@ -1353,6 +1438,7 @@ class Checker(object):
          for name, check, argument_names in self._logical_checks:
              if self.verbose >= 4:
                  print('   ' + name)
+            self.init_checker_state(name, argument_names)
              for offset, text in self.run_check(check, argument_names) or ():
                  if not isinstance(offset, tuple):
                      for token_offset, pos in mapping:
@@ -1790,7 +1876,8 @@ def get_parser(prog='pep8', version=__version__):
      parser.add_option('--select', metavar='errors', default='',
                        help="select errors and warnings (e.g. E,W6)")
      parser.add_option('--ignore', metavar='errors', default='',
-                      help="skip errors and warnings (e.g. E4,W)")
+                      help="skip errors and warnings (e.g. E4,W) "
+                           "(default: %s)" % DEFAULT_IGNORE)
      parser.add_option('--show-source', action='store_true',
                        help="show source code for each error")
      parser.add_option('--show-pep8', action='store_true',