Update docs for configuration

[third_party/pep8] / pep8.py
diff --git a/pep8.py b/pep8.py

index 92042fba12aa26ea917d16883264d6b72aca62ee..67b32d16d9320d436d813eedf9374664117df3bc 100755 (executable)
--- a/pep8.py
+++ b/pep8.py
@@ -2,6 +2,7 @@
  # pep8.py - Check Python source code formatting, according to PEP 8
  # Copyright (C) 2006-2009 Johann C. Rocholl <johann@rocholl.net>
  # Copyright (C) 2009-2014 Florent Xicluna <florent.xicluna@gmail.com>
+# Copyright (C) 2014 Ian Lee <ianlee1521@gmail.com>
  #
  # Permission is hereby granted, free of charge, to any person
  # obtaining a copy of this software and associated documentation files
@@ -46,8 +47,6 @@ W warnings
  """
  from __future__ import with_statement
  
-__version__ = '1.5.7a0'
-
  import os
  import sys
  import re
@@ -63,13 +62,19 @@ try:
  except ImportError:
      from ConfigParser import RawConfigParser
  
-DEFAULT_EXCLUDE = '.svn,CVS,.bzr,.hg,.git,__pycache__'
-DEFAULT_IGNORE = 'E123,E226,E24'
-if sys.platform == 'win32':
-    DEFAULT_CONFIG = os.path.expanduser(r'~\.pep8')
-else:
-    DEFAULT_CONFIG = os.path.join(os.getenv('XDG_CONFIG_HOME') or
-                                  os.path.expanduser('~/.config'), 'pep8')
+__version__ = '1.6.0a0'
+
+DEFAULT_EXCLUDE = '.svn,CVS,.bzr,.hg,.git,__pycache__,.tox'
+DEFAULT_IGNORE = 'E121,E123,E126,E226,E24,E704'
+try:
+    if sys.platform == 'win32':
+        DEFAULT_CONFIG = os.path.expanduser(r'~\.pep8')
+    else:
+        DEFAULT_CONFIG = os.path.join(os.getenv('XDG_CONFIG_HOME') or
+                                      os.path.expanduser('~/.config'), 'pep8')
+except ImportError:
+    DEFAULT_CONFIG = None
+
  PROJECT_CONFIG = ('setup.cfg', 'tox.ini', '.pep8')
  TESTSUITE_PATH = os.path.join(os.path.dirname(__file__), 'testsuite')
  MAX_LINE_LENGTH = 79
@@ -101,8 +106,9 @@ ERRORCODE_REGEX = re.compile(r'\b[A-Z]\d{3}\b')
  DOCSTRING_REGEX = re.compile(r'u?r?["\']')
  EXTRANEOUS_WHITESPACE_REGEX = re.compile(r'[[({] | []}),;:]')
  WHITESPACE_AFTER_COMMA_REGEX = re.compile(r'[,;:]\s*(?:  |\t)')
-COMPARE_SINGLETON_REGEX = re.compile(r'([=!]=)\s*(None|False|True)')
-COMPARE_NEGATIVE_REGEX = re.compile(r'\b(not)\s+[^[({ ]+\s+(in|is)\s')
+COMPARE_SINGLETON_REGEX = re.compile(r'\b(None|False|True)?\s*([=!]=)'
+                                     r'\s*(?(1)|(None|False|True))\b')
+COMPARE_NEGATIVE_REGEX = re.compile(r'\b(not)\s+[^][)(}{ ]+\s+(in|is)\s')
  COMPARE_TYPE_REGEX = re.compile(r'(?:[=!]=|is(?:\s+not)?)\s*type(?:s.\w+Type'
                                  r'|\s*\(\s*([^)]*[^ )])\s*\))')
  KEYWORD_REGEX = re.compile(r'(\s*)\b(?:%s)\b(\s*)' % r'|'.join(KEYWORDS))
@@ -353,20 +359,25 @@ def indentation(logical_line, previous_logical, indent_char,
      Okay: a = 1
      Okay: if a == 0:\n    a = 1
      E111:   a = 1
+    E114:   # a = 1
  
      Okay: for item in items:\n    pass
      E112: for item in items:\npass
+    E115: for item in items:\n# Hi\n    pass
  
      Okay: a = 1\nb = 2
      E113: a = 1\n    b = 2
+    E116: a = 1\n    # b = 2
      """
-    if indent_char == ' ' and indent_level % 4:
-        yield 0, "E111 indentation is not a multiple of four"
+    c = 0 if logical_line else 3
+    tmpl = "E11%d %s" if logical_line else "E11%d %s (comment)"
+    if indent_level % 4:
+        yield 0, tmpl % (1 + c, "indentation is not a multiple of four")
      indent_expect = previous_logical.endswith(':')
      if indent_expect and indent_level <= previous_indent_level:
-        yield 0, "E112 expected an indented block"
-    if indent_level > previous_indent_level and not indent_expect:
-        yield 0, "E113 unexpected indentation"
+        yield 0, tmpl % (2 + c, "expected an indented block")
+    elif not indent_expect and indent_level > previous_indent_level:
+        yield 0, tmpl % (3 + c, "unexpected indentation")
  
  
  def continued_indentation(logical_line, tokens, indent_level, hang_closing,
@@ -675,7 +686,7 @@ def missing_whitespace_around_operator(logical_line, tokens):
                  if need_space is True or need_space[1]:
                      # A needed trailing space was not found
                      yield prev_end, "E225 missing whitespace around operator"
-                else:
+                elif prev_text != '**':
                      code, optype = 'E226', 'arithmetic'
                      if prev_text == '%':
                          code, optype = 'E228', 'modulo'
@@ -743,6 +754,7 @@ def whitespace_around_named_parameter_equals(logical_line, tokens):
      Okay: boolean(a != b)
      Okay: boolean(a <= b)
      Okay: boolean(a >= b)
+    Okay: def foo(arg: int = 42):
  
      E251: def complex(real, imag = 0.0):
      E251: return magic(r = real, i = imag)
@@ -750,6 +762,8 @@ def whitespace_around_named_parameter_equals(logical_line, tokens):
      parens = 0
      no_space = False
      prev_end = None
+    annotated_func_arg = False
+    in_def = logical_line.startswith('def')
      message = "E251 unexpected spaces around keyword / parameter equals"
      for token_type, text, start, end, line in tokens:
          if token_type == tokenize.NL:
@@ -758,15 +772,22 @@ def whitespace_around_named_parameter_equals(logical_line, tokens):
              no_space = False
              if start != prev_end:
                  yield (prev_end, message)
-        elif token_type == tokenize.OP:
+        if token_type == tokenize.OP:
              if text == '(':
                  parens += 1
              elif text == ')':
                  parens -= 1
-            elif parens and text == '=':
+            elif in_def and text == ':' and parens == 1:
+                annotated_func_arg = True
+            elif parens and text == ',' and parens == 1:
+                annotated_func_arg = False
+            elif parens and text == '=' and not annotated_func_arg:
                  no_space = True
                  if start != prev_end:
                      yield (prev_end, message)
+            if not parens:
+                annotated_func_arg = False
+
          prev_end = end
  
  
@@ -787,6 +808,7 @@ def whitespace_before_comment(logical_line, tokens):
      E262: x = x + 1  #Increment x
      E262: x = x + 1  #  Increment x
      E265: #Block comment
+    E266: ### Block comment
      """
      prev_end = (0, 0)
      for token_type, text, start, end, line in tokens:
@@ -797,13 +819,15 @@ def whitespace_before_comment(logical_line, tokens):
                      yield (prev_end,
                             "E261 at least two spaces before inline comment")
              symbol, sp, comment = text.partition(' ')
-            bad_prefix = symbol not in ('#', '#:')
+            bad_prefix = symbol not in '#:' and (symbol.lstrip('#')[:1] or '#')
              if inline_comment:
-                if bad_prefix or comment[:1].isspace():
+                if bad_prefix or comment[:1] in WHITESPACE:
                      yield start, "E262 inline comment should start with '# '"
-            elif bad_prefix:
-                if text.rstrip('#') and (start[0] > 1 or symbol[1] != '!'):
+            elif bad_prefix and (bad_prefix != '!' or start[0] > 1):
+                if bad_prefix != '#':
                      yield start, "E265 block comment should start with '# '"
+                elif comment:
+                    yield start, "E266 too many leading '#' for block comment"
          elif token_type != tokenize.NL:
              prev_end = end
  
@@ -827,6 +851,56 @@ def imports_on_separate_lines(logical_line):
              yield found, "E401 multiple imports on one line"
  
  
+def module_imports_on_top_of_file(
+        logical_line, indent_level, checker_state, noqa):
+    r"""Imports are always put at the top of the file, just after any module
+    comments and docstrings, and before module globals and constants.
+
+    Okay: import os
+    Okay: # this is a comment\nimport os
+    Okay: '''this is a module docstring'''\nimport os
+    Okay: r'''this is a module docstring'''\nimport os
+    Okay: try:\n    import x\nexcept:\n    pass\nelse:\n    pass\nimport y
+    Okay: try:\n    import x\nexcept:\n    pass\nfinally:\n    pass\nimport y
+    E402: a=1\nimport os
+    E402: 'One string'\n"Two string"\nimport os
+    E402: a=1\nfrom sys import x
+
+    Okay: if x:\n    import os
+    """
+    def is_string_literal(line):
+        if line[0] in 'uUbB':
+            line = line[1:]
+        if line and line[0] in 'rR':
+            line = line[1:]
+        return line and (line[0] == '"' or line[0] == "'")
+
+    allowed_try_keywords = ('try', 'except', 'else', 'finally')
+
+    if indent_level:  # Allow imports in conditional statements or functions
+        return
+    if not logical_line:  # Allow empty lines or comments
+        return
+    if noqa:
+        return
+    line = logical_line
+    if line.startswith('import ') or line.startswith('from '):
+        if checker_state.get('seen_non_imports', False):
+            yield 0, "E402 module level import not at top of file"
+    elif any(line.startswith(kw) for kw in allowed_try_keywords):
+        # Allow try, except, else, finally keywords intermixed with imports in
+        # order to support conditional importing
+        return
+    elif is_string_literal(line):
+        # The first literal is a docstring, allow it. Otherwise, report error.
+        if checker_state.get('seen_docstring', False):
+            checker_state['seen_non_imports'] = True
+        else:
+            checker_state['seen_docstring'] = True
+    else:
+        checker_state['seen_non_imports'] = True
+
+
  def compound_statements(logical_line):
      r"""Compound statements (on the same line) are generally discouraged.
  
@@ -834,6 +908,9 @@ def compound_statements(logical_line):
      on the same line, never do this for multi-clause statements.
      Also avoid folding such long lines!
  
+    Always use a def statement instead of an assignment statement that
+    binds a lambda expression directly to a name.
+
      Okay: if foo == 'blah':\n    do_blah_thing()
      Okay: do_one()
      Okay: do_two()
@@ -847,20 +924,30 @@ def compound_statements(logical_line):
      E701: try: something()
      E701: finally: cleanup()
      E701: if foo == 'blah': one(); two(); three()
-
      E702: do_one(); do_two(); do_three()
      E703: do_four();  # useless semicolon
+    E704: def f(x): return 2*x
+    E731: f = lambda x: 2*x
      """
      line = logical_line
      last_char = len(line) - 1
      found = line.find(':')
      while -1 < found < last_char:
          before = line[:found]
-        if (before.count('{') <= before.count('}') and  # {'a': 1} (dict)
-            before.count('[') <= before.count(']') and  # [1:2] (slice)
-            before.count('(') <= before.count(')') and  # (Python 3 annotation)
-                not LAMBDA_REGEX.search(before)):       # lambda x: x
-            yield found, "E701 multiple statements on one line (colon)"
+        if ((before.count('{') <= before.count('}') and   # {'a': 1} (dict)
+             before.count('[') <= before.count(']') and   # [1:2] (slice)
+             before.count('(') <= before.count(')'))):    # (annotation)
+            lambda_kw = LAMBDA_REGEX.search(before)
+            if lambda_kw:
+                before = line[:lambda_kw.start()].rstrip()
+                if before[-1:] == '=' and isidentifier(before[:-1].strip()):
+                    yield 0, ("E731 do not assign a lambda expression, use a "
+                              "def")
+                break
+            if before.startswith('def '):
+                yield 0, "E704 multiple statements on one line (def)"
+            else:
+                yield found, "E701 multiple statements on one line (colon)"
          found = line.find(':', found + 1)
      found = line.find(';')
      while -1 < found:
@@ -913,7 +1000,9 @@ def comparison_to_singleton(logical_line, noqa):
  
      Okay: if arg is not None:
      E711: if arg != None:
+    E711: if None == arg:
      E712: if arg == True:
+    E712: if False == arg:
  
      Also, beware of writing if x when you really mean if x is not None --
      e.g. when testing whether a variable or argument that defaults to None was
@@ -922,8 +1011,9 @@ def comparison_to_singleton(logical_line, noqa):
      """
      match = not noqa and COMPARE_SINGLETON_REGEX.search(logical_line)
      if match:
-        same = (match.group(1) == '==')
-        singleton = match.group(2)
+        singleton = match.group(1) or match.group(3)
+        same = (match.group(2) == '==')
+
          msg = "'if cond is %s:'" % (('' if same else 'not ') + singleton)
          if singleton in ('None',):
              code = 'E711'
@@ -932,7 +1022,7 @@ def comparison_to_singleton(logical_line, noqa):
              nonzero = ((singleton == 'True' and same) or
                         (singleton == 'False' and not same))
              msg += " or 'if %scond:'" % ('' if nonzero else 'not ')
-        yield match.start(1), ("%s comparison to %s should be %s" %
+        yield match.start(2), ("%s comparison to %s should be %s" %
                                 (code, singleton, msg))
  
  
@@ -1039,7 +1129,7 @@ if '' == ''.encode():
          """Read the source code."""
          with open(filename, 'rU') as f:
              return f.readlines()
-    isidentifier = re.compile(r'[a-zA-Z_]\w*').match
+    isidentifier = re.compile(r'[a-zA-Z_]\w*$').match
      stdin_get_value = sys.stdin.read
  else:
      # Python 3
@@ -1138,10 +1228,13 @@ def normalize_paths(value, parent=os.curdir):
  
      Return a list of absolute paths.
      """
-    if not value or isinstance(value, list):
+    if not value:
+        return []
+    if isinstance(value, list):
          return value
      paths = []
      for path in value.split(','):
+        path = path.strip()
          if '/' in path:
              path = os.path.abspath(os.path.join(parent, path))
          paths.append(path.rstrip('/'))
@@ -1158,14 +1251,12 @@ def filename_match(filename, patterns, default=True):
      return any(fnmatch(filename, pattern) for pattern in patterns)
  
  
+def _is_eol_token(token):
+    return token[0] in NEWLINE or token[4][token[3][1]:].lstrip() == '\\\n'
  if COMMENT_WITH_NL:
-    def _is_eol_token(token):
-        return (token[0] in NEWLINE or
-                (token[0] == tokenize.COMMENT and token[1] == token[4]))
-else:
-    def _is_eol_token(token):
-        return token[0] in NEWLINE
-
+    def _is_eol_token(token, _eol_token=_is_eol_token):
+        return _eol_token(token) or (token[0] == tokenize.COMMENT and
+                                     token[1] == token[4])
  
  ##############################################################################
  # Framework to run all checks
@@ -1222,6 +1313,8 @@ class Checker(object):
          self.hang_closing = options.hang_closing
          self.verbose = options.verbose
          self.filename = filename
+        # Dictionary where a checker can store its custom state.
+        self._checker_states = {}
          if filename is None:
              self.filename = 'stdin'
              self.lines = lines or []
@@ -1277,10 +1370,16 @@ class Checker(object):
              arguments.append(getattr(self, name))
          return check(*arguments)
  
+    def init_checker_state(self, name, argument_names):
+        """ Prepares a custom state for the specific checker plugin."""
+        if 'checker_state' in argument_names:
+            self.checker_state = self._checker_states.setdefault(name, {})
+
      def check_physical(self, line):
          """Run all physical checks on a raw input line."""
          self.physical_line = line
          for name, check, argument_names in self._physical_checks:
+            self.init_checker_state(name, argument_names)
              result = self.run_check(check, argument_names)
              if result is not None:
                  (offset, text) = result
@@ -1325,6 +1424,10 @@ class Checker(object):
          """Build a line from tokens and run all logical checks on it."""
          self.report.increment_logical_line()
          mapping = self.build_tokens_line()
+
+        if not mapping:
+            return
+
          (start_row, start_col) = mapping[0][1]
          start_line = self.lines[start_row - 1]
          self.indent_level = expand_indent(start_line[:start_col])
@@ -1335,6 +1438,7 @@ class Checker(object):
          for name, check, argument_names in self._logical_checks:
              if self.verbose >= 4:
                  print('   ' + name)
+            self.init_checker_state(name, argument_names)
              for offset, text in self.run_check(check, argument_names) or ():
                  if not isinstance(offset, tuple):
                      for token_offset, pos in mapping:
@@ -1772,7 +1876,8 @@ def get_parser(prog='pep8', version=__version__):
      parser.add_option('--select', metavar='errors', default='',
                        help="select errors and warnings (e.g. E,W6)")
      parser.add_option('--ignore', metavar='errors', default='',
-                      help="skip errors and warnings (e.g. E4,W)")
+                      help="skip errors and warnings (e.g. E4,W) "
+                           "(default: %s)" % DEFAULT_IGNORE)
      parser.add_option('--show-source', action='store_true',
                        help="show source code for each error")
      parser.add_option('--show-pep8', action='store_true',