@@ -139,24 +139,23 @@ def process(self, stmt, depth=0):
139139 stmt .tokens .pop (- 1 )
140140
141141
142- class SpacesAroundOperatorsFilter :
142+ class SpacesAroundOperatorsFilter ( object ) :
143143 whitelist = (sql .Identifier , sql .Comparison , sql .Where )
144144
145145 def _process (self , tlist ):
146146 def next_token (idx ):
147- # HACK: distinguish between real wildcard from multiplication operator
148- return tlist . token_next_by_type ( idx , ( T . Operator , T . Comparison , T . Wildcard ))
147+ return tlist . token_next_by ( t = ( T . Operator , T . Comparison ), idx = idx )
148+
149149 idx = 0
150150 token = next_token (idx )
151151 while token :
152152 idx = tlist .token_index (token )
153153 if idx > 0 and tlist .tokens [idx - 1 ].ttype != T .Whitespace :
154- tlist .tokens .insert (idx , sql .Token (T .Whitespace , ' ' )) # insert before
154+ # insert before
155+ tlist .tokens .insert (idx , sql .Token (T .Whitespace , ' ' ))
155156 idx += 1
156157 if idx < len (tlist .tokens ) - 1 :
157- if token .ttype == T .Wildcard and tlist .tokens [idx + 1 ].match (T .Punctuation , ',' ):
158- pass # this must have been a real wildcard, not multiplication
159- elif tlist .tokens [idx + 1 ].ttype != T .Whitespace :
158+ if tlist .tokens [idx + 1 ].ttype != T .Whitespace :
160159 tlist .tokens .insert (idx + 1 , sql .Token (T .Whitespace , ' ' ))
161160
162161 idx += 1
@@ -165,7 +164,7 @@ def next_token(idx):
165164 for sgroup in tlist .get_sublists ():
166165 self ._process (sgroup )
167166
def process(self, stmt):
    """Filter entry point: insert spaces around operators in *stmt* in place.

    Delegates to ``_process``, which walks the token tree recursively.
    The ``stack`` parameter of the old API was dropped in this revision.
    """
    self._process(stmt)
170169
171170
@@ -365,16 +364,16 @@ def process(self, stmt):
365364 self ._last_stmt = stmt
366365
367366
368- class AlignedIndentFilter :
369- join_words = r'((LEFT\s+|RIGHT\s+|FULL\s+)?(INNER\s+|OUTER\s+|STRAIGHT\s+)?|(CROSS\s+|NATURAL\s+)?)?JOIN\b '
370- split_words = (
371- 'FROM' ,
372- join_words , 'ON ' ,
373- 'WHERE' , 'AND' , 'OR ' ,
374- 'GROUP ' , 'HAVING ' , 'LIMIT ' ,
375- 'ORDER ' , 'UNION ' , 'VALUES ' ,
376- 'SET ' , 'BETWEEN ' , 'EXCEPT ' ,
377- )
367+ class AlignedIndentFilter ( object ) :
368+ join_words = ( r'((LEFT\s+|RIGHT\s+|FULL\s+)?'
369+ r'(INNER\s+|OUTER\s+|STRAIGHT\s+)?|'
370+ r'(CROSS\s+|NATURAL\s+)?)?JOIN\b' )
371+ split_words = ( 'FROM ' ,
372+ join_words , 'ON ' ,
373+ 'WHERE ' , 'AND ' , 'OR ' ,
374+ 'GROUP ' , 'HAVING ' , 'LIMIT ' ,
375+ 'ORDER ' , 'UNION ' , 'VALUES ' ,
376+ 'SET' , 'BETWEEN' , 'EXCEPT' )
378377
379378 def __init__ (self , char = ' ' , line_width = None ):
380379 self .char = char
@@ -384,43 +383,51 @@ def newline(self):
384383 return sql .Token (T .Newline , '\n ' )
385384
def whitespace(self, chars=0, newline_before=False, newline_after=False):
    """Build a whitespace token of ``chars`` copies of ``self.char``.

    :param chars: number of fill characters (``self.char``) to emit.
    :param newline_before: prepend a literal newline when True.
    :param newline_after: append a literal newline when True.
    :returns: a single ``sql.Token`` with ttype ``T.Whitespace``.
    """
    # NOTE(review): the scraped source renders the literal as "'\n '";
    # treated here as '\n' — the trailing space is scraper token-spacing.
    return sql.Token(T.Whitespace, ('\n' if newline_before else '') +
                     self.char * chars +
                     ('\n' if newline_after else ''))
390388
def _process_statement(self, tlist, base_indent=0):
    """Process a whole statement.

    Drops a single leading whitespace token when we are at the outermost
    level (``base_indent == 0``), then hands the remaining tokens to the
    generic ``_process`` dispatcher as a fresh ``TokenList``.

    :returns: the processed ``sql.TokenList``.
    """
    # NOTE(review): is_whitespace is *called* here — assumes a sqlparse
    # version where it is a method, not a property; confirm against the
    # pinned sqlparse release.
    if tlist.tokens[0].is_whitespace() and base_indent == 0:
        tlist.tokens.pop(0)

    # process the main query body
    return self._process(sql.TokenList(tlist.tokens),
                         base_indent=base_indent)
397396
def _process_parenthesis(self, tlist, base_indent=0):
    """Re-indent the contents of a parenthesized subquery.

    Only parentheses containing a ``SELECT`` (i.e. subqueries) are
    touched; anything else is returned unchanged. The body is indented
    past the aligned keyword column, and the closing parenthesis is
    de-indented onto its own line.

    :returns: *tlist*, modified in place.
    """
    if not tlist.token_next_by(m=(T.DML, 'SELECT')):
        # if this isn't a subquery, don't re-indent
        return tlist

    # add two for the space and parens
    sub_indent = base_indent + self._max_kwd_len + 2
    tlist.insert_after(tlist.tokens[0],
                       self.whitespace(sub_indent, newline_before=True))
    # de-indent the last parenthesis
    tlist.insert_before(tlist.tokens[-1],
                        self.whitespace(sub_indent - 1,
                                        newline_before=True))

    # process the inside of the parentheses, keeping the literal
    # open/close paren tokens on either side of the recursed body
    tlist.tokens = (
        [tlist.tokens[0]] +
        self._process(sql.TokenList(tlist._groupable_tokens),
                      base_indent=sub_indent).tokens +
        [tlist.tokens[-1]]
    )
    return tlist
415419
416420 def _process_identifierlist (self , tlist , base_indent = 0 ):
417421 # columns being selected
418422 new_tokens = []
419- identifiers = filter (lambda t : t .ttype not in (T .Punctuation , T .Whitespace , T .Newline ), tlist .tokens )
423+ identifiers = list (filter (
424+ lambda t : t .ttype not in (T .Punctuation , T .Whitespace , T .Newline ),
425+ tlist .tokens ))
420426 for i , token in enumerate (identifiers ):
421427 if i > 0 :
422428 new_tokens .append (self .newline ())
423- new_tokens .append (self .whitespace (self ._max_kwd_len + base_indent + 1 ))
429+ new_tokens .append (
430+ self .whitespace (self ._max_kwd_len + base_indent + 1 ))
424431 new_tokens .append (token )
425432 if i < len (identifiers ) - 1 :
426433 # if not last column in select, add a comma seperator
@@ -437,10 +444,11 @@ def _process_case(self, tlist, base_indent=0):
437444 case_offset = len ('when ' )
438445 cases = tlist .get_cases (skip_ws = True )
439446 # align the end as well
440- end_token = tlist .token_next_match ( 0 , T .Keyword , 'END' )
447+ end_token = tlist .token_next_by ( m = ( T .Keyword , 'END' ) )
441448 cases .append ((None , [end_token ]))
442449
443- condition_width = max (len (' ' .join (map (str , cond ))) for cond , value in cases if cond )
450+ condition_width = max (
451+ len (' ' .join (map (str , cond ))) for cond , value in cases if cond )
444452 for i , (cond , value ) in enumerate (cases ):
445453 if cond is None : # else or end
446454 stmt = value [0 ]
@@ -449,17 +457,20 @@ def _process_case(self, tlist, base_indent=0):
449457 stmt = cond [0 ]
450458 line = cond + value
451459 if i > 0 :
452- tlist .insert_before (stmt , self .whitespace (base_offset + case_offset - len (str (stmt ))))
460+ tlist .insert_before (stmt , self .whitespace (
461+ base_offset + case_offset - len (str (stmt ))))
453462 if cond :
454- tlist .insert_after (cond [- 1 ], self .whitespace (condition_width - len (' ' .join (map (str , cond )))))
463+ tlist .insert_after (cond [- 1 ], self .whitespace (
464+ condition_width - len (' ' .join (map (str , cond )))))
455465
456466 if i < len (cases ) - 1 :
457467 # if not the END add a newline
458468 tlist .insert_after (line [- 1 ], self .newline ())
459469
460470 def _process_substatement (self , tlist , base_indent = 0 ):
461471 def _next_token (i ):
462- t = tlist .token_next_match (i , T .Keyword , self .split_words , regex = True )
472+ t = tlist .token_next_by (m = (T .Keyword , self .split_words , True ),
473+ idx = i )
463474 # treat "BETWEEN x and y" as a single statement
464475 if t and t .value .upper () == 'BETWEEN' :
465476 t = _next_token (tlist .token_index (t ) + 1 )
@@ -470,35 +481,35 @@ def _next_token(i):
470481 idx = 0
471482 token = _next_token (idx )
472483 while token :
484+ # joins are special case. only consider the first word as aligner
473485 if token .match (T .Keyword , self .join_words , regex = True ):
474- # joins are a special case. we only consider the first word of the join as the aligner
475486 token_indent = len (token .value .split ()[0 ])
476487 else :
477488 token_indent = len (str (token ))
478- tlist .insert_before (token , self .whitespace (self ._max_kwd_len - token_indent + base_indent , newline_before = True ))
489+ tlist .insert_before (token , self .whitespace (
490+ self ._max_kwd_len - token_indent + base_indent ,
491+ newline_before = True ))
479492 next_idx = tlist .token_index (token ) + 1
480493 token = _next_token (next_idx )
481494
482495 # process any sub-sub statements
483496 for sgroup in tlist .get_sublists ():
484497 prev_token = tlist .token_prev (tlist .token_index (sgroup ))
485498 indent_offset = 0
499+ # HACK: make "group/order by" work. Longer than _max_kwd_len.
486500 if prev_token and prev_token .match (T .Keyword , 'BY' ):
487- # HACK: make "group by" and "order by" indents work. these are longer than _max_kwd_len.
488501 # TODO: generalize this
489502 indent_offset = 3
490503 self ._process (sgroup , base_indent = base_indent + indent_offset )
491504 return tlist
492505
493- def _process (self , tlist , base_indent = 0 , verbose = False ):
506+ def _process (self , tlist , base_indent = 0 ):
494507 token_name = tlist .__class__ .__name__ .lower ()
495508 func_name = '_process_%s' % token_name
496509 func = getattr (self , func_name , self ._process_substatement )
497- if verbose :
498- print func .__name__ , token_name , str (tlist )
499510 return func (tlist , base_indent = base_indent )
500511
def process(self, stmt):
    """Filter entry point: align-indent *stmt* in place.

    Delegates to the ``_process`` dispatcher. The ``stack`` parameter of
    the old API was dropped in this revision.
    """
    self._process(stmt)
503514
504515
0 commit comments