HashYang
diff --git a/.travis.yml b/.travis.yml
Lines changed: 0 additions & 1 deletion
diff --git a/docs/source/intro.rst b/docs/source/intro.rst
Lines changed: 4 additions & 4 deletions
diff --git a/setup.py b/setup.py
Lines changed: 2 additions & 3 deletions
diff --git a/sqlparse/__init__.py b/sqlparse/__init__.py
Lines changed: 2 additions & 1 deletion
diff --git a/sqlparse/compat.py b/sqlparse/compat.py
Lines changed: 2 additions & 2 deletions
diff --git a/sqlparse/filters.py b/sqlparse/filters.py
Lines changed: 12 additions & 11 deletions
diff --git a/sqlparse/lexer.py b/sqlparse/lexer.py
Lines changed: 16 additions & 13 deletions
diff --git a/sqlparse/sql.py b/sqlparse/sql.py
Lines changed: 12 additions & 11 deletions
diff --git a/tests/test_filters.py b/tests/test_filters.py
Lines changed: 1 addition & 0 deletions
@@ -4,7 +4,6 @@ python:
   - "3.5"
   - "3.4"
   - "3.3"
-  - "3.2"
   - "2.7"
   - "pypy"
   - "pypy3"
 
@@ -100,10 +100,10 @@ Each object can be converted back to a string at any time:
 
 .. code-block:: python
 
-   >>> unicode(stmt)  # str(stmt) for Python 3
-   u'select * from "someschema"."mytable" where id = 1'
-   >>> unicode(stmt.tokens[-1])  # or just the WHERE part
-   u'where id = 1'
+   >>> str(stmt)  # use unicode(stmt) on Python 2
+   'select * from "someschema"."mytable" where id = 1'
+   >>> str(stmt.tokens[-1])  # or just the WHERE part
+   'where id = 1'
 
 Details of the returned objects are described in :ref:`analyze`.
 
 
@@ -67,8 +67,8 @@ def get_version():
    >>> res
    (<Statement 'select...' at 0x9ad08ec>,)
    >>> stmt = res[0]
-   >>> unicode(stmt)  # converting it back to unicode
-   u'select * from someschema.mytable where id = 1'
+   >>> str(stmt)  # converting it back to a string
+   'select * from someschema.mytable where id = 1'
    >>> # This is how the internal representation looks like:
    >>> stmt.tokens
    (<DML 'select' at 0x9b63c34>,
@@ -110,7 +110,6 @@ def get_version():
         'Programming Language :: Python :: 2',
         'Programming Language :: Python :: 2.7',
         'Programming Language :: Python :: 3',
-        'Programming Language :: Python :: 3.2',
         'Programming Language :: Python :: 3.3',
         'Programming Language :: Python :: 3.4',
         'Programming Language :: Python :: 3.5',
 
@@ -14,6 +14,7 @@
 from sqlparse import filters
 from sqlparse import formatter
 
+from sqlparse.compat import u
 # Deprecated in 0.1.5. Will be removed in 0.2.0
 from sqlparse.exceptions import SQLParseError
 
@@ -67,7 +68,7 @@ def split(sql, encoding=None):
     """
     stack = engine.FilterStack()
     stack.split_statements = True
-    return [unicode(stmt).strip() for stmt in stack.run(sql, encoding)]
+    return [u(stmt).strip() for stmt in stack.run(sql, encoding)]
 
 
 from sqlparse.engine.filter import StatementFilter
 
@@ -19,15 +19,15 @@
     from io import StringIO
 
     def u(s):
-        return s
+        return str(s)
 
 elif PY2:
     text_type = unicode
     string_types = (basestring,)
     from StringIO import StringIO  # flake8: noqa
 
     def u(s):
-        return unicode(s, 'unicode_escape')
+        return unicode(s)
 
 
 # Directly copied from six:
 
@@ -5,6 +5,7 @@
 from os.path import abspath, join
 
 from sqlparse import sql, tokens as T
+from sqlparse.compat import u, text_type
 from sqlparse.engine import FilterStack
 from sqlparse.lexer import tokenize
 from sqlparse.pipeline import Pipeline
@@ -25,7 +26,7 @@ def __init__(self, case=None):
         if case is None:
             case = 'upper'
         assert case in ['lower', 'upper', 'capitalize']
-        self.convert = getattr(unicode, case)
+        self.convert = getattr(text_type, case)
 
     def process(self, stack, stream):
         for ttype, value in stream:
@@ -52,7 +53,7 @@ class TruncateStringFilter:
 
     def __init__(self, width, char):
         self.width = max(width, 1)
-        self.char = unicode(char)
+        self.char = u(char)
 
     def process(self, stack, stream):
         for ttype, value in stream:
@@ -154,7 +155,7 @@ def process(self, stack, stream):
                         f.close()
 
                     # There was a problem loading the include file
-                    except IOError, err:
+                    except IOError as err:
                         # Raise the exception to the interpreter
                         if self.raiseexceptions:
                             raise
@@ -171,7 +172,7 @@ def process(self, stack, stream):
                                                      self.raiseexceptions)
 
                         # Max recursion limit reached
-                        except ValueError, err:
+                        except ValueError as err:
                             # Raise the exception to the interpreter
                             if self.raiseexceptions:
                                 raise
@@ -300,7 +301,7 @@ def _flatten_up_to_token(self, token):
                 raise StopIteration
 
     def _get_offset(self, token):
-        raw = ''.join(map(unicode, self._flatten_up_to_token(token)))
+        raw = ''.join(map(text_type, self._flatten_up_to_token(token)))
         line = raw.splitlines()[-1]
         # Now take current offset into account and return relative offset.
         full_offset = len(line) - len(self.char * (self.width * self.indent))
@@ -340,7 +341,7 @@ def _next_token(i):
             if prev and prev.is_whitespace() and prev not in added:
                 tlist.tokens.pop(tlist.token_index(prev))
                 offset += 1
-            uprev = unicode(prev)
+            uprev = u(prev)
             if (prev and (uprev.endswith('\n') or uprev.endswith('\r'))):
                 nl = tlist.token_next(token)
             else:
@@ -462,7 +463,7 @@ def process(self, stack, stmt):
         self._process(stmt)
         if isinstance(stmt, sql.Statement):
             if self._last_stmt is not None:
-                if unicode(self._last_stmt).endswith('\n'):
+                if u(self._last_stmt).endswith('\n'):
                     nl = '\n'
                 else:
                     nl = '\n\n'
@@ -494,7 +495,7 @@ def _process(self, stack, group, stream):
                   and not token.__class__ in self.keep_together):
                 token.tokens = self._process(stack, token, token.tokens)
             else:
-                val = unicode(token)
+                val = u(token)
                 if len(self.line) + len(val) > self.width:
                     match = re.search('^ +', self.line)
                     if match is not None:
@@ -568,7 +569,7 @@ def process(self, stack, stream):
 class SerializerUnicode:
 
     def process(self, stack, stmt):
-        raw = unicode(stmt)
+        raw = u(stmt)
         lines = split_unquoted_newlines(raw)
         res = '\n'.join(line.rstrip() for line in lines)
         return res
@@ -578,7 +579,7 @@ def Tokens2Unicode(stream):
     result = ""
 
     for _, value in stream:
-        result += unicode(value)
+        result += u(value)
 
     return result
 
@@ -600,7 +601,7 @@ def process(self, stack, stmt):
         else:
             varname = self.varname
 
-        has_nl = len(unicode(stmt).strip().splitlines()) > 1
+        has_nl = len(u(stmt).strip().splitlines()) > 1
         stmt.tokens = self._process(stmt.tokens, varname, has_nl)
         return stmt
 
 
@@ -17,7 +17,7 @@
 
 from sqlparse import tokens
 from sqlparse.keywords import KEYWORDS, KEYWORDS_COMMON
-from cStringIO import StringIO
+from sqlparse.compat import StringIO, string_types, with_metaclass, text_type
 
 
 class include(str):
@@ -81,14 +81,14 @@ def _process_state(cls, unprocessed, processed, state):
 
             try:
                 rex = re.compile(tdef[0], rflags).match
-            except Exception, err:
+            except Exception as err:
                 raise ValueError(("uncompilable regex %r in state"
                                   " %r of %r: %s"
                                   % (tdef[0], state, cls, err)))
 
             assert type(tdef[1]) is tokens._TokenType or callable(tdef[1]), \
-                   ('token type must be simple type or callable, not %r'
-                    % (tdef[1],))
+                ('token type must be simple type or callable, not %r'
+                 % (tdef[1],))
 
             if len(tdef) == 2:
                 new_state = None
@@ -113,7 +113,7 @@ def _process_state(cls, unprocessed, processed, state):
                     itokens = []
                     for istate in tdef2:
                         assert istate != state, \
-                               'circular state ref %r' % istate
+                            'circular state ref %r' % istate
                         itokens.extend(cls._process_state(unprocessed,
                                                           processed, istate))
                     processed[new_state] = itokens
@@ -123,7 +123,7 @@ def _process_state(cls, unprocessed, processed, state):
                     for state in tdef2:
                         assert (state in unprocessed or
                                 state in ('#pop', '#push')), \
-                               'unknown new state ' + state
+                                'unknown new state ' + state
                     new_state = tdef2
                 else:
                     assert False, 'unknown new state def %r' % tdef2
@@ -134,7 +134,7 @@ def process_tokendef(cls):
         cls._all_tokens = {}
         cls._tmpname = 0
         processed = cls._all_tokens[cls.__name__] = {}
-        #tokendefs = tokendefs or cls.tokens[name]
+        # tokendefs = tokendefs or cls.tokens[name]
         for state in cls.tokens.keys():
             cls._process_state(cls.tokens, processed, state)
         return processed
@@ -152,9 +152,7 @@ def __call__(cls, *args, **kwds):
         return type.__call__(cls, *args, **kwds)
 
 
-class Lexer(object):
-
-    __metaclass__ = LexerMeta
+class _Lexer(object):
 
     encoding = 'utf-8'
     stripall = False
@@ -201,7 +199,8 @@ class Lexer(object):
             # cannot be preceded by word character or a right bracket --
             # otherwise it's probably an array index
             (r'(?<![\w\])])(\[[^\]]+\])', tokens.Name),
-            (r'((LEFT\s+|RIGHT\s+|FULL\s+)?(INNER\s+|OUTER\s+|STRAIGHT\s+)?|(CROSS\s+|NATURAL\s+)?)?JOIN\b', tokens.Keyword),
+            (r'((LEFT\s+|RIGHT\s+|FULL\s+)?(INNER\s+|OUTER\s+|STRAIGHT\s+)?'
+             r'|(CROSS\s+|NATURAL\s+)?)?JOIN\b', tokens.Keyword),
             (r'END(\s+IF|\s+LOOP)?\b', tokens.Keyword),
             (r'NOT NULL\b', tokens.Keyword),
             (r'CREATE(\s+OR\s+REPLACE)?\b', tokens.Keyword.DDL),
@@ -258,13 +257,13 @@ def get_tokens(self, text, unfiltered=False):
         Also preprocess the text, i.e. expand tabs and strip it if
         wanted and applies registered filters.
         """
-        if isinstance(text, basestring):
+        if isinstance(text, string_types):
             if self.stripall:
                 text = text.strip()
             elif self.stripnl:
                 text = text.strip('\n')
 
-            if sys.version_info[0] < 3 and isinstance(text, unicode):
+            if sys.version_info[0] < 3 and isinstance(text, text_type):
                 text = StringIO(text.encode('utf-8'))
                 self.encoding = 'utf-8'
             else:
@@ -350,6 +349,10 @@ def get_tokens_unprocessed(self, stream, stack=('root',)):
                     break
 
 
+class Lexer(with_metaclass(LexerMeta, _Lexer)):
+    pass
+
+
 def tokenize(sql, encoding=None):
     """Tokenize sql.
 
 
@@ -6,6 +6,7 @@
 import sys
 
 from sqlparse import tokens as T
+from sqlparse.compat import string_types, u
 
 
 class Token(object):
@@ -32,7 +33,7 @@ def __str__(self):
         if sys.version_info[0] == 3:
             return self.value
         else:
-            return unicode(self).encode('utf-8')
+            return u(self).encode('utf-8')
 
     def __repr__(self):
         short = self._get_repr_value()
@@ -51,13 +52,13 @@ def to_unicode(self):
         .. deprecated:: 0.1.5
            Use ``unicode(token)`` (for Python 3: ``str(token)``) instead.
         """
-        return unicode(self)
+        return u(self)
 
     def _get_repr_name(self):
         return str(self.ttype).split('.')[-1]
 
     def _get_repr_value(self):
-        raw = unicode(self)
+        raw = u(self)
         if len(raw) > 7:
             raw = raw[:6] + u'...'
         return re.sub('\s+', ' ', raw)
@@ -83,7 +84,7 @@ def match(self, ttype, values, regex=False):
             return type_matched
 
         if regex:
-            if isinstance(values, basestring):
+            if isinstance(values, string_types):
                 values = set([values])
 
             if self.ttype is T.Keyword:
@@ -96,7 +97,7 @@ def match(self, ttype, values, regex=False):
                     return True
             return False
 
-        if isinstance(values, basestring):
+        if isinstance(values, string_types):
             if self.is_keyword:
                 return values.upper() == self.normalized
             return values == self.value
@@ -172,7 +173,7 @@ def _to_string(self):
         if sys.version_info[0] == 3:
             return ''.join(x.value for x in self.flatten())
         else:
-            return ''.join(unicode(x) for x in self.flatten())
+            return ''.join(u(x) for x in self.flatten())
 
     def _get_repr_name(self):
         return self.__class__.__name__
@@ -185,9 +186,9 @@ def _pprint_tree(self, max_depth=None, depth=0):
                 pre = ' +-'
             else:
                 pre = ' | '
-            print '%s%s%d %s \'%s\'' % (indent, pre, idx,
+            print('%s%s%d %s \'%s\'' % (indent, pre, idx,
                                         token._get_repr_name(),
-                                        token._get_repr_value())
+                                        token._get_repr_value()))
             if (token.is_group() and (max_depth is None or depth < max_depth)):
                 token._pprint_tree(max_depth, depth + 1)
 
@@ -285,7 +286,7 @@ def token_next_match(self, idx, ttype, value, regex=False):
         if not isinstance(idx, int):
             idx = self.token_index(idx)
 
-        for n in xrange(idx, len(self.tokens)):
+        for n in range(idx, len(self.tokens)):
             token = self.tokens[n]
             if token.match(ttype, value, regex):
                 return token
@@ -349,7 +350,7 @@ def token_index(self, token, start=0):
             # Performing `index` manually is much faster when starting in the middle
             # of the list of tokens and expecting to find the token near to the starting
             # index.
-            for i in xrange(start, len(self.tokens)):
+            for i in range(start, len(self.tokens)):
                 if self.tokens[i] == token:
                     return i
             return -1
@@ -518,7 +519,7 @@ def get_typecast(self):
         next_ = self.token_next(self.token_index(marker), False)
         if next_ is None:
             return None
-        return unicode(next_)
+        return u(next_)
 
     def get_ordering(self):
         """Returns the ordering or ``None`` as uppercase string."""
 
@@ -5,6 +5,7 @@
 '''
 import unittest
 
+from sqlparse.compat import u
 from sqlparse.filters import StripWhitespace, Tokens2Unicode
 from sqlparse.lexer import tokenize
-Original file line number
+Diff line change
   - "3.5"
   - "3.4"
   - "3.3"
 -  - "3.2"
   - "2.7"
   - "pypy"
   - "pypy3"