sqlparse/sqlparse/filters/reindent.py at master · tbarbugli/sqlparse

History

181 lines (151 loc) · 6.78 KB

Raw

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

137

138

139

140

141

142

143

144

145

146

147

148

149

150

151

152

153

154

155

156

157

158

159

160

161

162

163

164

165

166

167

168

169

170

171

172

173

174

175

176

177

178

179

180

181

# -*- coding: utf-8 -*-

# This module is part of python-sqlparse and is released under

# the BSD License: https://opensource.org/licenses/BSD-3-Clause

from sqlparse import sql, tokens as T

from sqlparse.compat import text_type

from sqlparse.utils import offset, indent

class ReindentFilter(object):

def __init__(self, width=2, char=' ', wrap_after=0, n='\n',

comma_first=False):

self.n = n

self.width = width

self.char = char

self.indent = 0

self.offset = 0

self.wrap_after = wrap_after

self.comma_first = comma_first

self._curr_stmt = None

self._last_stmt = None

def _flatten_up_to_token(self, token):

"""Yields all tokens up to token but excluding current."""

if token.is_group:

token = next(token.flatten())

for t in self._curr_stmt.flatten():

if t == token:

raise StopIteration

yield t

@property

def leading_ws(self):

return self.offset + self.indent * self.width

def _get_offset(self, token):

raw = u''.join(map(text_type, self._flatten_up_to_token(token)))

line = (raw or '\n').splitlines()[-1]

# Now take current offset into account and return relative offset.

return len(line) - len(self.char * self.leading_ws)

def nl(self, offset=0):

return sql.Token(

T.Whitespace,

self.n + self.char * max(0, self.leading_ws + offset))

def _next_token(self, tlist, idx=-1):

split_words = ('FROM', 'STRAIGHT_JOIN$', 'JOIN$', 'AND', 'OR',

'GROUP', 'ORDER', 'UNION', 'VALUES',

'SET', 'BETWEEN', 'EXCEPT', 'HAVING')

m_split = T.Keyword, split_words, True

tidx, token = tlist.token_next_by(m=m_split, idx=idx)

if token and token.normalized == 'BETWEEN':

tidx, token = self._next_token(tlist, tidx)

if token and token.normalized == 'AND':

tidx, token = self._next_token(tlist, tidx)

return tidx, token

def _split_kwds(self, tlist):

tidx, token = self._next_token(tlist)

while token:

pidx, prev_ = tlist.token_prev(tidx, skip_ws=False)

uprev = text_type(prev_)

if prev_ and prev_.is_whitespace:

del tlist.tokens[pidx]

tidx -= 1

if not (uprev.endswith('\n') or uprev.endswith('\r')):

tlist.insert_before(tidx, self.nl())

tidx += 1

tidx, token = self._next_token(tlist, tidx)

def _split_statements(self, tlist):

ttypes = T.Keyword.DML, T.Keyword.DDL

tidx, token = tlist.token_next_by(t=ttypes)

while token:

pidx, prev_ = tlist.token_prev(tidx, skip_ws=False)

if prev_ and prev_.is_whitespace:

del tlist.tokens[pidx]

tidx -= 1

# only break if it's not the first token

if prev_:

tlist.insert_before(tidx, self.nl())

tidx += 1

tidx, token = tlist.token_next_by(t=ttypes, idx=tidx)

def _process(self, tlist):

func_name = '_process_{cls}'.format(cls=type(tlist).__name__)

func = getattr(self, func_name.lower(), self._process_default)

func(tlist)

def _process_where(self, tlist):

tidx, token = tlist.token_next_by(m=(T.Keyword, 'WHERE'))

# issue121, errors in statement fixed??

tlist.insert_before(tidx, self.nl())

with indent(self):

self._process_default(tlist)

def _process_parenthesis(self, tlist):

ttypes = T.Keyword.DML, T.Keyword.DDL

_, is_dml_dll = tlist.token_next_by(t=ttypes)

fidx, first = tlist.token_next_by(m=sql.Parenthesis.M_OPEN)

with indent(self, 1 if is_dml_dll else 0):

tlist.tokens.insert(0, self.nl()) if is_dml_dll else None

with offset(self, self._get_offset(first) + 1):

self._process_default(tlist, not is_dml_dll)

def _process_identifierlist(self, tlist):

identifiers = list(tlist.get_identifiers())

first = next(identifiers.pop(0).flatten())

num_offset = 1 if self.char == '\t' else self._get_offset(first)

if not tlist.within(sql.Function):

with offset(self, num_offset):

position = 0

for token in identifiers:

# Add 1 for the "," separator

position += len(token.value) + 1

if position > (self.wrap_after - self.offset):

adjust = 0

if self.comma_first:

adjust = -2

_, comma = tlist.token_prev(

tlist.token_index(token))

if comma is None:

continue

token = comma

tlist.insert_before(token, self.nl(offset=adjust))

if self.comma_first:

_, ws = tlist.token_next(

tlist.token_index(token), skip_ws=False)

if (ws is not None

and ws.ttype is not T.Text.Whitespace):

tlist.insert_after(

token, sql.Token(T.Whitespace, ' '))

position = 0

self._process_default(tlist)

def _process_case(self, tlist):

iterable = iter(tlist.get_cases())

cond, _ = next(iterable)

first = next(cond[0].flatten())

with offset(self, self._get_offset(tlist[0])):

with offset(self, self._get_offset(first)):

for cond, value in iterable:

token = value[0] if cond is None else cond[0]

tlist.insert_before(token, self.nl())

# Line breaks on group level are done. let's add an offset of

# len "when ", "then ", "else "

with offset(self, len("WHEN ")):

self._process_default(tlist)

end_idx, end = tlist.token_next_by(m=sql.Case.M_CLOSE)

tlist.insert_before(end_idx, self.nl())

def _process_default(self, tlist, stmts=True):

self._split_statements(tlist) if stmts else None

self._split_kwds(tlist)

[self._process(sgroup) for sgroup in tlist.get_sublists()]

def process(self, stmt):

self._curr_stmt = stmt

self._process(stmt)

if self._last_stmt is not None:

nl = '\n' if text_type(self._last_stmt).endswith('\n') else '\n\n'

stmt.tokens.insert(0, sql.Token(T.Whitespace, nl))

self._last_stmt = stmt

return stmt

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

reindent.py

Latest commit

History

reindent.py

File metadata and controls