Diffstat (limited to 'debug_toolbar/utils/sqlparse/engine/grouping.py')
-rw-r--r--  debug_toolbar/utils/sqlparse/engine/grouping.py  |  170
1 file changed, 117 insertions(+), 53 deletions(-)
diff --git a/debug_toolbar/utils/sqlparse/engine/grouping.py b/debug_toolbar/utils/sqlparse/engine/grouping.py
index 532ccec..4e50c7b 100644
--- a/debug_toolbar/utils/sqlparse/engine/grouping.py
+++ b/debug_toolbar/utils/sqlparse/engine/grouping.py
@@ -1,16 +1,19 @@
 # -*- coding: utf-8 -*-
 
 import itertools
-import re
-import types
 
+from debug_toolbar.utils.sqlparse import sql
 from debug_toolbar.utils.sqlparse import tokens as T
-from debug_toolbar.utils.sqlparse.sql import *
+
+try:
+    next
+except NameError:  # Python < 2.6
+    next = lambda i: i.next()
 
 
 def _group_left_right(tlist, ttype, value, cls,
                       check_right=lambda t: True,
+                      check_left=lambda t: True,
                       include_semicolon=False):
     [_group_left_right(sgroup, ttype, value, cls, check_right,
                        include_semicolon) for sgroup in tlist.get_sublists()
@@ -20,14 +23,20 @@ def _group_left_right(tlist, ttype, value, cls,
     while token:
         right = tlist.token_next(tlist.token_index(token))
         left = tlist.token_prev(tlist.token_index(token))
-        if (right is None or not check_right(right)
-            or left is None):
-            token = tlist.token_next_match(tlist.token_index(token)+1,
+        if right is None or not check_right(right):
+            token = tlist.token_next_match(tlist.token_index(token) + 1,
+                                           ttype, value)
+        elif left is None or not check_left(left):
+            token = tlist.token_next_match(tlist.token_index(token) + 1,
                                            ttype, value)
         else:
             if include_semicolon:
-                right = tlist.token_next_match(tlist.token_index(right),
-                                               T.Punctuation, ';')
+                sright = tlist.token_next_match(tlist.token_index(right),
+                                                T.Punctuation, ';')
+                if sright is not None:
+                    # only overwrite "right" if a semicolon is actually
+                    # present.
+                    right = sright
             tokens = tlist.tokens_between(left, right)[1:]
             if not isinstance(left, cls):
                 new = cls([left])
@@ -38,9 +47,10 @@ def _group_left_right(tlist, ttype, value, cls,
                 left.tokens.extend(tokens)
             for t in tokens:
                 tlist.tokens.remove(t)
-            token = tlist.token_next_match(tlist.token_index(left)+1,
+            token = tlist.token_next_match(tlist.token_index(left) + 1,
                                            ttype, value)
 
+
 def _group_matching(tlist, start_ttype, start_value, end_ttype, end_value,
                     cls, include_semicolon=False, recurse=False):
     def _find_matching(i, tl, stt, sva, ett, eva):
@@ -66,7 +76,7 @@ def _group_matching(tlist, start_ttype, start_value, end_ttype, end_value,
         end = _find_matching(tidx, tlist, start_ttype, start_value,
                              end_ttype, end_value)
         if end is None:
-            idx = tidx+1
+            idx = tidx + 1
         else:
             if include_semicolon:
                 next_ = tlist.token_next(tlist.token_index(end))
@@ -75,71 +85,102 @@ def _group_matching(tlist, start_ttype, start_value, end_ttype, end_value,
             group = tlist.group_tokens(cls, tlist.tokens_between(token, end))
             _group_matching(group, start_ttype, start_value,
                             end_ttype, end_value, cls, include_semicolon)
-            idx = tlist.token_index(group)+1
+            idx = tlist.token_index(group) + 1
         token = tlist.token_next_match(idx, start_ttype, start_value)
 
+
 def group_if(tlist):
-    _group_matching(tlist, T.Keyword, 'IF', T.Keyword, 'END IF', If, True)
+    _group_matching(tlist, T.Keyword, 'IF', T.Keyword, 'END IF', sql.If, True)
 
+
 def group_for(tlist):
-    _group_matching(tlist, T.Keyword, 'FOR', T.Keyword, 'END LOOP', For, True)
+    _group_matching(tlist, T.Keyword, 'FOR', T.Keyword, 'END LOOP',
+                    sql.For, True)
 
+
 def group_as(tlist):
-    _group_left_right(tlist, T.Keyword, 'AS', Identifier)
+
+    def _right_valid(token):
+        # Currently limited to DML/DDL. Maybe more non-SQL reserved
+        # keywords should be added here (see issue8).
+        return not token.ttype in (T.DML, T.DDL)
+    _group_left_right(tlist, T.Keyword, 'AS', sql.Identifier,
+                      check_right=_right_valid)
 
+
 def group_assignment(tlist):
-    _group_left_right(tlist, T.Assignment, ':=', Assignment,
+    _group_left_right(tlist, T.Assignment, ':=', sql.Assignment,
                       include_semicolon=True)
 
-def group_comparsion(tlist):
-    _group_left_right(tlist, T.Operator, None, Comparsion)
+
+def group_comparison(tlist):
+
+    def _parts_valid(token):
+        return (token.ttype in (T.String.Symbol, T.Name, T.Number,
+                                T.Number.Integer, T.Literal,
+                                T.Literal.Number.Integer)
+                or isinstance(token, (sql.Identifier,)))
+    _group_left_right(tlist, T.Operator.Comparison, None, sql.Comparison,
+                      check_left=_parts_valid, check_right=_parts_valid)
 
 
 def group_case(tlist):
-    _group_matching(tlist, T.Keyword, 'CASE', T.Keyword, 'END', Case,
+    _group_matching(tlist, T.Keyword, 'CASE', T.Keyword, 'END', sql.Case,
                     include_semicolon=True, recurse=True)
 
 
 def group_identifier(tlist):
     def _consume_cycle(tl, i):
-        x = itertools.cycle((lambda y: y.match(T.Punctuation, '.'),
-                             lambda y: y.ttype in (T.String.Symbol,
-                                                   T.Name,
-                                                   T.Wildcard)))
+        x = itertools.cycle((
+            lambda y: (y.match(T.Punctuation, '.')
+                       or y.ttype is T.Operator),
+            lambda y: (y.ttype in (T.String.Symbol,
+                                   T.Name,
+                                   T.Wildcard,
+                                   T.Literal.Number.Integer))))
         for t in tl.tokens[i:]:
-            if x.next()(t):
+            if next(x)(t):
                 yield t
             else:
                 raise StopIteration
 
     # bottom up approach: group subgroups first
     [group_identifier(sgroup) for sgroup in tlist.get_sublists()
-     if not isinstance(sgroup, Identifier)]
+     if not isinstance(sgroup, sql.Identifier)]
 
     # real processing
     idx = 0
-    token = tlist.token_next_by_type(idx, (T.String.Symbol, T.Name))
+    token = tlist.token_next_by_instance(idx, sql.Function)
+    if token is None:
+        token = tlist.token_next_by_type(idx, (T.String.Symbol, T.Name))
     while token:
-        identifier_tokens = [token]+list(
+        identifier_tokens = [token] + list(
             _consume_cycle(tlist,
-                           tlist.token_index(token)+1))
-        group = tlist.group_tokens(Identifier, identifier_tokens)
-        idx = tlist.token_index(group)+1
-        token = tlist.token_next_by_type(idx, (T.String.Symbol, T.Name))
+                           tlist.token_index(token) + 1))
+        if not (len(identifier_tokens) == 1
+                and isinstance(identifier_tokens[0], sql.Function)):
+            group = tlist.group_tokens(sql.Identifier, identifier_tokens)
+            idx = tlist.token_index(group) + 1
+        else:
+            idx += 1
+        token = tlist.token_next_by_instance(idx, sql.Function)
+        if token is None:
+            token = tlist.token_next_by_type(idx, (T.String.Symbol, T.Name))
 
 
 def group_identifier_list(tlist):
     [group_identifier_list(sgroup) for sgroup in tlist.get_sublists()
-     if not isinstance(sgroup, (Identifier, IdentifierList))]
+     if not isinstance(sgroup, sql.IdentifierList)]
     idx = 0
     # Allowed list items
-    fend1_funcs = [lambda t: isinstance(t, Identifier),
+    fend1_funcs = [lambda t: isinstance(t, (sql.Identifier, sql.Function)),
                    lambda t: t.is_whitespace(),
+                   lambda t: t.ttype == T.Name,
                    lambda t: t.ttype == T.Wildcard,
                    lambda t: t.match(T.Keyword, 'null'),
                    lambda t: t.ttype == T.Number.Integer,
                    lambda t: t.ttype == T.String.Single,
-                   lambda t: isinstance(t, Comparsion),
+                   lambda t: isinstance(t, sql.Comparison),
                    ]
     tcomma = tlist.token_next_match(idx, T.Punctuation, ',')
     start = None
@@ -156,7 +197,7 @@ def group_identifier_list(tlist):
         if not bpassed or not apassed:
             # Something's wrong here, skip ahead to next ","
             start = None
-            tcomma = tlist.token_next_match(tlist.token_index(tcomma)+1,
+            tcomma = tlist.token_next_match(tlist.token_index(tcomma) + 1,
                                             T.Punctuation, ',')
         else:
             if start is None:
@@ -165,25 +206,27 @@ def group_identifier_list(tlist):
             if next_ is None or not next_.match(T.Punctuation, ','):
                 # Reached the end of the list
                 tokens = tlist.tokens_between(start, after)
-                group = tlist.group_tokens(IdentifierList, tokens)
+                group = tlist.group_tokens(sql.IdentifierList, tokens)
                 start = None
-                tcomma = tlist.token_next_match(tlist.token_index(group)+1,
+                tcomma = tlist.token_next_match(tlist.token_index(group) + 1,
                                                 T.Punctuation, ',')
             else:
                 tcomma = next_
 
 
 def group_parenthesis(tlist):
-    _group_matching(tlist, T.Punctuation, '(', T.Punctuation, ')', Parenthesis)
+    _group_matching(tlist, T.Punctuation, '(', T.Punctuation, ')',
+                    sql.Parenthesis)
+
 
 def group_comments(tlist):
     [group_comments(sgroup) for sgroup in tlist.get_sublists()
-     if not isinstance(sgroup, Comment)]
+     if not isinstance(sgroup, sql.Comment)]
     idx = 0
     token = tlist.token_next_by_type(idx, T.Comment)
     while token:
         tidx = tlist.token_index(token)
-        end = tlist.token_not_matching(tidx+1,
+        end = tlist.token_not_matching(tidx + 1,
                                        [lambda t: t.ttype in T.Comment,
                                         lambda t: t.is_whitespace()])
         if end is None:
@@ -192,49 +235,70 @@ def group_comments(tlist):
             eidx = tlist.token_index(end)
             grp_tokens = tlist.tokens_between(token,
                                               tlist.token_prev(eidx, False))
-            group = tlist.group_tokens(Comment, grp_tokens)
+            group = tlist.group_tokens(sql.Comment, grp_tokens)
             idx = tlist.token_index(group)
         token = tlist.token_next_by_type(idx, T.Comment)
 
+
 def group_where(tlist):
     [group_where(sgroup) for sgroup in tlist.get_sublists()
-     if not isinstance(sgroup, Where)]
+     if not isinstance(sgroup, sql.Where)]
    idx = 0
     token = tlist.token_next_match(idx, T.Keyword, 'WHERE')
     stopwords = ('ORDER', 'GROUP', 'LIMIT', 'UNION')
     while token:
         tidx = tlist.token_index(token)
-        end = tlist.token_next_match(tidx+1, T.Keyword, stopwords)
+        end = tlist.token_next_match(tidx + 1, T.Keyword, stopwords)
         if end is None:
-            end = tlist.tokens[-1]
+            end = tlist._groupable_tokens[-1]
         else:
-            end = tlist.tokens[tlist.token_index(end)-1]
-        group = tlist.group_tokens(Where, tlist.tokens_between(token, end))
+            end = tlist.tokens[tlist.token_index(end) - 1]
+        group = tlist.group_tokens(sql.Where,
+                                   tlist.tokens_between(token, end),
+                                   ignore_ws=True)
         idx = tlist.token_index(group)
         token = tlist.token_next_match(idx, T.Keyword, 'WHERE')
 
+
 def group_aliased(tlist):
     [group_aliased(sgroup) for sgroup in tlist.get_sublists()
-     if not isinstance(sgroup, Identifier)]
+     if not isinstance(sgroup, (sql.Identifier, sql.Function))]
     idx = 0
-    token = tlist.token_next_by_instance(idx, Identifier)
+    token = tlist.token_next_by_instance(idx, (sql.Identifier, sql.Function))
     while token:
         next_ = tlist.token_next(tlist.token_index(token))
-        if next_ is not None and isinstance(next_, Identifier):
+        if next_ is not None and isinstance(next_, (sql.Identifier, sql.Function)):
             grp = tlist.tokens_between(token, next_)[1:]
             token.tokens.extend(grp)
             for t in grp:
                 tlist.tokens.remove(t)
-        idx = tlist.token_index(token)+1
-        token = tlist.token_next_by_instance(idx, Identifier)
+        idx = tlist.token_index(token) + 1
+        token = tlist.token_next_by_instance(idx, (sql.Identifier, sql.Function))
 
 
 def group_typecasts(tlist):
-    _group_left_right(tlist, T.Punctuation, '::', Identifier)
+    _group_left_right(tlist, T.Punctuation, '::', sql.Identifier)
+
+
+def group_functions(tlist):
+    [group_functions(sgroup) for sgroup in tlist.get_sublists()
+     if not isinstance(sgroup, sql.Function)]
+    idx = 0
+    token = tlist.token_next_by_type(idx, T.Name)
+    while token:
+        next_ = tlist.token_next(token)
+        if not isinstance(next_, sql.Parenthesis):
+            idx = tlist.token_index(token) + 1
+        else:
+            func = tlist.group_tokens(sql.Function,
+                                      tlist.tokens_between(token, next_))
+            idx = tlist.token_index(func) + 1
+        token = tlist.token_next_by_type(idx, T.Name)
 
 
 def group(tlist):
     for func in [group_parenthesis,
+                 group_functions,
                  group_comments,
                  group_where,
                  group_case,
@@ -243,8 +307,8 @@ def group(tlist):
                  group_as,
                  group_aliased,
                  group_assignment,
-                 group_comparsion,
+                 group_comparison,
                  group_identifier_list,
                  group_if,
-                 group_for,]:
+                 group_for]:
         func(tlist)
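
Editor's note, not part of the commit: after this change, group() also runs the new
group_functions pass, so a call like count(*) becomes a sql.Function node nested in the
usual sql.Identifier / sql.Where tree, and the renamed group_comparison wraps expressions
like "bar = 1" in a sql.Comparison. Below is a minimal sketch of inspecting that tree; it
assumes the vendored package exposes upstream sqlparse's top-level parse() (as the real
sqlparse does) and uses Python 2 syntax to match the code above.

    from debug_toolbar.utils.sqlparse import parse, sql

    def walk(token_list, depth=0):
        # Print every grouped node; all groups subclass sql.TokenList.
        for tok in token_list.tokens:
            if isinstance(tok, sql.TokenList):
                print '%s%s: %r' % ('  ' * depth, type(tok).__name__, str(tok))
                walk(tok, depth + 1)

    stmt = parse('SELECT count(*) AS n FROM foo WHERE bar = 1')[0]
    walk(stmt)

    # Roughly expected output (exact nesting may vary slightly):
    #   Identifier: 'count(*) AS n'
    #     Function: 'count(*)'
    #       Parenthesis: '(*)'
    #   Identifier: 'foo'
    #   Where: 'WHERE bar = 1'
    #     Comparison: 'bar = 1'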
