summaryrefslogtreecommitdiff
path: root/sqlparse
diff options
context:
space:
mode:
authorAndi Albrecht <albrecht.andi@gmail.com>2011-08-13 21:39:29 +0200
committerAndi Albrecht <albrecht.andi@gmail.com>2011-08-13 21:39:29 +0200
commit4307d56e67f33174eab003dbd1c32fc024bbd343 (patch)
tree96494ccc8e3ba7ea82ace4e0f60f90ace9d91019 /sqlparse
parent1ad1131f2f7f702df4a4018a97a5d5b08e64ea90 (diff)
parent5a1d58a6fc69ddc04abb8750e1cf2e156caa04ab (diff)
downloadsqlparse-4307d56e67f33174eab003dbd1c32fc024bbd343.tar.gz
Merge.
Diffstat (limited to 'sqlparse')
-rw-r--r--sqlparse/filters.py161
1 file changed, 158 insertions, 3 deletions
diff --git a/sqlparse/filters.py b/sqlparse/filters.py
index 813be99..cba7b8f 100644
--- a/sqlparse/filters.py
+++ b/sqlparse/filters.py
@@ -2,8 +2,15 @@
import re
-from sqlparse import tokens as T
+from os.path import abspath, join
+
from sqlparse import sql
+from sqlparse import tokens as T
+from sqlparse.engine import FilterStack
+from sqlparse.tokens import (
+ Comment, Keyword, Name,
+ Punctuation, String, Whitespace,
+)
class Filter(object):
@@ -52,6 +59,81 @@ class IdentifierCaseFilter(_CaseFilter):
yield ttype, value
class GetComments(Filter):
    """Yield only the comment tokens found in the stream."""

    def process(self, stack, stream):
        # Keep every token whose type belongs to the Comment family;
        # everything else is silently dropped.
        for token in stream:
            if token[0] in Comment:
                yield token
+
+
class StripComments(Filter):
    """Remove every comment token from the stream."""

    def process(self, stack, stream):
        # Pass tokens through unchanged, skipping the Comment family.
        for ttype, value in stream:
            if ttype in Comment:
                continue
            yield ttype, value
+
+
class IncludeStatement(Filter):
    """Filter that enables an INCLUDE statement.

    When an ``INCLUDE 'path'`` statement is found in the token stream,
    the referenced file is read, parsed recursively, and its tokens are
    injected in place of the statement.

    :param dirpath: directory against which relative include paths are
        resolved (made absolute on construction)
    :param maxRecursive: maximum nesting depth for chained INCLUDEs;
        when exhausted, a diagnostic SQL comment is emitted instead of
        recursing further (prevents infinite loops on circular includes)
    """

    def __init__(self, dirpath=".", maxRecursive=10):
        self.dirpath = abspath(dirpath)
        self.maxRecursive = maxRecursive

        # True while an INCLUDE keyword has been seen and its path
        # argument is still expected.
        self.detected = False

    def process(self, stack, stream):
        # Run over all tokens in the stream
        for token_type, value in stream:
            # INCLUDE keyword found: switch to detected mode and swallow it
            if token_type in Name and value.upper() == 'INCLUDE':
                self.detected = True
                continue

            if self.detected:
                # Skip whitespace between INCLUDE and its path argument,
                # staying in detected mode.
                if token_type in Whitespace:
                    continue

                # The path is given as a quoted symbol; strip the quotes.
                if token_type in String.Symbol:
                    path = join(self.dirpath, value[1:-1])

                    if self.maxRecursive <= 0:
                        # Recursion budget exhausted: report instead of
                        # recursing (guards against circular includes).
                        yield Comment, u'-- Error: maximum recursion depth reached\n'
                    else:
                        try:
                            # Context manager guarantees the file handle is
                            # closed even if read() fails.
                            with open(path) as f:
                                raw_sql = f.read()
                        except IOError as err:
                            # Surface the failure as a SQL comment rather
                            # than aborting the whole parse.
                            yield Comment, u'-- IOError: %s\n' % err
                        else:
                            # Create a new FilterStack to parse the included
                            # file and add all its tokens to the main stream.
                            # A fresh local name is used so the `stack`
                            # parameter is not shadowed.
                            substack = FilterStack()
                            substack.preprocess.append(
                                IncludeStatement(self.dirpath,
                                                 self.maxRecursive - 1))

                            for tv in substack.run(raw_sql):
                                yield tv

                # Any non-whitespace token ends the INCLUDE statement:
                # return to normal mode (previously a stray token here left
                # the filter stuck in detected mode, swallowing the rest of
                # the stream). The consumed token itself is never emitted.
                self.detected = False
                continue

            # Normal token
            yield token_type, value
+
+
# ----------------------
# statement process
@@ -146,13 +228,14 @@ class ReindentFilter(Filter):
split_words = ('FROM', 'JOIN$', 'AND', 'OR',
'GROUP', 'ORDER', 'UNION', 'VALUES',
'SET', 'BETWEEN')
+
def _next_token(i):
t = tlist.token_next_match(i, T.Keyword, split_words,
regex=True)
if t and t.value.upper() == 'BETWEEN':
- t = _next_token(tlist.token_index(t)+1)
+ t = _next_token(tlist.token_index(t) + 1)
if t and t.value.upper() == 'AND':
- t = _next_token(tlist.token_index(t)+1)
+ t = _next_token(tlist.token_index(t) + 1)
return t
idx = 0
@@ -316,6 +399,57 @@ class RightMarginFilter(Filter):
group.tokens = self._process(stack, group, group.tokens)
class ColumnsSelect(Filter):
    """Get the columns names of a SELECT query.

    Emits one (Name, value) token per selected column, where the value
    is either the column expression text accumulated between top-level
    commas, or the alias when an AS clause is present.  Tokens inside
    parentheses (e.g. function-call arguments) are folded into the
    enclosing column expression.
    """
    def process(self, stack, stream):
        # mode: 0 = before SELECT, 1 = scanning the column list,
        #       2 = expecting the alias name after AS, 3 = done (FROM seen)
        mode = 0
        oldValue = ""      # column expression text accumulated so far
        parenthesis = 0    # current parenthesis nesting depth

        for token_type, value in stream:
            # Ignore comments
            if token_type in Comment:
                continue

            # We have not detected a SELECT statement
            if mode == 0:
                if token_type in Keyword and value == 'SELECT':
                    mode = 1

            # We have detected a SELECT statement
            elif mode == 1:
                if value == 'FROM':
                    # Flush the last pending column before stopping.
                    if oldValue:
                        yield Name, oldValue

                    mode = 3 # Columns have been checked

                elif value == 'AS':
                    # The alias (next Name token) replaces whatever
                    # expression text was accumulated for this column.
                    oldValue = ""
                    mode = 2

                elif (token_type == Punctuation
                        and value == ',' and not parenthesis):
                    # Top-level comma: the current column is complete.
                    if oldValue:
                        yield Name, oldValue
                    oldValue = ""

                elif token_type not in Whitespace:
                    # Track nesting so commas inside parentheses do not
                    # split the column expression.
                    if value == '(':
                        parenthesis += 1
                    elif value == ')':
                        parenthesis -= 1

                    oldValue += value

            # We are processing an AS keyword
            elif mode == 2:
                # Keyword is also accepted here because of a bug in
                # SQLParse (some alias names are tokenized as Keyword).
                if token_type == Name or token_type == Keyword:
                    yield Name, value
                    mode = 1
+
+
# ---------------------------
# postprocess
@@ -422,3 +556,24 @@ class OutputPHPFilter(Filter):
varname = self.varname
stmt.tokens = tuple(self._process(stmt.tokens, varname))
return stmt
+
+
class Limit(Filter):
    """Get the LIMIT of a query.

    Returns the value following a trailing LIMIT keyword (as its raw
    token string).  If not defined, return -1 (SQL specification for a
    no-LIMIT query).

    Note: unlike the streaming filters, process() returns a value
    instead of yielding tokens.
    """
    def process(self, stack, stream):
        tokens = list(stream)
        tokens.reverse()

        # A LIMIT clause sits at the tail of a statement, so only the
        # last few tokens need inspecting.  In the reversed list the
        # keyword must be at position >= 2 to leave room for the
        # whitespace and number tokens that follow it in source order;
        # the upper bound of 6 matches the original window of 7 tokens.
        # (The previous implementation's `if index` guard was truthy for
        # negative counters, so a LIMIT beyond the window indexed an
        # unrelated token; positions 0-1 wrapped around via negative
        # indexing.  Both cases are excluded here.)
        for pos, (token_type, value) in enumerate(tokens[:6]):
            if pos >= 2 and token_type in Keyword and value == 'LIMIT':
                # "LIMIT <ws> <number>": in the reversed list the number
                # sits two positions before the keyword.
                return tokens[pos - 2][1]

        return -1