1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
|
# simpleSQL.py
#
# simple demo of using the parsing library to do simple-minded SQL parsing
# could be extended to include where clauses etc.
#
# Copyright (c) 2003,2016, Paul McGuire
#
from pyparsing import (
Word,
delimitedList,
Optional,
Group,
alphas,
alphanums,
Forward,
oneOf,
quotedString,
infixNotation,
opAssoc,
restOfLine,
CaselessKeyword,
ParserElement,
pyparsing_common as ppc,
)
ParserElement.enablePackrat()
# define SQL tokens
selectStmt = Forward()
SELECT, FROM, WHERE, AND, OR, IN, IS, NOT, NULL = map(
CaselessKeyword, "select from where and or in is not null".split()
)
NOT_NULL = NOT + NULL
ident = Word(alphas, alphanums + "_$").setName("identifier")
columnName = delimitedList(ident, ".", combine=True).setName("column name")
columnName.addParseAction(ppc.upcaseTokens)
columnNameList = Group(delimitedList(columnName).setName("column_list"))
tableName = delimitedList(ident, ".", combine=True).setName("table name")
tableName.addParseAction(ppc.upcaseTokens)
tableNameList = Group(delimitedList(tableName).setName("table_list"))
binop = oneOf("= != < > >= <= eq ne lt le gt ge", caseless=True).setName("binop")
realNum = ppc.real().setName("real number")
intNum = ppc.signed_integer()
columnRval = (
realNum | intNum | quotedString | columnName
).setName("column_rvalue") # need to add support for alg expressions
whereCondition = Group(
(columnName + binop + columnRval)
| (columnName + IN + Group("(" + delimitedList(columnRval).setName("in_values_list") + ")"))
| (columnName + IN + Group("(" + selectStmt + ")"))
| (columnName + IS + (NULL | NOT_NULL))
).setName("where_condition")
whereExpression = infixNotation(
whereCondition,
[
(NOT, 1, opAssoc.RIGHT),
(AND, 2, opAssoc.LEFT),
(OR, 2, opAssoc.LEFT),
],
).setName("where_expression")
# define the grammar
selectStmt <<= (
SELECT
+ ("*" | columnNameList)("columns")
+ FROM
+ tableNameList("tables")
+ Optional(Group(WHERE + whereExpression), "")("where")
).setName("select_statement")
simpleSQL = selectStmt
# define Oracle comment format, and ignore them
oracleSqlComment = "--" + restOfLine
simpleSQL.ignore(oracleSqlComment)
if __name__ == "__main__":
simpleSQL.runTests(
"""\
# multiple tables
SELECT * from XYZZY, ABC
# dotted table name
select * from SYS.XYZZY
Select A from Sys.dual
Select A,B,C from Sys.dual
Select A, B, C from Sys.dual, Table2
# FAIL - invalid SELECT keyword
Xelect A, B, C from Sys.dual
# FAIL - invalid FROM keyword
Select A, B, C frox Sys.dual
# FAIL - incomplete statement
Select
# FAIL - incomplete statement
Select * from
# FAIL - invalid column
Select &&& frox Sys.dual
# where clause
Select A from Sys.dual where a in ('RED','GREEN','BLUE')
# compound where clause
Select A from Sys.dual where a in ('RED','GREEN','BLUE') and b in (10,20,30)
# where clause with comparison operator
Select A,b from table1,table2 where table1.id eq table2.id
"""
)
|