Statistics
| Branch: | Tag: | Revision:

root / lib / qlang.py @ 7578ab0a

History | View | Annotate | Download (6.3 kB)

1 a123dc19 Michael Hanselmann
#
2 a123dc19 Michael Hanselmann
#
3 a123dc19 Michael Hanselmann
4 341ff8e9 Michael Hanselmann
# Copyright (C) 2010, 2011 Google Inc.
5 a123dc19 Michael Hanselmann
#
6 a123dc19 Michael Hanselmann
# This program is free software; you can redistribute it and/or modify
7 a123dc19 Michael Hanselmann
# it under the terms of the GNU General Public License as published by
8 a123dc19 Michael Hanselmann
# the Free Software Foundation; either version 2 of the License, or
9 a123dc19 Michael Hanselmann
# (at your option) any later version.
10 a123dc19 Michael Hanselmann
#
11 a123dc19 Michael Hanselmann
# This program is distributed in the hope that it will be useful, but
12 a123dc19 Michael Hanselmann
# WITHOUT ANY WARRANTY; without even the implied warranty of
13 a123dc19 Michael Hanselmann
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14 a123dc19 Michael Hanselmann
# General Public License for more details.
15 a123dc19 Michael Hanselmann
#
16 a123dc19 Michael Hanselmann
# You should have received a copy of the GNU General Public License
17 a123dc19 Michael Hanselmann
# along with this program; if not, write to the Free Software
18 a123dc19 Michael Hanselmann
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
19 a123dc19 Michael Hanselmann
# 02110-1301, USA.
20 a123dc19 Michael Hanselmann
21 a123dc19 Michael Hanselmann
22 341ff8e9 Michael Hanselmann
"""Module for a simple query language
23 341ff8e9 Michael Hanselmann

24 341ff8e9 Michael Hanselmann
A query filter is always a list. The first item in the list is the operator
25 341ff8e9 Michael Hanselmann
(e.g. C{[OP_AND, ...]}), while the other items depend on the operator. For
26 341ff8e9 Michael Hanselmann
logic operators (e.g. L{OP_AND}, L{OP_OR}), they are subfilters whose results
27 341ff8e9 Michael Hanselmann
are combined. Unary operators take exactly one other item (e.g. a subfilter for
28 341ff8e9 Michael Hanselmann
L{OP_NOT} and a field name for L{OP_TRUE}). Binary operators take exactly two
29 341ff8e9 Michael Hanselmann
operands, usually a field name and a value to compare against. Filters are
30 341ff8e9 Michael Hanselmann
converted to callable functions by L{query._CompileFilter}.
31 341ff8e9 Michael Hanselmann

32 341ff8e9 Michael Hanselmann
"""
33 a123dc19 Michael Hanselmann
34 7578ab0a Michael Hanselmann
import re
35 7578ab0a Michael Hanselmann
36 7578ab0a Michael Hanselmann
import pyparsing as pyp
37 7578ab0a Michael Hanselmann
38 7578ab0a Michael Hanselmann
from ganeti import errors
39 7578ab0a Michael Hanselmann
40 7578ab0a Michael Hanselmann
41 341ff8e9 Michael Hanselmann
# Logic operators with one or more operands, each of which is a filter on its
42 341ff8e9 Michael Hanselmann
# own
43 a123dc19 Michael Hanselmann
OP_OR = "|"  # produced for the "or" keyword of filter strings
44 88076fd1 Michael Hanselmann
OP_AND = "&"  # produced for the "and" keyword of filter strings
45 88076fd1 Michael Hanselmann
46 88076fd1 Michael Hanselmann
47 341ff8e9 Michael Hanselmann
# Unary operators with exactly one operand
48 88076fd1 Michael Hanselmann
OP_NOT = "!"  # negates a subfilter; produced for "not", "not in" and "!~"
49 3b877f08 Michael Hanselmann
OP_TRUE = "?"  # produced for a bare field name used as boolean condition
50 88076fd1 Michael Hanselmann
51 88076fd1 Michael Hanselmann
52 341ff8e9 Michael Hanselmann
# Binary operators with exactly two operands, the field name and an
53 341ff8e9 Michael Hanselmann
# operator-specific value
54 a123dc19 Michael Hanselmann
OP_EQUAL = "="  # written as "==" in filter strings
55 88076fd1 Michael Hanselmann
OP_NOT_EQUAL = "!="  # written as "!=" in filter strings
56 88076fd1 Michael Hanselmann
OP_REGEXP = "=~"  # written as "=~" in filter strings; value is a regexp
57 88076fd1 Michael Hanselmann
OP_CONTAINS = "=[]"  # written as "<value> in <field>" in filter strings
58 a123dc19 Michael Hanselmann
59 a123dc19 Michael Hanselmann
60 60cba7f8 Michael Hanselmann
def MakeSimpleFilter(namefield, values):
  """Builds a simple filter matching any of the given names.

  @param namefield: Name of field containing item name
  @param values: List of names
  @return: C{[OP_OR, [OP_EQUAL, namefield, name], ...]} with one equality
    condition per entry of C{values}; C{None} if C{values} is false (e.g.
    an empty list or C{None})

  """
  if not values:
    # Nothing to match against, hence no filter at all
    return None

  name_conditions = [[OP_EQUAL, namefield, name] for name in values]

  return [OP_OR] + name_conditions
71 7578ab0a Michael Hanselmann
72 7578ab0a Michael Hanselmann
73 7578ab0a Michael Hanselmann
def _ConvertLogicOp(op):
74 7578ab0a Michael Hanselmann
  """Creates parsing action function for logic operator.
75 7578ab0a Michael Hanselmann

76 7578ab0a Michael Hanselmann
  @type op: string
77 7578ab0a Michael Hanselmann
  @param op: Operator for data structure, e.g. L{OP_AND}
78 7578ab0a Michael Hanselmann

79 7578ab0a Michael Hanselmann
  """
80 7578ab0a Michael Hanselmann
  def fn(toks):
81 7578ab0a Michael Hanselmann
    """Converts parser tokens to query operator structure.
82 7578ab0a Michael Hanselmann

83 7578ab0a Michael Hanselmann
    @rtype: list
84 7578ab0a Michael Hanselmann
    @return: Query operator structure, e.g. C{[OP_AND, ["=", "foo", "bar"]]}
85 7578ab0a Michael Hanselmann

86 7578ab0a Michael Hanselmann
    """
87 7578ab0a Michael Hanselmann
    operands = toks[0]
88 7578ab0a Michael Hanselmann
89 7578ab0a Michael Hanselmann
    if len(operands) == 1:
90 7578ab0a Michael Hanselmann
      return operands[0]
91 7578ab0a Michael Hanselmann
92 7578ab0a Michael Hanselmann
    # Build query operator structure
93 7578ab0a Michael Hanselmann
    return [[op] + operands.asList()]
94 7578ab0a Michael Hanselmann
95 7578ab0a Michael Hanselmann
  return fn
96 7578ab0a Michael Hanselmann
97 7578ab0a Michael Hanselmann
98 7578ab0a Michael Hanselmann
_KNOWN_REGEXP_DELIM = "/#^|"
99 7578ab0a Michael Hanselmann
_KNOWN_REGEXP_FLAGS = frozenset("si")
100 7578ab0a Michael Hanselmann
101 7578ab0a Michael Hanselmann
102 7578ab0a Michael Hanselmann
def _ConvertRegexpValue(_, loc, toks):
103 7578ab0a Michael Hanselmann
  """Regular expression value for condition.
104 7578ab0a Michael Hanselmann

105 7578ab0a Michael Hanselmann
  """
106 7578ab0a Michael Hanselmann
  (regexp, flags) = toks[0]
107 7578ab0a Michael Hanselmann
108 7578ab0a Michael Hanselmann
  # Ensure only whitelisted flags are used
109 7578ab0a Michael Hanselmann
  unknown_flags = (frozenset(flags) - _KNOWN_REGEXP_FLAGS)
110 7578ab0a Michael Hanselmann
  if unknown_flags:
111 7578ab0a Michael Hanselmann
    raise pyp.ParseFatalException("Unknown regular expression flags: '%s'" %
112 7578ab0a Michael Hanselmann
                                  "".join(unknown_flags), loc)
113 7578ab0a Michael Hanselmann
114 7578ab0a Michael Hanselmann
  if flags:
115 7578ab0a Michael Hanselmann
    re_flags = "(?%s)" % "".join(sorted(flags))
116 7578ab0a Michael Hanselmann
  else:
117 7578ab0a Michael Hanselmann
    re_flags = ""
118 7578ab0a Michael Hanselmann
119 7578ab0a Michael Hanselmann
  re_cond = re_flags + regexp
120 7578ab0a Michael Hanselmann
121 7578ab0a Michael Hanselmann
  # Test if valid
122 7578ab0a Michael Hanselmann
  try:
123 7578ab0a Michael Hanselmann
    re.compile(re_cond)
124 7578ab0a Michael Hanselmann
  except re.error, err:
125 7578ab0a Michael Hanselmann
    raise pyp.ParseFatalException("Invalid regular expression (%s)" % err, loc)
126 7578ab0a Michael Hanselmann
127 7578ab0a Michael Hanselmann
  return [re_cond]
128 7578ab0a Michael Hanselmann
129 7578ab0a Michael Hanselmann
130 7578ab0a Michael Hanselmann
def BuildFilterParser():
  """Builds a parser for query filter strings.

  Conditions understood by the returned parser (C{field} is a field name,
  C{value} an integer or a quoted string):

    - C{field}: L{OP_TRUE}
    - C{field == value}, C{field != value}: L{OP_EQUAL}, L{OP_NOT_EQUAL}
    - C{value in field}, C{value not in field}: L{OP_CONTAINS}, the latter
      wrapped in L{OP_NOT}
    - C{field =~ m/regexp/flags}, C{field !~ m/regexp/flags}: L{OP_REGEXP},
      the latter wrapped in L{OP_NOT}

  Conditions can be combined using the keywords C{not}, C{and} and C{or}.

  @rtype: pyparsing.ParserElement

  """
  field_name = pyp.Word(pyp.alphas, pyp.alphanums + "_/.")

  # Integer
  num_sign = pyp.Word("-+", exact=1)
  number = pyp.Combine(pyp.Optional(num_sign) + pyp.Word(pyp.nums))
  number.setParseAction(lambda toks: int(toks[0]))

  # Quoted string; "setParseAction" modifies the element it is called on and
  # "pyp.quotedString" is a module-level object shared with all other users
  # of pyparsing, hence a copy must be used
  quoted_string = pyp.quotedString.copy().setParseAction(pyp.removeQuotes)

  # Right-hand-side value
  rval = (number | quoted_string)

  # Parse actions below are regular functions unpacking their tokens, as
  # tuple parameters ("lambda (a, b): ...") don't exist in Python 3

  # Boolean condition
  def _BoolAction(toks):
    """Converts a lone field name to an L{OP_TRUE} filter."""
    (fname, ) = toks
    return [[OP_TRUE, fname]]

  bool_cond = field_name.copy()
  bool_cond.setParseAction(_BoolAction)

  # Simple binary conditions
  binopstbl = {
    "==": OP_EQUAL,
    "!=": OP_NOT_EQUAL,
    }

  def _BinaryAction(toks):
    """Converts "field op value" to the filter for the operator."""
    (lhs, op, rhs) = toks
    return [[binopstbl[op], lhs, rhs]]

  # Pass a real list, "keys" doesn't return one on all Python versions
  binary_cond = (field_name + pyp.oneOf(list(binopstbl)) + rval)
  binary_cond.setParseAction(_BinaryAction)

  # "in" condition
  def _InAction(toks):
    """Converts "value in field" to an L{OP_CONTAINS} filter."""
    (value, field) = toks
    return [[OP_CONTAINS, field, value]]

  in_cond = (rval + pyp.Suppress("in") + field_name)
  in_cond.setParseAction(_InAction)

  # "not in" condition
  def _NotInAction(toks):
    """Converts "value not in field" to a negated L{OP_CONTAINS} filter."""
    (value, field) = toks
    return [[OP_NOT, [OP_CONTAINS, field, value]]]

  not_in_cond = (rval + pyp.Suppress("not") + pyp.Suppress("in") + field_name)
  not_in_cond.setParseAction(_NotInAction)

  # Regular expression, e.g. m/foobar/i
  regexp_val = pyp.Group(pyp.Optional("m").suppress() +
                         pyp.MatchFirst([pyp.QuotedString(i, escChar="\\")
                                         for i in _KNOWN_REGEXP_DELIM]) +
                         pyp.Optional(pyp.Word(pyp.alphas), default=""))
  regexp_val.setParseAction(_ConvertRegexpValue)

  def _RegexpAction(toks):
    """Converts "field =~ regexp" to an L{OP_REGEXP} filter."""
    (field, value) = toks
    return [[OP_REGEXP, field, value]]

  regexp_cond = (field_name + pyp.Suppress("=~") + regexp_val)
  regexp_cond.setParseAction(_RegexpAction)

  def _NotRegexpAction(toks):
    """Converts "field !~ regexp" to a negated L{OP_REGEXP} filter."""
    (field, value) = toks
    return [[OP_NOT, [OP_REGEXP, field, value]]]

  not_regexp_cond = (field_name + pyp.Suppress("!~") + regexp_val)
  not_regexp_cond.setParseAction(_NotRegexpAction)

  # All possible conditions
  condition = (binary_cond ^ bool_cond ^
               in_cond ^ not_in_cond ^
               regexp_cond ^ not_regexp_cond)

  # Associativity operators
  filter_expr = pyp.operatorPrecedence(condition, [
    (pyp.Keyword("not").suppress(), 1, pyp.opAssoc.RIGHT,
     lambda toks: [[OP_NOT, toks[0][0]]]),
    (pyp.Keyword("and").suppress(), 2, pyp.opAssoc.LEFT,
     _ConvertLogicOp(OP_AND)),
    (pyp.Keyword("or").suppress(), 2, pyp.opAssoc.LEFT,
     _ConvertLogicOp(OP_OR)),
    ])

  # The whole text must be a filter expression
  parser = pyp.StringStart() + filter_expr + pyp.StringEnd()
  parser.parseWithTabs()

  # Originally C{parser.validate} was called here, but there seems to be some
  # issue causing it to fail whenever the "not" operator is included above.

  return parser
203 7578ab0a Michael Hanselmann
204 7578ab0a Michael Hanselmann
205 7578ab0a Michael Hanselmann
def ParseFilter(text, parser=None):
  """Parses a query filter.

  @type text: string
  @param text: Query filter
  @type parser: pyparsing.ParserElement
  @param parser: Pyparsing object; if C{None}, a new parser is built using
    L{BuildFilterParser}
  @rtype: list
  @return: First item of the parser's result for C{text}
  @raise errors.QueryFilterParseError: If the parser raises a
    C{pyparsing.ParseBaseException}; the original exception is passed as
    second argument

  """
  import sys

  if parser is None:
    parser = BuildFilterParser()

  try:
    return parser.parseString(text)[0]
  except pyp.ParseBaseException:
    # "except ..., err" is a syntax error on Python 3, "except ... as err" on
    # Python < 2.6; sys.exc_info works with all versions
    err = sys.exc_info()[1]
    raise errors.QueryFilterParseError("Failed to parse query filter"
                                       " '%s': %s" % (text, err), err)